BBuf
diff --git a/‎License Plate Recognition System/LP.cpp
Lines changed: 800 additions & 0 deletions b/‎License Plate Recognition System/LP.cpp
Lines changed: 800 additions & 0 deletions
diff --git a/‎License Plate Recognition System/README.md
Lines changed: 7 additions & 0 deletions b/‎License Plate Recognition System/README.md
Lines changed: 7 additions & 0 deletions
diff --git a/‎License Plate Recognition System/estimate_character.py
Lines changed: 103 additions & 0 deletions b/‎License Plate Recognition System/estimate_character.py
Lines changed: 103 additions & 0 deletions
diff --git a/‎License Plate Recognition System/estimate_chinese.py
Lines changed: 106 additions & 0 deletions b/‎License Plate Recognition System/estimate_chinese.py
Lines changed: 106 additions & 0 deletions
diff --git a/‎License Plate Recognition System/train-license-digits.py
Lines changed: 177 additions & 0 deletions b/‎License Plate Recognition System/train-license-digits.py
Lines changed: 177 additions & 0 deletions
@@ -0,0 +1,7 @@
+# 车牌号码识别算法
+
+- LP.cpp 利用OpenCV实现了对车牌区域的检测，判断，切割，以及调用Python脚本进行预测字符
+- train-license-digits.py 实现对英文和字数字字符识别模型进行训练
+- train-license-province.py 实现对汉字字符识别模型进行训练
+- estimate_chinese.py 利用汉字字符识别模型对省份字符进行预测
+- estimate_character.py 利用英文和数字字符识别模型对英文和数字进行预测
@@ -0,0 +1,103 @@
+import sys
+import os
+import time
+import random
+import numpy as np
+import tensorflow as tf
+import cv2
+from PIL import Image
+import io
+import Image, ImageFont, ImageDraw
+import pygame
+INPUT_SIZE = 784
+WIDTH = 28
+HEIGHT = 28
+NUM_CLASSES = 34
+
+SAVER_DIR = "python/train-saver/digits/"
+
+LETTERS_DIGITS = ("0","1","2","3","4","5","6","7","8","9","A","B","C","D","E","F","G","H","J","K","L","M","N","P","Q","R","S","T","U","V","W","X","Y","Z")
+license_num = ""
+time_begin = time.time()
+# 定义输入节点，对应于图片像素值矩阵集合和图片标签(即所代表的数字)
+x = tf.placeholder(tf.float32, shape=[None, INPUT_SIZE])
+y_ = tf.placeholder(tf.float32, shape=[None, NUM_CLASSES])
+x_image = tf.reshape(x, [-1, WIDTH, HEIGHT, 1])
+def conv_layer(inputs, W, b, conv_strides, kernel_size, pool_strides, padding):
+    L1_conv = tf.nn.conv2d(inputs, W, strides=conv_strides, padding=padding)
+    L1_relu = tf.nn.relu(L1_conv + b)
+    return tf.nn.max_pool(L1_relu, ksize=kernel_size, strides=pool_strides, padding='SAME')
+    # 定义全连接层函数
+def full_connect(inputs, W, b):
+    return tf.nn.relu(tf.matmul(inputs, W) + b)
+
+pygame.init()
+
+if __name__ =='__main__':
+    start = time.time()
+    saver = tf.train.import_meta_graph("%smodel.ckpt.meta"%(SAVER_DIR))
+    with tf.Session() as sess:
+        model_file=tf.train.latest_checkpoint(SAVER_DIR)
+        saver.restore(sess, model_file)
+
+        # 第一个卷积层
+        W_conv1 = sess.graph.get_tensor_by_name("W_conv1:0")
+        b_conv1 = sess.graph.get_tensor_by_name("b_conv1:0")
+        conv_strides = [1, 1, 1, 1]
+        kernel_size = [1, 2, 2, 1]
+        pool_strides = [1, 2, 2, 1]
+        L1_pool = conv_layer(x_image, W_conv1, b_conv1, conv_strides, kernel_size, pool_strides, padding='SAME')
+        # 第二个卷积层
+        W_conv2 = sess.graph.get_tensor_by_name("W_conv2:0")
+        b_conv2 = sess.graph.get_tensor_by_name("b_conv2:0")
+        conv_strides = [1, 1, 1, 1]
+        kernel_size = [1, 2, 2, 1]
+        pool_strides = [1, 2, 2, 1]
+        L2_pool = conv_layer(L1_pool, W_conv2, b_conv2, conv_strides, kernel_size, pool_strides, padding='SAME')
+        # 全连接层
+        W_fc1 = sess.graph.get_tensor_by_name("W_fc1:0")
+        b_fc1 = sess.graph.get_tensor_by_name("b_fc1:0")
+        h_pool2_flat = tf.reshape(L2_pool, [-1, 7 * 7 * 64])
+        h_fc1 = full_connect(h_pool2_flat, W_fc1, b_fc1)
+        # dropout
+        keep_prob = tf.placeholder(tf.float32)
+        h_fc1_drop = tf.nn.dropout(h_fc1, keep_prob)
+        # readout层
+        W_fc2 = sess.graph.get_tensor_by_name("W_fc2:0")
+        b_fc2 = sess.graph.get_tensor_by_name("b_fc2:0")
+        # 定义优化器和训练op
+        conv_result = tf.nn.softmax(tf.matmul(h_fc1_drop, W_fc2) + b_fc2)
+        for n in range(2,8):
+            path = "python/zxytest_images/%s.jpg" % (n)
+            nowimage = Image.open(path)
+            nowimage = nowimage.convert('1')
+            width = nowimage.size[0]
+            height = nowimage.size[1]
+            img_input = [[0]*INPUT_SIZE for i in range(1)]
+            for h in range(0, height):
+                for w in range(0, width):
+                    if nowimage.getpixel((w, h)) < 190:
+                        img_input[0][w+h*width] = 1
+                    else:
+                        img_input[0][w+h*width] = 0
+            result = sess.run(conv_result, feed_dict = {x: np.array(img_input), keep_prob: 1.0})
+            maxx1 = 0
+            maxx1_index = 0
+            for i in range(NUM_CLASSES):
+                if result[0][i] > maxx1:
+                    maxx1 = result[0][i]
+                    maxx1_index = i
+            license_num = license_num + LETTERS_DIGITS[maxx1_index]
+    y = license_num
+    text = "其它字符识别结果为:%s"%y
+    im = Image.new("RGB", (300, 300), (255, 255, 255))
+    font = pygame.font.Font(os.path.join("python/fonts/", "msyh.ttc"), 34)
+    rtext = font.render(text, True, (0, 0, 0), (255, 255, 255))
+    pygame.image.save(rtext, "python/result/3.jpg")
+    mat = cv2.imread("python/result/3.jpg")
+    cv2.namedWindow("now")
+    cv2.moveWindow("now", 430, 400)
+    cv2.imshow("now", mat)
+    cv2.waitKey(0)
+    cv2.destroyAllWindows()
+    writer=tf.summary.FileWriter("logs/",sess.graph)
@@ -0,0 +1,106 @@
+#!/usr/bin/python3.5
+# -*- coding: utf-8 -*-
+
+import sys
+import os
+import time
+import random
+import cv2
+import numpy as np
+import tensorflow as tf
+from PIL import Image
+import io
+import Image, ImageFont, ImageDraw
+import pygame
+
+SIZE = 1280
+WIDTH = 32
+HEIGHT = 40
+NUM_CLASSES = 31
+iterations = 300
+pygame.init()
+SAVER_DIR = "python/train-saver/province/"
+
+PROVINCES = ("川","鄂","赣","甘","贵","桂","黑","沪","冀","津","京","吉","辽","鲁","蒙","闽","宁","青","琼","陕","苏","晋","皖","湘","新","豫","渝","粤","云","藏","浙")
+# 定义输入节点，对应于图片像素值矩阵集合和图片标签(即所代表的数字)
+x = tf.placeholder(tf.float32, shape=[None, SIZE])
+y_ = tf.placeholder(tf.float32, shape=[None, NUM_CLASSES])
+
+x_image = tf.reshape(x, [-1, WIDTH, HEIGHT, 1])
+# 定义卷积函数
+def conv_layer(inputs, W, b, conv_strides, kernel_size, pool_strides, padding):
+    L1_conv = tf.nn.conv2d(inputs, W, strides=conv_strides, padding=padding)
+    L1_relu = tf.nn.relu(L1_conv + b)
+    return tf.nn.max_pool(L1_relu, ksize=kernel_size, strides=pool_strides, padding='SAME')
+
+    # 定义全连接层函数
+def full_connect(inputs, W, b):
+    return tf.nn.relu(tf.matmul(inputs, W) + b)
+
+if __name__ =='__main__':
+    start = time.time()
+    saver = tf.train.import_meta_graph("%smodel.ckpt.meta"%(SAVER_DIR))
+    with tf.Session() as sess:
+        model_file=tf.train.latest_checkpoint(SAVER_DIR)
+        saver.restore(sess, model_file)
+        # 第一个卷积层
+        W_conv1 = sess.graph.get_tensor_by_name("W_conv1:0")
+        b_conv1 = sess.graph.get_tensor_by_name("b_conv1:0")
+        conv_strides = [1, 1, 1, 1]
+        kernel_size = [1, 2, 2, 1]
+        pool_strides = [1, 2, 2, 1]
+        L1_pool = conv_layer(x_image, W_conv1, b_conv1, conv_strides, kernel_size, pool_strides, padding='SAME')
+        # 第二个卷积层
+        W_conv2 = sess.graph.get_tensor_by_name("W_conv2:0")
+        b_conv2 = sess.graph.get_tensor_by_name("b_conv2:0")
+        conv_strides = [1, 1, 1, 1]
+        kernel_size = [1, 1, 1, 1]
+        pool_strides = [1, 1, 1, 1]
+        L2_pool = conv_layer(L1_pool, W_conv2, b_conv2, conv_strides, kernel_size, pool_strides, padding='SAME')
+        # 全连接层
+        W_fc1 = sess.graph.get_tensor_by_name("W_fc1:0")
+        b_fc1 = sess.graph.get_tensor_by_name("b_fc1:0")
+        h_pool2_flat = tf.reshape(L2_pool, [-1, 16 * 20*32])
+        h_fc1 = full_connect(h_pool2_flat, W_fc1, b_fc1)
+        # dropout
+        keep_prob = tf.placeholder(tf.float32)
+        h_fc1_drop = tf.nn.dropout(h_fc1, keep_prob)
+        # readout层
+        W_fc2 = sess.graph.get_tensor_by_name("W_fc2:0")
+        b_fc2 = sess.graph.get_tensor_by_name("b_fc2:0")
+        # 定义优化器和训练op
+        conv = tf.nn.softmax(tf.matmul(h_fc1_drop, W_fc2) + b_fc2)
+        for n in range(1,2):
+            path = "python/zxytest_images/%s.jpg" % (n)
+            img = Image.open(path)
+            width = img.size[0]
+            height = img.size[1]
+            print(width)
+            print(height)
+            img_data = [[0]*SIZE for i in range(1)]
+            for h in range(0, height):
+                for w in range(0, width):
+                    if img.getpixel((w, h)) < 190:
+                        img_data[0][w+h*width] = 1
+                    else:
+                        img_data[0][w+h*width] = 0
+            result = sess.run(conv, feed_dict = {x: np.array(img_data), keep_prob: 1.0})
+            max1 = 0
+            max1_index = 0
+            for j in range(NUM_CLASSES):
+                if result[0][j] > max1:
+                    max1 = result[0][j]
+                    max1_index = j
+                    continue
+            nProvinceIndex = max1_index
+        text = "中文字符为:%s"%PROVINCES[nProvinceIndex]
+        im = Image.new("RGB", (300, 50), (255, 255, 255))
+        font = pygame.font.Font(os.path.join("python/fonts/", "msyh.ttc"), 34)
+        rtext = font.render(text, True, (0, 0, 0), (255, 255, 255))
+        pygame.image.save(rtext, "python/result/2.jpg")
+        mat = cv2.imread("python/result/2.jpg")
+        cv2.namedWindow("now")
+        cv2.moveWindow("now", 200, 400)
+        cv2.imshow("now", mat);
+        cv2.waitKey(0)
+        end = time.time()
@@ -0,0 +1,177 @@
+#!/usr/bin/python3.5
+# -*- coding: utf-8 -*-
+
+import sys
+import os
+import time
+import random
+
+import numpy as np
+import tensorflow as tf
+import cv2
+from PIL import Image
+
+
+SIZE = 784
+WIDTH = 28
+HEIGHT = 28
+NUM_CLASSES = 34
+iterations = 100
+
+SAVER_DIR = "python/train-saver/digits/"
+
+LETTERS_DIGITS = ("0","1","2","3","4","5","6","7","8","9","A","B","C","D","E","F","G","H","J","K","L","M","N","P","Q","R","S","T","U","V","W","X","Y","Z")
+license_num = ""
+time_begin = time.time()
+# 定义输入节点，对应于图片像素值矩阵集合和图片标签(即所代表的数字)
+x = tf.placeholder(tf.float32, shape=[None, SIZE])
+y_ = tf.placeholder(tf.float32, shape=[None, NUM_CLASSES])
+x_image = tf.reshape(x, [-1, WIDTH, HEIGHT, 1])
+# 定义卷积函数
+def conv_layer(inputs, W, b, conv_strides, kernel_size, pool_strides, padding):
+    L1_conv = tf.nn.conv2d(inputs, W, strides=conv_strides, padding=padding)
+    L1_relu = tf.nn.relu(L1_conv + b)
+    return tf.nn.max_pool(L1_relu, ksize=kernel_size, strides=pool_strides, padding='SAME')
+    # 定义全连接层函数
+def full_connect(inputs, W, b):
+    return tf.nn.relu(tf.matmul(inputs, W) + b)
+if __name__ =='__main__':
+    # 第一次遍历图片目录是为了获取图片总数
+    input_count = 0
+    for i in range(0,NUM_CLASSES):
+        dir = 'python/train_images/training-set/%s/' % i
+        for rt, dirs, files in os.walk(dir):
+            for filename in files:
+                input_count += 1
+
+                # 定义对应维数和各维长度的数组
+    input_images = np.array([[0]*SIZE for i in range(input_count)])
+    input_labels = np.array([[0]*NUM_CLASSES for i in range(input_count)])
+
+    # 第二次遍历图片目录是为了生成图片数据和标签
+    index = 0
+    for i in range(0,NUM_CLASSES):
+        dir = 'python/train_images/training-set/%s/' % i
+        for rt, dirs, files in os.walk(dir):
+            for filename in files:
+                filename = dir + filename
+                img = Image.open(filename)
+                img = img.convert('1')
+                width = img.size[0]
+                height = img.size[1]
+                for h in range(0, height):
+                    for w in range(0, width):
+                        # 通过这样的处理，使数字的线条变细，有利于提高识别准确率
+                        if img.getpixel((w, h)) > 230:
+                            input_images[index][w+h*width] = 0
+                        else:
+                            input_images[index][w+h*width] = 1
+                input_labels[index][i] = 1
+                index += 1
+                # 第一次遍历图片目录是为了获取图片总数
+    val_count = 0
+    for i in range(0,NUM_CLASSES):
+        dir = 'python/train_images/validation-set/%s/' % i
+        for rt, dirs, files in os.walk(dir):
+            for filename in files:
+                val_count += 1
+
+                # 定义对应维数和各维长度的数组
+    val_images = np.array([[0]*SIZE for i in range(val_count)])
+    val_labels = np.array([[0]*NUM_CLASSES for i in range(val_count)])
+
+    # 第二次遍历图片目录是为了生成图片数据和标签
+    index = 0
+    for i in range(0,NUM_CLASSES):
+        dir = 'python/train_images/validation-set/%s/' % i
+        for rt, dirs, files in os.walk(dir):
+            for filename in files:
+                filename = dir + filename
+                img = Image.open(filename)
+                img = img.convert('1')
+                width = img.size[0]
+                height = img.size[1]
+                for h in range(0, height):
+                    for w in range(0, width):
+                        # 通过这样的处理，使数字的线条变细，有利于提高识别准确率
+                        if img.getpixel((w, h)) > 230:
+                            val_images[index][w+h*width] = 0
+                        else:
+                            val_images[index][w+h*width] = 1
+                val_labels[index][i] = 1
+                index += 1
+
+    with tf.Session() as sess:
+        # 第一个卷积层
+        W_conv1 = tf.Variable(tf.truncated_normal([5, 5, 1, 32], stddev=0.1), name="W_conv1")
+        b_conv1 = tf.Variable(tf.constant(0.1, shape=[32]), name="b_conv1")
+        conv_strides = [1, 1, 1, 1]
+        kernel_size = [1, 2, 2, 1]
+        pool_strides = [1, 2, 2, 1]
+        L1_pool = conv_layer(x_image, W_conv1, b_conv1, conv_strides, kernel_size, pool_strides, padding='SAME')
+        # 第二个卷积层
+        W_conv2 = tf.Variable(tf.truncated_normal([5, 5, 32, 64], stddev=0.1), name="W_conv2")
+        b_conv2 = tf.Variable(tf.constant(0.1, shape=[64]), name="b_conv2")
+        conv_strides = [1, 1, 1, 1]
+        kernel_size = [1, 2, 2, 1]
+        pool_strides = [1, 2, 2, 1]
+        L2_pool = conv_layer(L1_pool, W_conv2, b_conv2, conv_strides, kernel_size, pool_strides, padding='SAME')
+        # 全连接层
+        W_fc1 = tf.Variable(tf.truncated_normal([7 * 7 * 64, 1024], stddev=0.1), name="W_fc1")
+        b_fc1 = tf.Variable(tf.constant(0.1, shape=[1024]), name="b_fc1")
+        h_pool2_flat = tf.reshape(L2_pool, [-1, 7 * 7 * 64])
+        h_fc1 = full_connect(h_pool2_flat, W_fc1, b_fc1)
+        # dropout
+        keep_prob = tf.placeholder(tf.float32)
+        h_fc1_drop = tf.nn.dropout(h_fc1, keep_prob)
+        # readout层
+        W_fc2 = tf.Variable(tf.truncated_normal([1024, NUM_CLASSES], stddev=0.1), name="W_fc2")
+        b_fc2 = tf.Variable(tf.constant(0.1, shape=[NUM_CLASSES]), name="b_fc2")
+
+        # 定义优化器和训练op
+        y_conv = tf.matmul(h_fc1_drop, W_fc2) + b_fc2
+        cross_entropy = tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(labels=y_, logits=y_conv))
+        train_step = tf.train.AdamOptimizer((1e-4)).minimize(cross_entropy)
+        correct_prediction = tf.equal(tf.argmax(y_conv, 1), tf.argmax(y_, 1))
+        accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))
+        sess.run(tf.global_variables_initializer())
+        time_elapsed = time.time() - time_begin
+        print("读取图片文件耗费时间：%d秒" % time_elapsed)
+        time_begin = time.time()
+        print ("一共读取了 %s 个训练图像， %s 个标签" % (input_count, input_count))
+        # 设置每次训练op的输入个数和迭代次数，这里为了支持任意图片总数，定义了一个余数remainder，譬如，如果每次训练op的输入个数为60，图片总数为150张，则前面两次各输入60张，最后一次输入30张（余数30）
+        batch_size = 60
+        iterations = iterations
+        batches_count = int(input_count / batch_size)
+        remainder = input_count % batch_size
+        print ("训练数据集分成 %s 批, 前面每批 %s 个数据，最后一批 %s 个数据" % (batches_count+1, batch_size, remainder))
+
+        # 执行训练迭代
+        for it in range(iterations):
+            # 这里的关键是要把输入数组转为np.array
+            for n in range(batches_count):
+                train_step.run(feed_dict={x: input_images[n*batch_size:(n+1)*batch_size], y_: input_labels[n*batch_size:(n+1)*batch_size], keep_prob: 0.5})
+            if remainder > 0:
+                start_index = batches_count * batch_size;
+                train_step.run(feed_dict={x: input_images[start_index:input_count-1], y_: input_labels[start_index:input_count-1], keep_prob: 0.5})
+
+                # 每完成五次迭代，判断准确度是否已达到100%，达到则退出迭代循环
+            iterate_accuracy = 0
+            if it%1 == 0:
+                iterate_accuracy = accuracy.eval(feed_dict={x: val_images, y_: val_labels, keep_prob: 1.0})
+                print ('第 %d 次训练迭代: 准确率 %0.5f%%' % (it, iterate_accuracy*100))
+                if iterate_accuracy >= 0.9999 and it >= iterations:
+                    break
+
+        print ('完成训练!')
+        time_elapsed = time.time() - time_begin
+        print ("训练耗费时间：%d秒" % time_elapsed)
+        time_begin = time.time()
+
+        # 保存训练结果
+        if not os.path.exists(SAVER_DIR):
+            print ('不存在训练数据保存目录，现在创建保存目录')
+            os.makedirs(SAVER_DIR)
+            # 初始化saver
+        saver = tf.train.Saver()
+        saver_path = saver.save(sess, "%smodel.ckpt"%(SAVER_DIR))