# ##################################################################################
# # 数据清理
# # 作者: Xinyu Ou (http://ouxinyu.cn)
# # 数据集名称：车牌识别数据集
# # 数据集简介: VehicleLicense车牌识别数据集包含16151张单字符数据，所有的单字符均为严格切割且都转换为黑白二值图像。
# # 本程序功能:
# # 1. 对样本文件进行改名，屏蔽特殊命名符号对训练的影响
# ###################################################################################

# import os
# dataset_root_path = 'D:\\WorkSpace\\ExpDatasets\\VehicleLicense'

# data_path = os.path.join(dataset_root_path, 'Data')
# character_folders = os.listdir(data_path)

# num_image = 0 
# for character_folder in character_folders:
#     character_imgs = os.listdir(os.path.join(data_path, character_folder))
    
#     id = 0
#     for character_img in character_imgs:
#         newname = character_folder + '_' + str(id).rjust(4,'0') + os.path.splitext(character_img)[1]
#         os.rename(os.path.join(data_path, character_folder, character_img), os.path.join(data_path, character_folder, newname))
#         id += 1
#         num_image += 1

#     print('\r 已完成{}副图片的改名'.format(num_image), end='')
        
# print(', 已完成。')


##################################################################################
# 数据集预处理
# 作者: Xinyu Ou (http://ouxinyu.cn)
# 数据集名称：车牌识别数据集
# 数据集简介: VehicleLicense车牌识别数据集包含16151张单字符数据，所有的单字符均为严格切割且都转换为黑白二值图像。
# 本程序功能:
# 1. 将数据集按照7:1:2的比例划分为训练集、验证集、测试集，其中训练验证集为训练集与验证集的并集
# 2. 代码将生成5个文件：训练验证集列表trainval.txt, 训练集列表train.txt, 验证集列表val.txt, 测试集列表test.txt, 数据集信息dataset_info.json
# 3. 代码输出信息：图像列表已生成, 其中训练验证集样本12877，训练集样本11232个, 验证集样本1645个, 测试集样本3274个, 共计16151个。
# 4. 生成数据集标签词典时，需要根据标签-文件夹列表匹配标签列表
###################################################################################

import os
import json
import codecs

# Running sample counters for each split, plus the number of classes labelled so far.
num_trainval = 0
num_train = 0
num_val = 0
num_test = 0
class_dim = 0
# Summary written to dataset_info.json; '' and -1 are placeholders filled in after the split.
dataset_info = {
    'dataset_name': '',
    'num_trainval': -1,
    'num_train': -1,
    'num_val': -1,
    'num_test': -1,
    'class_dim': -1,
    'label_dict': {}
}
# When running locally, adjust the dataset name and absolute path; they must match the folders on disk.
dataset_name = 'VehicleLicense'
dataset_path = 'D:\\Workspace\\ExpDatasets\\'
dataset_root_path = os.path.join(dataset_path, dataset_name)
excluded_folder = ['.DS_Store', '.ipynb_checkpoints']      # entries under Data/ that are not class folders

# Load the mapping from class-folder name to the label text stored in dataset_info['label_dict'].
json_label_match = os.path.join(dataset_root_path, 'label_match.json')
with open(json_label_match, 'r', encoding='utf-8') as f_label_match:
    label_match = json.load(f_label_match)

# Paths of the generated files.
data_path = os.path.join(dataset_root_path, 'Data')
trainval_list = os.path.join(dataset_root_path, 'trainval.txt')
train_list = os.path.join(dataset_root_path, 'train.txt')
val_list = os.path.join(dataset_root_path, 'val.txt')
test_list = os.path.join(dataset_root_path, 'test.txt')
dataset_info_list = os.path.join(dataset_root_path, 'dataset_info.json')

# Split every class folder by position within the folder listing:
#   index % 10 == 0      -> validation (also written to trainval)
#   index % 10 in (1, 2) -> test
#   everything else      -> train (also written to trainval)
# All four list files are opened once in 'w' mode, so stale lists from an earlier
# run are overwritten without having to delete them first.
# NOTE(review): os.listdir() makes no ordering guarantee, so label ids follow
# whatever order the file system returns; dataset_info.json records the mapping used.
class_name_list = os.listdir(data_path)
with codecs.open(trainval_list, 'w', 'utf-8') as f_trainval, \
        codecs.open(train_list, 'w', 'utf-8') as f_train, \
        codecs.open(val_list, 'w', 'utf-8') as f_val, \
        codecs.open(test_list, 'w', 'utf-8') as f_test:
    for class_name in class_name_list:
        if class_name in excluded_folder:
            continue
        # Match the folder name against label_match to obtain the label text for this class id.
        dataset_info['label_dict'][str(class_dim)] = label_match[class_name]
        images = os.listdir(os.path.join(data_path, class_name))
        for count, image in enumerate(images):
            record = "{0}\t{1}\n".format(os.path.join(data_path, class_name, image), class_dim)
            if count % 10 == 0:  # roughly 10% of the samples go to validation
                f_val.write(record)
                f_trainval.write(record)
                num_val += 1
                num_trainval += 1
            elif count % 10 == 1 or count % 10 == 2:  # roughly 20% of the samples go to test
                f_test.write(record)
                num_test += 1
            else:
                f_train.write(record)
                f_trainval.write(record)
                num_train += 1
                num_trainval += 1
        # Advance the class id only for folders that were actually labelled; counting
        # excluded entries would leave gaps in label_dict and overstate class_dim.
        class_dim += 1

# Save the dataset summary to a JSON file for use at training time.
dataset_info['dataset_name'] = dataset_name
dataset_info['num_trainval'] = num_trainval
dataset_info['num_train'] = num_train
dataset_info['num_val'] = num_val
dataset_info['num_test'] = num_test
dataset_info['class_dim'] = class_dim

with codecs.open(dataset_info_list, 'w', encoding='utf-8') as f_dataset_info:
    json.dump(dataset_info, f_dataset_info, ensure_ascii=False, indent=4, separators=(',', ':')) # pretty-print the summary dict

print("图像列表已生成, 其中训练验证集样本{}，训练集样本{}个, 验证集样本{}个, 测试集样本{}个, 共计{}个。".format(num_trainval, num_train, num_val, num_test, num_train+num_val+num_test))

图像列表已生成, 其中训练验证集样本12878，训练集样本11233个, 验证集样本1645个, 测试集样本3274个, 共计16152个。


# 1. 导入依赖库
import os
import cv2
import numpy as np
import codecs
import json
import time                        # 载入time时间库,用于计算训练时间
from random import randint         # 导入随机数生成函数
import paddle as paddle            # 载入PaddlePaddle基本库
import paddle.fluid as fluid       # 载入基于fluid框架的paddle
from paddle.fluid.dygraph import Linear, Conv2D, Pool2D
from PIL import Image              # 载入python的第三方图像处理库
import matplotlib.pyplot as plt    # 载入matplotlib绘图库
from multiprocessing import cpu_count
plt.rcParams['font.family'] = 'sans-serif'  
plt.rcParams['font.sans-serif'] = 'SimHei,Times New Roman'# sans-serif candidates: SimHei first (a Hei typeface, presumably for the Chinese labels), then Times New Roman
np.set_printoptions(precision=5, suppress=True) # numpy print precision, used for console output


# 2. Global parameter configuration
# Choose CPU or GPU: use_cuda = False runs on CPU, use_cuda = True runs on GPU
use_cuda          = True  # True, False; enable the GPU for faster training when the machine has one
PLACE             = fluid.CUDAPlace(0) if use_cuda else fluid.CPUPlace()

project_name      = 'Project06CNN'
architecture      = 'CNN'
dataset_name      = 'VehicleLicense'
result_root_path  = 'D:\\WorkSpace\\ExpResults\\'

model_name = dataset_name + '_' + architecture

# 2.1 Dataset list files and model paths
dataset_path      = 'D:\\WorkSpace\\ExpDatasets\\'
dataset_root_path = os.path.join(dataset_path, dataset_name)

trainval_list = os.path.join(dataset_root_path, 'trainval.txt')
train_list = os.path.join(dataset_root_path, 'train.txt')
val_list = os.path.join(dataset_root_path, 'val.txt')
test_list = os.path.join(dataset_root_path, 'test.txt')

# result_root_path is rebound here from the results base folder to <base>/<project_name>/<model_name>
result_root_path  = os.path.join(result_root_path, project_name, model_name)
final_models_path = os.path.join(result_root_path, 'final_models')
final_figures_path = os.path.join(result_root_path, 'final_figures')

# 2.2 Basic image properties
img_size = 20
img_channel = 1

# 2.3 Training hyper-parameters
total_epoch        = 40       # total number of epochs; consider 50 once the code is debugged
log_interval       = 100
eval_interval      = 1        # run validation every eval_interval epochs during training
learning_rate      = 0.001    # learning rate
momentum           = 0.9      # momentum
# NOTE(review): the list files are written one class after another, so a shuffle buffer
# much smaller than the training set only mixes neighbouring classes - confirm batch balance.
BUF_SIZE           = 512      # size of the shuffle buffer
BATCH_SIZE         = 128      # batch size, shared by the training and the evaluation readers


# 定义数据集映射函数获取数据的图像矩阵和label
def data_mapper(sample):
    """Turn one (image path, label) sample into a network-ready array.

    Args:
        sample: pair of (path of the image file, label).

    Returns:
        Tuple of (float32 array of shape (1, img_channel, img_size, img_size)
        with pixel values divided by 255, label unchanged).
    """
    path, label = sample
    gray = cv2.imread(path, 0)                           # flag 0: load as grayscale
    resized = cv2.resize(gray, (img_size, img_size))     # bring the image to the configured size
    tensor = np.array(resized).reshape(1, img_channel, img_size, img_size).astype('float32')
    return tensor / 255.0, label

# 定义数据集reader，用于从列表文件中批量获取图像
def data_reader(data_list_path):
    """Build a reader that yields mapped samples from a list file.

    Each non-empty line of the list file is expected to be
    ``<image path>\\t<integer label>``.

    Args:
        data_list_path: path of the list file to read.

    Returns:
        The reader created by paddle.reader.xmap_readers, which applies
        data_mapper to every (image path, label) pair using cpu_count()
        worker threads and a buffer of 512 samples.
    """
    def reader():
        # The list files are written as UTF-8, so read them with the same encoding
        # instead of the platform default (which differs on Windows).
        with open(data_list_path, 'r', encoding='utf-8') as f:
            for line in f:
                line = line.rstrip('\r\n')
                if not line:
                    continue  # tolerate blank lines, e.g. a trailing newline at end of file
                # Split on the last tab so a tab inside the path cannot break the unpacking.
                img_path, label = line.rsplit('\t', 1)
                yield img_path, int(label)
    # Map the raw samples through data_mapper in multiple threads.
    return paddle.reader.xmap_readers(data_mapper, reader, cpu_count(), 512)

C:\Users\Administrator\anaconda3\lib\site-packages\ipykernel\ipkernel.py:287: DeprecationWarning: `should_run_async` will not call `transform_cell` automatically in the future. Please pass the result to `transformed_cell` argument and any exception that happen during thetransform in `preprocessing_exc_tuple` in IPython 7.17 and above.
  and should_run_async(code)


# Data providers for training/evaluation: each one shuffles the samples of its list file
# inside a buffer of BUF_SIZE and groups them into batches of BATCH_SIZE (last partial batch kept).
trainval_reader = paddle.batch(paddle.reader.shuffle(reader=data_reader(trainval_list), buf_size=BUF_SIZE), batch_size=BATCH_SIZE, drop_last=False)
train_reader = paddle.batch(paddle.reader.shuffle(reader=data_reader(train_list), buf_size=BUF_SIZE), batch_size=BATCH_SIZE, drop_last=False)
val_reader = paddle.batch(paddle.reader.shuffle(reader=data_reader(val_list), buf_size=BUF_SIZE), batch_size=BATCH_SIZE, drop_last=False)
test_reader = paddle.batch(paddle.reader.shuffle(reader=data_reader(test_list), buf_size=BUF_SIZE), batch_size=BATCH_SIZE, drop_last=False)


# Smoke test: print the shape of the first image in the first training batch
for batch_id, data in enumerate(train_reader()):
    print(data[0][0].shape)
    break

(1, 1, 20, 20)


# 绘制训练batch精度和平均loss
def draw_process(title, loss_label, accuracy_label, iters, losses, accuracies, figure_path=None, figurename=None, isShow=False):
    """Plot a loss curve and an accuracy curve on twin y-axes.

    Args:
        title: figure title.
        loss_label: legend/axis label of the loss curve (left axis, red).
        accuracy_label: legend/axis label of the accuracy curve (right axis, blue).
        iters: x values shared by both curves.
        losses: loss values, one per entry of iters.
        accuracies: accuracy values, one per entry of iters.
        figure_path: directory to save the figure in; created if missing.
            The figure is only saved when both figure_path and figurename are given.
        figurename: file name without extension; '.png' is appended.
        isShow: when True, display the figure with plt.show().
    """
    # 1. First axis: loss
    _, ax1 = plt.subplots()   # plt.subplots(figsize=(14,6))
    ax1.plot(iters, losses, color='red', label=loss_label)
    ax1.set_xlabel('Iters', fontsize=20)
    ax1.set_ylabel(loss_label, fontsize=20)
    # An empty log (e.g. training ended before the first log interval) must not crash
    # the plot; without a positive maximum the axis keeps matplotlib's automatic limits.
    max_loss = max(losses, default=0)
    if max_loss > 0:
        ax1.set_ylim(0, max_loss*1.2)

    # 2. Second axis: accuracy
    ax2 = ax1.twinx()
    ax2.plot(iters, accuracies, color='blue', label=accuracy_label)
    ax2.set_ylabel(accuracy_label, fontsize=20)
    max_acc = max(accuracies, default=0)
    if max_acc > 0:
        ax2.set_ylim(0, max_acc*1.2)

    # 3. Merge the legends of both axes
    plt.title(title, fontsize=24)
    handles1, labels1 = ax1.get_legend_handles_labels()
    handles2, labels2 = ax2.get_legend_handles_labels()
    plt.legend(handles1+handles2, labels1+labels2, loc='best')
    plt.grid()

    # 4. Save the figure; skipped when no target was given, since the None
    #    defaults cannot be joined into a path.
    if figure_path is not None and figurename is not None:
        os.makedirs(figure_path, exist_ok=True)
        plt.savefig(os.path.join(figure_path, figurename + '.png'))

    # 5. Show the figure
    if isShow is True:
        plt.show()
        
### 测试可视化函数 ###################################################
if __name__ == '__main__':
    # Smoke test for draw_process: re-plot the training log saved by a previous run, if any.
    try:
        with open(os.path.join(final_figures_path, 'train.json'), 'r', encoding='utf-8') as f_log:
            train_log = json.load(f_log)
        draw_process('Training', 'loss', 'accuracy', train_log['iters'], train_log['losses'], train_log['accs_top1'], figure_path=final_figures_path, figurename='train', isShow=True)
    # Only a missing/unreadable file, invalid JSON or missing/empty log entries mean
    # "no data"; anything else (including Ctrl-C) should surface.
    except (OSError, ValueError, KeyError):
        print('数据不存在，无法进行绘制')


# 定义多层感知机(CNN)
class CNN(fluid.dygraph.Layer):
    """Small convolutional classifier: conv-pool-conv-pool-conv followed by one linear layer.

    The linear layer expects 32*10*10 input features, which is what the
    convolution stack produces for a 1x20x20 input.
    """
    name_scope = 'CNN'

    def __init__(self, num_classes=65):
        """Create the layers.

        Args:
            num_classes: size of the output layer (number of classes).
        """
        super().__init__()
        self.conv1 = Conv2D(num_channels=1, num_filters=28, filter_size=5, stride=1, act='relu')
        self.pool1 = Pool2D(pool_size=2, pool_stride=1, pool_type='max')
        self.conv2 = Conv2D(num_channels=28, num_filters=32, filter_size=3, stride=1, act='relu')
        self.pool2 = Pool2D(pool_size=2, pool_stride=1, pool_type='max')
        self.conv3 = Conv2D(num_channels=32, num_filters=32, filter_size=3, stride=1, act='relu')
        self.fc1 = Linear(input_dim=32*10*10, output_dim=num_classes)

    def forward(self, input):
        """Run the network and return the un-normalised class scores."""
        features = input
        # Feature extractor: the layers are applied in exactly this order.
        for layer in (self.conv1, self.pool1, self.conv2, self.pool2, self.conv3):
            features = layer(features)
        # Flatten everything except the batch dimension before the linear layer.
        batch_size = features.shape[0]
        flat = fluid.layers.reshape(features, [batch_size, -1])
        return self.fc1(flat)
    
# Best result: epoch=94, 
# test-set accuracy=[0.97664]
if __name__ == '__main__':
    # Instantiate the network and print its layer summary for an input of shape (10, 1, 20, 20).
    model = CNN()
    paddle.summary(model, (10,1,20,20))

---------------------------------------------------------------------------
 Layer (type)       Input Shape          Output Shape         Param #    
===========================================================================
   Conv2D-1      [[10, 1, 20, 20]]     [10, 28, 16, 16]         728      
   Pool2D-1      [[10, 28, 16, 16]]    [10, 28, 15, 15]          0       
   Conv2D-2      [[10, 28, 15, 15]]    [10, 32, 13, 13]        8,096     
   Pool2D-2      [[10, 32, 13, 13]]    [10, 32, 12, 12]          0       
   Conv2D-3      [[10, 32, 12, 12]]    [10, 32, 10, 10]        9,248     
   Linear-1         [[10, 3200]]           [10, 65]           208,065    
===========================================================================
Total params: 226,137
Trainable params: 226,137
Non-trainable params: 0
---------------------------------------------------------------------------
Input size (MB): 0.02
Forward/backward pass size (MB): 2.04
Params size (MB): 0.86
Estimated Total Size (MB): 2.92
---------------------------------------------------------------------------


def test(model, data_reader):
    """Evaluate a model over every batch produced by a reader.

    Args:
        model: network to evaluate; it is switched to evaluation mode.
        data_reader: iterable of batches, each batch being a sequence of
            (image, label) samples.

    Returns:
        Tuple (avg_loss, avg_acc) as Python floats, averaged over samples.
        Both are NaN when the reader yields no samples.
    """
    total_loss = 0.0
    total_acc = 0.0
    total_samples = 0
    model.eval()  # evaluation mode
    for data in data_reader:
        images = np.array([x[0] for x in data], dtype='float32').reshape(-1, img_channel, img_size, img_size)
        labels = np.array([x[1] for x in data], dtype='int64').reshape(-1, 1)

        image = fluid.dygraph.to_variable(images)
        label = fluid.dygraph.to_variable(labels)

        digits = model(image)                     # raw scores
        predict = fluid.layers.softmax(digits)    # normalised probabilities

        loss = fluid.layers.mean(fluid.layers.cross_entropy(predict, label))  # mean loss of this batch
        acc = fluid.layers.accuracy(predict, label)                           # accuracy of this batch

        # Weight each batch by its size: the last batch may be smaller, so a plain
        # mean of per-batch means would over-weight its samples.
        batch_size = labels.shape[0]
        total_loss += loss.numpy().item() * batch_size
        total_acc += acc.numpy().item() * batch_size
        total_samples += batch_size

    if total_samples == 0:
        return float('nan'), float('nan')

    avg_loss = total_loss / total_samples
    avg_acc = total_acc / total_samples

    return avg_loss, avg_acc


def train(model):
    """Train the model with periodic validation, checkpoint the best model and plot the logs.

    Relies on module-level state: the readers train_reader / val_reader, the
    hyper-parameters (total_epoch, log_interval, eval_interval, learning_rate,
    momentum, img_channel, img_size), the output folders final_models_path /
    final_figures_path and the log dicts train_log / val_log, which must exist
    before this function is called.

    Args:
        model: the network to train; it is updated in place.
    """
    # Start training with online validation
    start = time.perf_counter()
    print('启动训练...')    

    optimizer = fluid.optimizer.Momentum(learning_rate=learning_rate, momentum=momentum, parameter_list=model.parameters())# Momentum optimizer configured from the global learning_rate and momentum
#     optimizer = fluid.optimizer.AdamOptimizer(learning_rate=learning_rate, parameter_list=model.parameters())# alternative: Adam
#     optimizer = fluid.optimizer.SGDOptimizer(learning_rate=learning_rate, parameter_list=model.parameters())# alternative: plain SGD

    num_batch = 0          # number of batches processed across all epochs
    best_result = 0        # best validation accuracy seen so far
    best_result_id = 0     # epoch at which best_result was reached
    elapsed = 0            # seconds between start and the most recent log line
    for epoch in range(1, total_epoch+1):

        model.train() # training mode
        for batch_id, data in enumerate(train_reader()):
            num_batch += 1

            # Build the input arrays: images as float32 (N, C, H, W), labels as int64 (N, 1)
            images = np.array([x[0] for x in data], dtype='float32').reshape(-1, img_channel, img_size, img_size)            
            labels = np.array([x[1] for x in data], dtype='int64').reshape(-1,1)

            image = fluid.dygraph.to_variable(images)
            label = fluid.dygraph.to_variable(labels)

            # Output layer: loss + accuracy
            # prediction = softmax(raw model output)
            # loss = cross_entropy(prediction, label)
            # acc = accuracy(prediction, label)
            digits = model(image) # forward pass; raw, un-normalised scores
            predict = fluid.layers.softmax(digits) # normalised probabilities
#             print(digits)
#             print(predict)

            loss = fluid.layers.cross_entropy(predict, label)
            avg_loss = fluid.layers.mean(loss)                  # mean loss of the batch
            acc = fluid.layers.accuracy(predict, label)         # accuracy of the batch

            # Back-propagation and parameter update
            avg_loss.backward()   # compute the gradients
            optimizer.minimize(avg_loss)
            model.clear_gradients() # reset the gradients so the next step starts clean

            # Log the training loss every log_interval batches
            if num_batch % log_interval == 0:
                # elapsed_step is the time since the previous log line (elapsed still holds the old value here)
                elapsed_step = time.perf_counter() - elapsed - start
                elapsed = time.perf_counter() - start
                print("Epoch:{}/{}, batch:{}, train_loss:{}, train_accuracy:{} ({:.2f}s)".format(epoch,total_epoch,num_batch,avg_loss.numpy(),acc.numpy(),elapsed_step))

                # Record the training progress for the loss/accuracy plots
                train_log['iters'].append(num_batch)
                train_log['losses'].append(float(avg_loss))
                train_log['accs_top1'].append(float(acc))

        # Validate every eval_interval epochs and always after the last epoch
        if epoch % eval_interval == 0 or epoch == total_epoch:        
            # Evaluate on the validation set
            val_avg_loss, val_avg_acc = test(model, val_reader())               
            print('[validation] Epoch:{}/{}, test_loss:[{:.5f}], test_accuracy:[{:.5f}]'.format(epoch, total_epoch, val_avg_loss, val_avg_acc))

            # Keep the model with the best validation accuracy as the final model
            if val_avg_acc > best_result:
                best_result = val_avg_acc
                best_result_id = epoch

                # Save the best model so far
                fluid.save_dygraph(model.state_dict(), os.path.join(final_models_path, 'best_model'))
            print('当前性能最好的模型 epoch_{} 的精度: {:.5f}, 已将其赋值为：best_model'.format(best_result_id, best_result))

            # Record the validation results for the loss/accuracy plots
            val_log['iters'].append(epoch)
            val_log['losses'].append(float(val_avg_loss))
            val_log['accs_top1'].append(float(val_avg_acc))


    # Output the training curves.
    # The log dicts are saved as JSON so the plots can also be regenerated later from the files.
    if not os.path.exists(final_figures_path):
        os.makedirs(final_figures_path)

    with codecs.open(os.path.join(final_figures_path, 'train.json'), 'w', encoding='utf-8') as f_train_log:
        json.dump(train_log, f_train_log, ensure_ascii=False, indent=4, separators=(',', ':'))
    with codecs.open(os.path.join(final_figures_path, 'val.json'), 'w', encoding='utf-8') as f_val_log:
        json.dump(val_log, f_val_log, ensure_ascii=False, indent=4, separators=(',', ':'))

    print('训练完成，最终性能accuracy={:.5f}(epoch={}), 总耗时{:.2f}s, 已将其保存为：best_model'.format(best_result, best_result_id, time.perf_counter() - start))
    draw_process("Training Process", 'Train Loss', 'Train Accuracy', train_log['iters'], train_log['losses'], train_log['accs_top1'], figure_path=final_figures_path, figurename='train')
    draw_process("Validation Results", 'Validation Loss', 'Validation Accuracy', val_log['iters'], val_log['losses'], val_log['accs_top1'], figure_path=final_figures_path, figurename='val')


if __name__ == '__main__':
    # Initialise the log dicts that train() appends to and plots from
    train_log = {'iters': [], 'losses': [], 'accs_top1': []}
    val_log = {'iters': [], 'losses': [], 'accs_top1': []}
    
    with fluid.dygraph.guard(PLACE): 
        model = CNN() # instantiate the model
        
        # Start the training process
        train(model) 
        
# Recorded results of earlier runs:
# training finished, final accuracy=0.97864 (epoch=10), total time 52.69s, saved as best_model
# training finished, final accuracy=0.98348 (epoch=19), total time 105.66s, saved as best_model

启动训练...
[validation] Epoch:1/40, test_loss:[4.07275], test_accuracy:[0.14423]
当前性能最好的模型 epoch_1 的精度: 0.14423, 已将其赋值为：best_model
Epoch:2/40, batch:100, train_loss:[3.07254], train_accuracy:[0.] (0.90s)
[validation] Epoch:2/40, test_loss:[3.97742], test_accuracy:[0.17668]
当前性能最好的模型 epoch_2 的精度: 0.17668, 已将其赋值为：best_model
Epoch:3/40, batch:200, train_loss:[2.03744], train_accuracy:[0.19531] (0.87s)
[validation] Epoch:3/40, test_loss:[3.99710], test_accuracy:[0.12200]
当前性能最好的模型 epoch_2 的精度: 0.17668, 已将其赋值为：best_model
Epoch:4/40, batch:300, train_loss:[0.0494], train_accuracy:[1.] (0.87s)
[validation] Epoch:4/40, test_loss:[3.82511], test_accuracy:[0.29147]
当前性能最好的模型 epoch_4 的精度: 0.29147, 已将其赋值为：best_model
Epoch:5/40, batch:400, train_loss:[0.88937], train_accuracy:[0.85156] (0.86s)
[validation] Epoch:5/40, test_loss:[3.55012], test_accuracy:[0.32572]
当前性能最好的模型 epoch_5 的精度: 0.32572, 已将其赋值为：best_model
Epoch:6/40, batch:500, train_loss:[3.35874], train_accuracy:[0.00781] (1.03s)
[validation] Epoch:6/40, test_loss:[3.27110], test_accuracy:[0.39603]
当前性能最好的模型 epoch_6 的精度: 0.39603, 已将其赋值为：best_model
Epoch:7/40, batch:600, train_loss:[3.55404], train_accuracy:[0.07812] (0.90s)
[validation] Epoch:7/40, test_loss:[2.67955], test_accuracy:[0.47656]
当前性能最好的模型 epoch_7 的精度: 0.47656, 已将其赋值为：best_model
Epoch:8/40, batch:700, train_loss:[3.85814], train_accuracy:[0.] (0.86s)
[validation] Epoch:8/40, test_loss:[2.24445], test_accuracy:[0.56731]
当前性能最好的模型 epoch_8 的精度: 0.56731, 已将其赋值为：best_model
[validation] Epoch:9/40, test_loss:[1.80623], test_accuracy:[0.61001]
当前性能最好的模型 epoch_9 的精度: 0.61001, 已将其赋值为：best_model
Epoch:10/40, batch:800, train_loss:[0.45419], train_accuracy:[0.90625] (0.97s)
[validation] Epoch:10/40, test_loss:[2.38987], test_accuracy:[0.53095]
当前性能最好的模型 epoch_9 的精度: 0.61001, 已将其赋值为：best_model
Epoch:11/40, batch:900, train_loss:[0.18748], train_accuracy:[0.98438] (0.86s)
[validation] Epoch:11/40, test_loss:[1.61611], test_accuracy:[0.62744]
当前性能最好的模型 epoch_11 的精度: 0.62744, 已将其赋值为：best_model
Epoch:12/40, batch:1000, train_loss:[1.29553], train_accuracy:[0.71875] (0.86s)
[validation] Epoch:12/40, test_loss:[1.37060], test_accuracy:[0.69882]
当前性能最好的模型 epoch_12 的精度: 0.69882, 已将其赋值为：best_model
Epoch:13/40, batch:1100, train_loss:[0.3879], train_accuracy:[0.92188] (0.87s)
[validation] Epoch:13/40, test_loss:[1.14783], test_accuracy:[0.72992]
当前性能最好的模型 epoch_13 的精度: 0.72992, 已将其赋值为：best_model
Epoch:14/40, batch:1200, train_loss:[0.87254], train_accuracy:[0.6875] (0.88s)
[validation] Epoch:14/40, test_loss:[1.10103], test_accuracy:[0.74189]
当前性能最好的模型 epoch_14 的精度: 0.74189, 已将其赋值为：best_model
Epoch:15/40, batch:1300, train_loss:[1.48974], train_accuracy:[0.66406] (0.86s)
[validation] Epoch:15/40, test_loss:[1.07390], test_accuracy:[0.74680]
当前性能最好的模型 epoch_15 的精度: 0.74680, 已将其赋值为：best_model
Epoch:16/40, batch:1400, train_loss:[1.58466], train_accuracy:[0.60938] (0.87s)
[validation] Epoch:16/40, test_loss:[1.21864], test_accuracy:[0.71283]
当前性能最好的模型 epoch_15 的精度: 0.74680, 已将其赋值为：best_model
[validation] Epoch:17/40, test_loss:[0.91765], test_accuracy:[0.77633]
当前性能最好的模型 epoch_17 的精度: 0.77633, 已将其赋值为：best_model
Epoch:18/40, batch:1500, train_loss:[0.31404], train_accuracy:[0.94531] (0.97s)
[validation] Epoch:18/40, test_loss:[0.78194], test_accuracy:[0.81254]
当前性能最好的模型 epoch_18 的精度: 0.81254, 已将其赋值为：best_model
Epoch:19/40, batch:1600, train_loss:[0.11698], train_accuracy:[0.96875] (0.89s)
[validation] Epoch:19/40, test_loss:[0.74436], test_accuracy:[0.83530]
当前性能最好的模型 epoch_19 的精度: 0.83530, 已将其赋值为：best_model
Epoch:20/40, batch:1700, train_loss:[0.15437], train_accuracy:[0.96094] (1.03s)
[validation] Epoch:20/40, test_loss:[0.69880], test_accuracy:[0.82470]
当前性能最好的模型 epoch_19 的精度: 0.83530, 已将其赋值为：best_model
Epoch:21/40, batch:1800, train_loss:[0.07969], train_accuracy:[0.97656] (0.97s)
[validation] Epoch:21/40, test_loss:[0.70179], test_accuracy:[0.84374]
当前性能最好的模型 epoch_21 的精度: 0.84374, 已将其赋值为：best_model
Epoch:22/40, batch:1900, train_loss:[0.54401], train_accuracy:[0.84375] (0.94s)
[validation] Epoch:22/40, test_loss:[0.58002], test_accuracy:[0.85237]
当前性能最好的模型 epoch_22 的精度: 0.85237, 已将其赋值为：best_model
Epoch:23/40, batch:2000, train_loss:[0.83155], train_accuracy:[0.75] (0.96s)
[validation] Epoch:23/40, test_loss:[0.54806], test_accuracy:[0.87272]
当前性能最好的模型 epoch_23 的精度: 0.87272, 已将其赋值为：best_model
Epoch:24/40, batch:2100, train_loss:[0.58758], train_accuracy:[0.89062] (0.90s)
[validation] Epoch:24/40, test_loss:[0.50172], test_accuracy:[0.86901]
当前性能最好的模型 epoch_23 的精度: 0.87272, 已将其赋值为：best_model
Epoch:25/40, batch:2200, train_loss:[0.82464], train_accuracy:[0.81443] (0.91s)
[validation] Epoch:25/40, test_loss:[0.43689], test_accuracy:[0.88945]
当前性能最好的模型 epoch_25 的精度: 0.88945, 已将其赋值为：best_model
[validation] Epoch:26/40, test_loss:[0.38249], test_accuracy:[0.90288]
当前性能最好的模型 epoch_26 的精度: 0.90288, 已将其赋值为：best_model
Epoch:27/40, batch:2300, train_loss:[0.07135], train_accuracy:[0.97656] (1.11s)
[validation] Epoch:27/40, test_loss:[0.33852], test_accuracy:[0.92130]
当前性能最好的模型 epoch_27 的精度: 0.92130, 已将其赋值为：best_model
Epoch:28/40, batch:2400, train_loss:[0.03607], train_accuracy:[0.99219] (0.92s)
[validation] Epoch:28/40, test_loss:[0.33881], test_accuracy:[0.90698]
当前性能最好的模型 epoch_27 的精度: 0.92130, 已将其赋值为：best_model
Epoch:29/40, batch:2500, train_loss:[0.11255], train_accuracy:[0.98438] (0.87s)
[validation] Epoch:29/40, test_loss:[0.30653], test_accuracy:[0.92391]
当前性能最好的模型 epoch_29 的精度: 0.92391, 已将其赋值为：best_model
Epoch:30/40, batch:2600, train_loss:[0.15478], train_accuracy:[0.96094] (0.88s)
[validation] Epoch:30/40, test_loss:[0.29564], test_accuracy:[0.92140]
当前性能最好的模型 epoch_29 的精度: 0.92391, 已将其赋值为：best_model
Epoch:31/40, batch:2700, train_loss:[0.52736], train_accuracy:[0.84375] (0.87s)
[validation] Epoch:31/40, test_loss:[0.26435], test_accuracy:[0.93282]
当前性能最好的模型 epoch_31 的精度: 0.93282, 已将其赋值为：best_model
Epoch:32/40, batch:2800, train_loss:[0.30632], train_accuracy:[0.92969] (0.86s)
[validation] Epoch:32/40, test_loss:[0.25930], test_accuracy:[0.92992]
当前性能最好的模型 epoch_31 的精度: 0.93282, 已将其赋值为：best_model
Epoch:33/40, batch:2900, train_loss:[0.31913], train_accuracy:[0.94531] (0.86s)
[validation] Epoch:33/40, test_loss:[0.24070], test_accuracy:[0.93554]
当前性能最好的模型 epoch_33 的精度: 0.93554, 已将其赋值为：best_model
[validation] Epoch:34/40, test_loss:[0.23492], test_accuracy:[0.93684]
当前性能最好的模型 epoch_34 的精度: 0.93684, 已将其赋值为：best_model
Epoch:35/40, batch:3000, train_loss:[0.07634], train_accuracy:[0.99219] (0.98s)
[validation] Epoch:35/40, test_loss:[0.22327], test_accuracy:[0.93995]
当前性能最好的模型 epoch_35 的精度: 0.93995, 已将其赋值为：best_model
Epoch:36/40, batch:3100, train_loss:[0.21794], train_accuracy:[0.97656] (0.86s)
[validation] Epoch:36/40, test_loss:[0.21491], test_accuracy:[0.93995]
当前性能最好的模型 epoch_35 的精度: 0.93995, 已将其赋值为：best_model
Epoch:37/40, batch:3200, train_loss:[0.08067], train_accuracy:[0.99219] (0.87s)
[validation] Epoch:37/40, test_loss:[0.20955], test_accuracy:[0.94406]
当前性能最好的模型 epoch_37 的精度: 0.94406, 已将其赋值为：best_model
Epoch:38/40, batch:3300, train_loss:[0.15168], train_accuracy:[0.96875] (0.88s)
[validation] Epoch:38/40, test_loss:[0.20086], test_accuracy:[0.94667]
当前性能最好的模型 epoch_38 的精度: 0.94667, 已将其赋值为：best_model
Epoch:39/40, batch:3400, train_loss:[0.32322], train_accuracy:[0.85156] (0.87s)
[validation] Epoch:39/40, test_loss:[0.19395], test_accuracy:[0.94787]
当前性能最好的模型 epoch_39 的精度: 0.94787, 已将其赋值为：best_model
Epoch:40/40, batch:3500, train_loss:[0.23203], train_accuracy:[0.96094] (0.88s)
[validation] Epoch:40/40, test_loss:[0.18764], test_accuracy:[0.94957]
当前性能最好的模型 epoch_40 的精度: 0.94957, 已将其赋值为：best_model
训练完成，最终性能accuracy=0.94957(epoch=40), 总耗时31.99s, 已将其保存为：best_model


# Offline test: load the saved best model and evaluate it on the test list
with fluid.dygraph.guard(PLACE):
    model_dict, _ = fluid.load_dygraph(os.path.join(final_models_path, 'best_model'))
    model = CNN() # instantiate the model
    model.load_dict(model_dict) # load the saved parameters
 
    # Run the evaluation (no training happens here)
    _, avg_acc = test(model, test_reader())            
    print('测试集精度为:{:.5f}'.format(avg_acc))

测试集精度为:0.95714


# 导入依赖库
import os
import cv2
import json
import numpy as np
import paddle                      # 载入PaddlePaddle基本库
import paddle.fluid as fluid       # 载入基于fluid框架的paddle
from paddle.fluid.dygraph import Linear, Conv2D, Pool2D
import matplotlib.pyplot as plt    # 载入python的第三方图像处理库

# Configuration for the inference cell: where the trained model was saved
dataset_name      = 'VehicleLicense'
architecture      = 'CNN'
result_root_path  = 'D:\\Workspace\\ExpResults\\'
# Folder holding 'best_model': <results>/Project06CNN/<dataset_name>_<architecture>/final_models
final_model_path  = os.path.join(result_root_path, 'Project06CNN', dataset_name + '_' + architecture, 'final_models')


def load_image(img_path):
    """Load one image file as a normalised network input.

    Args:
        img_path: path of the image file.

    Returns:
        float32 array of shape (img_channel, img_size, img_size) with pixel
        values divided by 255.

    Raises:
        FileNotFoundError: if OpenCV cannot read the file.
    """
    img = cv2.imread(img_path, 0)                    # flag 0: load as grayscale
    if img is None:
        # cv2.imread signals a missing/unreadable file by returning None; fail here
        # with the path instead of with an opaque error inside cv2.resize.
        raise FileNotFoundError('cannot read image: {}'.format(img_path))
    img = cv2.resize(img, (img_size, img_size))      # resize to img_size x img_size
    img = np.array(img).reshape(img_channel, img_size, img_size).astype('float32')   # (channel, height, width) layout
    img = img/255.0                                  # scale to [0, 1]; for [-1, 1] use img/255.0*2.0-1.0
    return img

# 将图像转换为二值模式
def color2bin(img_path):
    """Read an image as grayscale and binarise it.

    Args:
        img_path: path of the image file.

    Returns:
        The image thresholded with cv2.THRESH_BINARY at threshold 120 and
        maximum value 255.
    """
    gray = cv2.imread(img_path, 0)    # flag 0: load as grayscale
    _, binary = cv2.threshold(gray, 120, 255, cv2.THRESH_BINARY)
    return binary


# 定义车牌字符分割函数，实现将车牌分割成单字符
def Segmentation(img_path, img_name):
    """Split a licence-plate image into single-character images.

    The plate is binarised, then cut at every run of empty columns. The first
    eight column runs are used; run 2 is skipped (presumably the separator dot
    of the plate - confirm against the input images). Each remaining run is
    padded left and right with black, resized to 20x20 and written to
    ``<img_path>/tmp/<run index>.png``.

    Args:
        img_path: directory containing the plate image; the 'tmp' output
            folder is created inside it.
        img_name: file name of the plate image.

    Raises:
        ValueError: if fewer than eight column runs are found.
    """
    img_bin = color2bin(os.path.join(img_path, img_name))
    print(img_bin.shape)

    # Vertical projection: a column belongs to a character when it contains
    # at least one foreground (non-zero) pixel.
    has_ink = np.any(img_bin > 0, axis=0)
    num_cols = has_ink.shape[0]

    # Collect the half-open column spans [start, stop) of consecutive inked columns.
    spans = []
    col = 0
    while col < num_cols:
        if not has_ink[col]:
            col += 1
            continue
        stop = col + 1
        # The bound check keeps a character that touches the right image edge
        # from running past the last column.
        while stop < num_cols and has_ink[stop]:
            stop += 1
        spans.append((col, stop))
        col = stop

    num_segments = 8
    if len(spans) < num_segments:
        raise ValueError('expected at least {} character segments, found {}'.format(num_segments, len(spans)))

    tmp_path = os.path.join(img_path, 'tmp')
    os.makedirs(tmp_path, exist_ok=True)

    height = img_bin.shape[0]
    for i in range(num_segments):
        if i == 2:
            continue
        start, stop = spans[i]
        # Pad the crop towards a square of the image height (the sample plate is
        # 170 pixels high); a crop wider than the image is left unpadded.
        padding = max(0, (height - (stop - start)) // 2)
        ndarray = np.pad(img_bin[:, start:stop], ((0, 0), (padding, padding)), 'constant', constant_values=(0, 0))
        ndarray = cv2.resize(ndarray, (20, 20))
        cv2.imwrite(os.path.join(tmp_path, str(i) + '.png'), ndarray)
        
######################################################################        
# 输出二值化后的图像示例
if __name__ == "__main__":
    # Demo: binarise one sample plate from the dataset's Infer folder, print the array and show it
    img_name = 'test02.png'                            
    img_path = os.path.join(dataset_root_path, 'Infer')

    img_bin = color2bin(os.path.join(img_path, img_name))
    print(img_bin)
    plt.imshow(img_bin, cmap='gray')

[[0 0 0 ... 0 0 0]
 [0 0 0 ... 0 0 0]
 [0 0 0 ... 0 0 0]
 ...
 [0 0 0 ... 0 0 0]
 [0 0 0 ... 0 0 0]
 [0 0 0 ... 0 0 0]]


# 0. Select the sample to predict
img_name = 'test02.png'
img_path = os.path.join(dataset_root_path, 'Infer')

# 1. Load the mapping between label ids and label names (stored under 'label_dict')
json_label_match = os.path.join(dataset_root_path, 'dataset_info.json')
with open(json_label_match, 'r', encoding='utf-8') as f_label_match:
    label_match = json.load(f_label_match)

# 2. Run the prediction in dygraph mode
with fluid.dygraph.guard():
    model = CNN()  # instantiate the model
    model_dict, _ = fluid.load_dygraph(os.path.join(final_model_path, 'best_model'))
    model.load_dict(model_dict)  # load the saved parameters
    model.eval()  # evaluation mode

    Segmentation(img_path, img_name)  # cut the plate into binarised single-character images under tmp/
    lab = []  # predicted label id of every character, in plate order
    for i in range(8):
        if i == 2:
            continue  # Segmentation writes no image for segment 2
        # A batch containing the single character image
        infer_imgs = np.array([load_image(os.path.join(img_path, 'tmp', str(i) + '.png'))])
        infer_imgs = fluid.dygraph.to_variable(infer_imgs)
        result = model(infer_imgs)
        lab.append(np.argmax(result.numpy()))

# 3. Print the recognised plate and show the input image
print('\n车牌识别结果为：',end='')
for label_id in lab:
    print(label_match['label_dict'][str(label_id)], end='')
display(Image.open(os.path.join(img_path, img_name)))

(170, 722)

车牌识别结果为：京N8P8F8

Layer	Input	Kernels_num	Kernels_size	Stride	Padding	PoolingType	Output	Parameters
Input	1×20×20
Conv1	1×20×20	28	1×5×5	1	0		28×16×16	(1×5×5+1)×28=728
Pool1	28×16×16	28	28×2×2	1	0	max	28×15×15	0
Conv2	28×15×15	32	28×3×3	1	0		32×13×13	(28×3×3+1)×32=8096
Pool2	32×13×13	32	32×2×2	1	0	max	32×12×12	0
Conv3	32×12×12	32	32×3×3	1	0		32×10×10	(32×3×3+1)×32=9248
FC1	(32×10×10)×1						65×1	(32×10×10+1)×65=208065
Output							65×1
								Total = 226137

【项目04】基于卷积神经网络CNN的图片识别 —— 车牌识别¶

【实验目的】¶

【实验要求】¶

【实验一】数据集准备¶

1.1 数据集介绍¶

1.2 数据集预处理¶

1.2.1 处理数据集中样本命名的非法字符¶

1.2.2 生成数据列表¶

【实验二】全局参数设置及数据准备¶

2.1 导入依赖及全局参数设置¶

2.2 数据预处理¶

2.3 设置训练和测试数据提供器¶

2.4 定义过程可视化函数¶

【实验三】模型训练与评估¶

3.1 配置网络¶

3.1.1 网络拓扑结构图¶

3.1.2 网络参数配置表¶

3.1.3 定义神经网络类¶

3.2 模型训练及评估¶

3.2.1 定义测试函数¶

3.2.2 定义训练函数¶

3.2.3 训练主函数¶

3.2.4 离线测试¶

【实验四】模型预测（应用）¶

4.1 导入依赖库及全局参数配置¶

4.2 获取待预测数据及数据预处理¶

4.3 载入模型并开始进行推理¶

【项目04】基于卷积神经网络CNN的图片识别 —— 车牌识别¶

【实验目的】¶

【实验要求】¶

【实验一】 数据集准备¶

1.1 数据集介绍¶

1.2 数据集预处理¶

1.2.1 处理数据集中样本命名的非法字符¶

1.2.2 生成数据列表¶

【实验二】 全局参数设置及数据准备¶

2.1 导入依赖及全局参数设置¶

2.2 数据预处理¶

2.3 设置训练和测试数据提供器¶

2.4 定义过程可视化函数¶

【实验三】 模型训练与评估¶

3.1 配置网络¶

3.1.1 网络拓扑结构图¶

3.1.2 网络参数配置表¶

3.1.3 定义神经网络类¶

3.2 模型训练及评估¶

3.2.1 定义测试函数¶

3.2.2 定义训练函数¶

3.2.3 训练主函数¶

3.2.4 离线测试¶

【实验四】 模型预测（应用）¶

4.1 导入依赖库及全局参数配置¶

4.2 获取待预测数据及数据预处理¶

4.3 载入模型并开始进行推理¶

【实验一】数据集准备¶

【实验二】全局参数设置及数据准备¶

【实验三】模型训练与评估¶

【实验四】模型预测（应用）¶