master

分支 (1)

管理

管理

master

tflite_train
/
train.py

# -*- coding: utf-8 -*-
import json

import tensorflow as tf
import numpy as np
import matplotlib.pyplot as plt
import time
from PIL import Image
import random
import os
from cnn import CNN


class TrainError(Exception):
    pass


class TrainModel(CNN):
    def __init__(self, cycle_train, max_captcha, train_img_path, verify_img_path, char_set, model_save_dir, cycle_stop, acc_stop, cycle_save,
                 image_suffix, image_width, image_height, train_batch_size, test_batch_size, verify=False):
        # 训练相关参数
        self.cycle_stop = cycle_stop
        self.cycle_train = cycle_train
        self.acc_stop = acc_stop
        self.cycle_save = cycle_save
        self.train_batch_size = train_batch_size
        self.test_batch_size = test_batch_size

        self.image_suffix = image_suffix
        self.image_height = image_height
        self.image_width = image_width
        self.max_captcha = max_captcha
        char_set = [str(i) for i in char_set]

        # 打乱文件顺序+校验图片格式
        self.train_img_path = train_img_path
        self.train_images_list = os.listdir(train_img_path)
        # 校验格式
        if verify:
            self.confirm_image_suffix()
        # 打乱文件顺序
        random.seed(time.time())
        random.shuffle(self.train_images_list)

        # 验证集文件
        self.verify_img_path = verify_img_path
        self.verify_images_list = os.listdir(verify_img_path)

        # 初始化变量
        super(TrainModel, self).__init__(image_height, image_width,
                                         int(max_captcha), char_set, model_save_dir)

        # 相关信息打印
        print("-->图片尺寸: {} X {}".format(image_height, image_width))
        print("-->验证码长度: {}".format(self.max_captcha))
        print("-->验证码共{}类 {}".format(self.char_set_len, char_set))
        print("-->使用测试集为 {}".format(train_img_path))
        print("-->使验证集为 {}".format(verify_img_path))

        # test model input and output
        print(">>> Start model test")
        batch_x, batch_y = self.get_batch(0, size=train_batch_size)
        print(">>> input batch images shape: {}".format(batch_x.shape))
        print(">>> input batch labels shape: {}".format(batch_y.shape))

    def gen_captcha_text_image(self, img_path, img_name, width, height):
        """
        返回一个验证码的array形式和对应的字符串标签
        :return:tuple (str, numpy.array)
        """
        # 标签
        label = img_name.split("_")[0]
        # 文件
        img_file = os.path.join(img_path, img_name)
        captcha_image = Image.open(img_file)
        captcha_array = self.img2input(captcha_image, width, height)  # 图片转输入向量
        return label, captcha_array

    def img2input(self, img, width, height):
        img = np.array(img)
        test_image = 0.3 * img[:, :, 0] + 0.6 * \
            img[:, :, 1] + 0.1 * img[:, :, 2]
        tmpe_array = test_image.flatten() / 255
        input_array = np.expand_dims(tmpe_array, axis=0)
        return input_array

    def get_batch(self, n, size=128):
        batch_x = np.zeros([size, self.image_height * self.image_width])  # 初始化
        batch_y = np.zeros([size, self.max_captcha * self.char_set_len])  # 初始化
        max_batch = int(len(self.train_images_list) / size)
        if max_batch - 1 < 0:
            raise TrainError("训练集图片数量需要大于每批次训练的图片数量")
        if n > max_batch - 1:
            n = n % max_batch
        s = n * size
        e = (n + 1) * size
        this_batch = self.train_images_list[s:e]

        for i, img_name in enumerate(this_batch):
            label, image_array = self.gen_captcha_text_image(
                self.train_img_path, img_name, self.image_width, self.image_height)
            batch_x[i, :] = image_array  # 输入图片数组
            batch_y[i, :] = self.text2vec(label)  # 生成 oneHot
        return batch_x, batch_y

    def get_verify_batch(self, size=100):
        batch_x = np.zeros([size, self.image_height * self.image_width])  # 初始化
        batch_y = np.zeros([size, self.max_captcha * self.char_set_len])  # 初始化

        verify_images = []
        for i in range(size):
            verify_images.append(random.choice(self.verify_images_list))

        for i, img_name in enumerate(verify_images):
            label, image_array = self.gen_captcha_text_image(
                self.verify_img_path, img_name, self.image_width, self.image_height)
            batch_x[i, :] = image_array  # 输入图片数组
            batch_y[i, :] = self.text2vec(label)  # 生成 oneHot
        return batch_x, batch_y

    def confirm_image_suffix(self):
        # 在训练前校验所有文件格式
        print("开始校验所有图片后缀")
        for index, img_name in enumerate(self.train_images_list):
            print("{} image pass".format(index), end='\r')
            if not img_name.endswith(self.image_suffix):
                raise TrainError('confirm images suffix：you request [.{}] file but get file [{}]'
                                 .format(self.image_suffix, img_name))
        print("所有图片格式校验通过")

    def train_cnn(self):
        y_predict = self.model()
        print(">>> input batch predict shape: {}".format(y_predict.shape))
        print(">>> End model test")
        # 计算概率 损失
        with tf.compat.v1.name_scope('cost'):
            cost = tf.reduce_mean(input_tensor=tf.nn.sigmoid_cross_entropy_with_logits(
                logits=y_predict, labels=self.Y))
        # 梯度下降
        with tf.compat.v1.name_scope('train'):
            optimizer = tf.compat.v1.train.AdamOptimizer(
                learning_rate=0.0001).minimize(cost)
        # 计算准确率
        predict = tf.reshape(
            y_predict, [-1, self.max_captcha, self.char_set_len])  # 预测结果
        max_idx_p = tf.argmax(input=predict, axis=2)  # 预测结果
        max_idx_l = tf.argmax(input=tf.reshape(
            self.Y, [-1, self.max_captcha, self.char_set_len]), axis=2)  # 标签
        # 计算准确率
        correct_pred = tf.equal(max_idx_p, max_idx_l)
        with tf.compat.v1.name_scope('char_acc'):
            accuracy_char_count = tf.reduce_mean(
                input_tensor=tf.cast(correct_pred, tf.float32))
        with tf.compat.v1.name_scope('image_acc'):
            accuracy_image_count = tf.reduce_mean(input_tensor=tf.reduce_min(
                input_tensor=tf.cast(correct_pred, tf.float32), axis=1))
        # 模型保存对象
        saver = tf.compat.v1.train.Saver()
        with tf.compat.v1.Session() as sess:
            init = tf.compat.v1.global_variables_initializer()
            sess.run(init)
            # 恢复模型
            if os.path.exists(self.model_save_dir):
                try:
                    saver.restore(sess, self.model_save_dir)
                # 判断捕获model文件夹中没有模型文件的错误
                except ValueError:
                    print("model文件夹为空，将创建新模型")
            else:
                pass
            # 写入日志
            tf.compat.v1.summary.FileWriter("logs/", sess.graph)

            step = 1
            for i in range(self.cycle_stop):
                batch_x, batch_y = self.get_batch(
                    i, size=self.train_batch_size)
                # 梯度下降训练
                _, cost_ = sess.run([optimizer, cost],
                                    feed_dict={self.X: batch_x, self.Y: batch_y})
                if step % self.cycle_train == 0:  # 输出一次日志
                    # 基于训练集的测试
                    batch_x_test, batch_y_test = self.get_batch(
                        i, size=self.train_batch_size)
                    acc_char = sess.run(accuracy_char_count, feed_dict={
                                        self.X: batch_x_test, self.Y: batch_y_test})
                    acc_image = sess.run(accuracy_image_count, feed_dict={
                                         self.X: batch_x_test, self.Y: batch_y_test})
                    print("第{}次训练 >>> ".format(step))
                    print("[训练集] 字符准确率为 {:.5f} 图片准确率为 {:.5f} >>> loss {:.10f}".format(
                        acc_char, acc_image, cost_))

                    # 基于验证集的测试
                    batch_x_verify, batch_y_verify = self.get_verify_batch(
                        size=self.test_batch_size)
                    acc_char = sess.run(accuracy_char_count, feed_dict={
                                        self.X: batch_x_verify, self.Y: batch_y_verify})
                    acc_image = sess.run(accuracy_image_count, feed_dict={
                                         self.X: batch_x_verify, self.Y: batch_y_verify})
                    print("[验证集] 字符准确率为 {:.5f} 图片准确率为 {:.5f} >>> loss {:.10f}".format(
                        acc_char, acc_image, cost_))

                    # 准确率达到acc_stop后保存并停止
                    if acc_image > self.acc_stop:
                        saver.save(sess, self.model_save_dir)
                        print("验证集准确率达到{}%，保存模型成功".format(self.acc_stop*100))
                        break

                # 每训练cycle_save轮就保存一次
                if i % self.cycle_save == 0:
                    saver.save(sess, self.model_save_dir)
                    print("定时保存模型成功")
                step += 1
            saver.save(sess, self.model_save_dir)


def main():
    with open("config.json", "r") as f:
        sample_conf = json.load(f)

    train_image_dir = sample_conf["train_image_dir"]
    verify_image_dir = sample_conf["test_image_dir"]
    model_save_dir = sample_conf["model_save_dir"]
    cycle_stop = sample_conf["cycle_stop"]
    cycle_train = sample_conf["cycle_train"]
    acc_stop = sample_conf["acc_stop"]
    cycle_save = sample_conf["cycle_save"]
    enable_gpu = sample_conf["enable_gpu"]
    image_suffix = sample_conf['image_suffix']
    image_width = sample_conf['image_width']
    image_height = sample_conf['image_height']
    max_captcha = sample_conf['max_captcha']
    train_batch_size = sample_conf['train_batch_size']
    test_batch_size = sample_conf['test_batch_size']

    char_set = sample_conf["char_set"]

    if not enable_gpu:
        # 设置以下环境变量可开启CPU识别
        os.environ["CUDA_DEVICE_ORDER"] = "PCI_BUS_ID"
        os.environ["CUDA_VISIBLE_DEVICES"] = "-1"  # 禁用GPU

    tm = TrainModel(cycle_train, max_captcha, train_image_dir, verify_image_dir, char_set, model_save_dir, cycle_stop, acc_stop, cycle_save,
                    image_suffix, image_width, image_height, train_batch_size, test_batch_size, verify=False)
    tm.train_cnn()  # 开始训练模型


if __name__ == '__main__':
    main()