cnn汉字识别 tensorflow demo

# -*- coding: utf-8 -*-

import tensorflow as tf

import os

import random

import tensorflow.contrib.slim as slim

import time

import numpy as np

import pickle

from PIL import Image

# Run mode read by main(): "train" calls train(), "inference" runs
# new_inference() and writes the result file.
mode = "inference"

# Width of the final fully connected layer in build_graph(), i.e. the number
# of classes the network distinguishes.
char_size = 3755

# NOTE(review): `epochs` is not referenced by any code visible in this file.
epochs = 5

# Batch size that train() passes to DataIterator.input_pipeline().
batch_size = 128

# Directory where train() writes checkpoints and new_inference() reads them.
checkpoint_dir = '/aiml/code/'

# NOTE(review): train() reads module-level `train_data_dir` and
# `test_data_dir`. Both exist only as the commented-out assignments below, so
# they have to be defined before the script can run in "train" mode.
#train_data_dir = 'D:/Yang/softwares/Spider_ws/WordRecognition/data/train/'

#test_data_dir = 'D:/Yang/softwares/Spider_ws/WordRecognition/data/test/'

class DataIterator:
    """Index a tree of labelled image files and expose it as a TF1 input queue.

    The label of an image is the integer name of the first directory below
    ``data_dir`` on the image's path, i.e. the expected layout is
    ``<data_dir>/<integer label>/.../<image file>``.
    """

    def __init__(self, data_dir):
        """Collect every file below *data_dir* and derive its integer label.

        Args:
            data_dir: Root directory of the data set. It may be given with or
                without a trailing path separator.

        Raises:
            ValueError: If the first path component of a file relative to
                *data_dir* is not an integer (for example a file that lies
                directly inside *data_dir*).
        """
        self.image_names = []
        for root, _, file_list in os.walk(data_dir):
            self.image_names += [os.path.join(root, file_name) for file_name in file_list]
        # Shuffle before deriving labels so both lists stay index-aligned.
        random.shuffle(self.image_names)
        # os.path.relpath is used instead of slicing by len(data_dir): slicing
        # leaves a leading separator when data_dir has no trailing one, which
        # made the first component '' and int('') raise ValueError.
        self.labels = [
            int(os.path.relpath(image_name, data_dir).split(os.sep)[0])
            for image_name in self.image_names
        ]

    @property
    def size(self):
        """Number of indexed images."""
        return len(self.labels)

    def input_pipeline(self, batch_size, num_epochs=None):
        """Build queue-based ops that yield shuffled (image, label) batches.

        Each file is read, decoded as a single-channel PNG, converted to
        float32 with ``tf.image.convert_image_dtype`` and resized to 64x64.

        Args:
            batch_size: Number of examples per dequeued batch.
            num_epochs: Forwarded to ``tf.train.slice_input_producer``.

        Returns:
            Tuple ``(image_batch, label_batch)`` of tensors produced by
            ``tf.train.shuffle_batch``.
        """
        images_tensor = tf.convert_to_tensor(self.image_names, dtype=tf.string)
        labels_tensor = tf.convert_to_tensor(self.labels, dtype=tf.int64)
        input_queue = tf.train.slice_input_producer([images_tensor, labels_tensor], num_epochs=num_epochs)

        labels = input_queue[1]
        images_content = tf.read_file(input_queue[0])
        images = tf.image.convert_image_dtype(tf.image.decode_png(images_content, channels=1), tf.float32)
        new_size = tf.constant([64, 64], dtype=tf.int32)
        images = tf.image.resize_images(images, new_size)

        image_batch, label_batch = tf.train.shuffle_batch([images, labels], batch_size=batch_size, capacity=50000,
                                                          min_after_dequeue=10000)
        return image_batch, label_batch

def build_graph(top_k):
    """Assemble the classification network together with its training ops.

    Three conv/max-pool stages (64, 128, 256 filters, scopes 'conv1'..'conv3')
    feed a 1024-unit tanh layer ('fc1') and a linear layer of `char_size`
    units ('output_logit'). The softmax of the logits is additionally exposed
    in the graph under the op name 'prediction' so it can be fetched by name.

    Args:
        top_k: Accepted by the signature but not used in the body.

    Returns:
        dict with the tensors/ops 'images', 'labels', 'global_step',
        'train_op', 'loss' and 'accuracy'.
    """
    image_input = tf.placeholder(dtype=tf.float32, shape=[None, 64, 64, 1], name='input_image')
    label_input = tf.placeholder(dtype=tf.int64, shape=[None], name='label_batch')

    # Feature extractor: each stage is a 3x3 convolution followed by a 2x2,
    # stride-2 max pool.
    net = image_input
    for stage, depth in enumerate((64, 128, 256), start=1):
        net = slim.conv2d(net, depth, [3, 3], padding='SAME', scope='conv{0}'.format(stage))
        net = slim.max_pool2d(net, [2, 2], [2, 2], padding='SAME')

    # Classifier head.
    flat = slim.flatten(net)
    hidden = slim.fully_connected(flat, 1024, activation_fn=tf.nn.tanh, scope='fc1')
    logits = slim.fully_connected(hidden, char_size, activation_fn=None, scope='output_logit')

    cross_entropy = tf.nn.sparse_softmax_cross_entropy_with_logits(logits=logits, labels=label_input)
    mean_loss = tf.reduce_mean(cross_entropy)

    is_correct = tf.equal(tf.argmax(logits, 1), label_input)
    mean_accuracy = tf.reduce_mean(tf.cast(is_correct, tf.float32))

    # The step counter is created through a float constant initializer.
    step_var = tf.get_variable("step", [], initializer=tf.constant_initializer(0.0), trainable=False)
    learning_rate = tf.train.exponential_decay(2e-4, step_var, decay_steps=2000, decay_rate=0.97, staircase=True)
    optimizer = tf.train.AdamOptimizer(learning_rate=learning_rate)
    minimize_op = optimizer.minimize(mean_loss, global_step=step_var)

    # Not returned, but must be created: it gives the softmax output the
    # stable name 'prediction' in the graph.
    tf.identity(tf.nn.softmax(logits), name='prediction')

    outputs = {}
    outputs['images'] = image_input
    outputs['labels'] = label_input
    outputs['global_step'] = step_var
    outputs['train_op'] = minimize_op
    outputs['loss'] = mean_loss
    outputs['accuracy'] = mean_accuracy
    return outputs

def train(train_dir=None, test_dir=None):
    """Train the network, periodically evaluating and checkpointing it.

    Per step one training batch is dequeued and fed to the train op. When
    ``step % 10 == 1`` the loss is printed, when ``step % 50 == 1`` one test
    batch is evaluated, and when ``step % 200 == 1`` a checkpoint is written
    to ``checkpoint_dir``. Training stops once ``step`` exceeds 200000 or the
    input queue raises ``tf.errors.OutOfRangeError`` (a final checkpoint is
    written in the latter case).

    Args:
        train_dir: Root directory of the training images. Defaults to the
            module-level ``train_data_dir`` if that name is defined.
        test_dir: Root directory of the test images. Defaults to the
            module-level ``test_data_dir`` if that name is defined.

    Raises:
        ValueError: If a data directory is neither passed in nor defined at
            module level.
    """
    # The module-level train_data_dir / test_data_dir assignments are
    # commented out in this file, so referencing them directly raised
    # NameError. Look them up defensively and fail with a clear message.
    module_scope = globals()
    if train_dir is None:
        train_dir = module_scope.get('train_data_dir')
    if test_dir is None:
        test_dir = module_scope.get('test_data_dir')
    if train_dir is None or test_dir is None:
        raise ValueError(
            'train() needs training and test data directories: pass '
            'train_dir/test_dir or define train_data_dir/test_data_dir '
            'at module level')

    train_feeder = DataIterator(data_dir=train_dir)
    test_feeder = DataIterator(data_dir=test_dir)

    with tf.Session() as sess:
        train_images, train_labels = train_feeder.input_pipeline(batch_size)
        test_images, test_labels = test_feeder.input_pipeline(batch_size)
        graph = build_graph(top_k=1)

        sess.run(tf.global_variables_initializer())
        coord = tf.train.Coordinator()
        threads = tf.train.start_queue_runners(sess=sess, coord=coord)
        saver = tf.train.Saver()
        checkpoint_prefix = os.path.join(checkpoint_dir, 'my-model')

        print (':::Training Start:::')
        try:
            while not coord.should_stop():
                start_time = time.time()
                # Batches are pulled out of the queue and fed back through
                # placeholders, so the same graph serves train and eval data.
                train_images_batch, train_labels_batch = sess.run([train_images, train_labels])
                feed_dict = {graph['images']: train_images_batch,
                             graph['labels']: train_labels_batch}
                _, loss_val, step = sess.run(
                    [graph['train_op'], graph['loss'], graph['global_step']],
                    feed_dict=feed_dict)
                end_time = time.time()

                if step % 10 == 1:
                    print ("the step {0} takes {1} loss {2}".format(step, end_time - start_time, loss_val))
                if step > 200000:
                    break
                if step % 50 == 1:
                    test_images_batch, test_labels_batch = sess.run([test_images, test_labels])
                    feed_dict = {graph['images']: test_images_batch,
                                 graph['labels']: test_labels_batch}
                    accuracy_test = sess.run(graph['accuracy'], feed_dict=feed_dict)
                    print ('===============Eval a batch=======================')
                    print ('the step {0} test accuracy: {1}'.format(step, accuracy_test))
                    print ('===============Eval a batch=======================')
                if step % 200 == 1:
                    print ('Save the ckpt of {0}'.format(step))
                    saver.save(sess, checkpoint_prefix, global_step=graph['global_step'])
        except tf.errors.OutOfRangeError:
            print ('==================Train Finished================')
            saver.save(sess, checkpoint_prefix, global_step=graph['global_step'])
        finally:
            coord.request_stop()
        coord.join(threads)

def new_inference(predict_dir):
    """Classify every image below *predict_dir* with the saved model.

    Images are processed directory by directory in ``os.walk`` order; inside
    a directory they are ordered by the integer value of the file name with
    its last four characters (e.g. ``.png``) removed. Files whose name
    contains ``.nfs`` are skipped. Each image is converted to greyscale,
    resized to 64x64 and scaled by 1/255 before being fed to the graph.

    Args:
        predict_dir: Directory containing the images to classify.

    Returns:
        list with one entry per image, in processing order; each entry is an
        array holding the indices of the three highest-probability classes,
        best first.

    Raises:
        ValueError: If a file name (minus its last four characters) is not an
            integer.
    """
    saver = tf.train.import_meta_graph(checkpoint_dir + "my-model-164152.meta", clear_devices=True)

    image_list = []
    for root, _, file_list in os.walk(predict_dir):
        # Build the list per directory. Accumulating one list across walk
        # iterations re-joined earlier file names with the current root and
        # loaded them again whenever predict_dir contained a sub-directory.
        image_names = sorted(
            (name for name in file_list if ".nfs" not in name),
            key=lambda name: int(name[:-4]))
        for name in image_names:
            picture = Image.open(os.path.join(root, name)).convert('L')
            # Image.LANCZOS is the same filter as the former Image.ANTIALIAS
            # alias, which no longer exists in Pillow >= 10.
            picture = picture.resize((64, 64), Image.LANCZOS)
            image_list.append(np.asarray(picture) / 255.0)

    # Size the batch from the images actually loaded.
    image_batch = np.asarray(image_list).reshape([len(image_list), 64, 64, 1])

    with tf.Session() as sess:
        # Load the model parameters.
        saver.restore(sess, checkpoint_dir + "my-model-164152")
        graph = tf.get_default_graph()
        prediction = graph.get_tensor_by_name("prediction:0")
        input_tensor = graph.get_tensor_by_name('input_image:0')
        probs = sess.run(prediction, feed_dict={input_tensor: image_batch})
        # argsort of the negated probabilities yields descending order.
        return [np.argsort(-word)[:3] for word in probs]

def main():
    """Run the action selected by the module-level ``mode``.

    "train" calls train(). "inference" classifies the images in
    ``/aiml/data/`` and writes the top-1 character of every image, in order
    and without separators, to ``/aiml/result/result.txt``. Class indices are
    mapped to characters through the pickled dictionary
    ``/aiml/code/word_dict``, which is keyed by the index as a string.
    """
    if mode == "train":
        train()
    elif mode == 'inference':
        # NOTE: pickle.load can execute arbitrary code; this file must come
        # from a trusted source.
        with open("/aiml/code/word_dict", "rb") as dict_file:
            word_dict = pickle.load(dict_file)

        image_path = '/aiml/data/'
        top_indices = new_inference(image_path)

        # The context manager guarantees the result is flushed and the file
        # closed even if a lookup fails part-way through.
        with open("/aiml/result/result.txt", "w") as result_file:
            for candidates in top_indices:
                # candidates holds the three best class indices; only the
                # best one is written.
                result_file.write(word_dict[str(candidates[0])])

# Script entry point: main() runs only when this file is executed directly,
# not when it is imported.
if __name__ == "__main__":

#    tf.app.run()

    main()

cnn汉字识别 tensorflow demo的更多相关文章

深度学习之卷积神经网络CNN及tensorflow代码实例
深度学习之卷积神经网络CNN及tensorflow代码实例什么是卷积? 卷积的定义从数学上讲,卷积就是一种运算,是我们学习高等数学之后,新接触的一种运算,因为涉及到积分.级数,所以看起来觉得很复杂 ...
深度学习之卷积神经网络CNN及tensorflow代码实现示例
深度学习之卷积神经网络CNN及tensorflow代码实现示例 2017年05月01日 13:28:21 cxmscb 阅读数 151413更多分类专栏: 机器学习深度学习机器学习版权声明 ...
android应用市场、社区客户端、漫画App、TensorFlow Demo、歌词显示、动画效果等源码
Android精选源码 MVP架构Android应用市场项目 android刻度盘控件源码 Android实现一个社区客户端 android商品详情页上拉查看详情基于RxJava+Retrofit2 ...
TensorFlow —— Demo
import tensorflow as tf g = tf.Graph() # 创建一个Graph对象在模型中有两个"全局"风格的Variable对象:global_step ...
TensorFlow 在android上的Demo（1）
转载时请注明出处: 修雨轩陈系统环境说明: ------------------------------------ 操作系统 : ubunt 14.03 _ x86_64 操作系统内存: 8GB ...
tensorflow学习之（十）使用卷积神经网络（CNN）分类手写数字0-9
#卷积神经网络cnn import tensorflow as tf from tensorflow.examples.tutorials.mnist import input_data #数据包,如 ...
TensorFlow Lite demo——就是为嵌入式设备而存在的，底层调用NDK神经网络API，注意其使用的tf model需要转换下，同时提供java和C++ API，无法使用tflite的见后
Introduction to TensorFlow Lite TensorFlow Lite is TensorFlow’s lightweight solution for mobile and ...
Caffe、TensorFlow、MXnet三个开源库对比
库名称开发语言支持接口安装难度(ubuntu) 文档风格示例支持模型上手难易 Caffe c++/cuda c++/python/matlab *** * *** CNN ** MXNet ...
YOLO2：实时目标检测视频教程，视频演示， Android Demo ，开源教学项目，论文。
实时目标检测和分类 GIF 图: 视频截图: 论文: https://arxiv.org/pdf/1506.02640.pdf https://arxiv.org/pdf/1612.08242.pdf ...

随机推荐

Android开发——内存优化图片处理
8. 用缓存避免内存泄漏很常见的一个例子就是图片的三级缓存结构,分别为网络缓存,本地缓存以及内存缓存.在内存缓存逻辑类中,通常会定义这样的集合类. private HashMap<Strin ...
4.【nuxt起步】-具体练习一个h5实例
目标地址:https://www.vyuan8.com/vyuan/plugin.php?id=vyuan_fangchan&module=fangchan&pid=10079& ...
webpack入门（六）——html-webpack-plugin
html-webpack-plugin 该插件可以简化创建调用webpack bundles的html文件.在每次编译后,文件名会包含有hash值的bundles 特别有用.你可以让插件为您生成一个H ...
c语言函数---I
函数名: imagesize 功能: 返回保存位图像所需的字节数用法: unsigned far imagesize(int left, int top, int right, int bott ...
flex操作XML，强力总结帖
初始化XML对象 XML对象可以代表一个XML元素.属性.注释.处理指令或文本元素.在ActionScript 3.0中我们可以直接将XML数据赋值给变量: var myXML:XML = &l ...
每日一支TED——帕特里夏·瑞安：不要固执于英语
瑞安讲述了她在科威特教学英语30年最大的关于语言的一个感受:英语在迅速的在全世界传播,而其它的语言在逐渐的消失. 瑞安想要说的是.拥有一种国际性的语言,大家都能够理解,让全部人的 ...
【Access2007】Access2007的打开方式
Access2007提供了多种打开方式.只读与非只读就不用说了,就是能编辑与不能编辑的差别.是否以独占的方式打开是Access2007的打开方式的核心.这里什么都没有写的打开是指以"共 ...
SpringBoot学习之pom文件常见错误
错误1 上图的错误需要添加jar包的版本号,springboot自动生成不需要添加版本号,手动添加的需要指定版本号. 所以pom.xml如下方式:
UUID随机字符串
public static void main(String[] args){ System.out.println(UUID.randomUUID().toString()); } //输出:698 ...
Cocos2d-x 3.0的启动流程
Cocos2d-x 3.0变动非常大,包括启动的方式.我看了下,对android的启动总结如下: Java方面: AppActivity继承Cocos2dxActivity Coco ...

cnn汉字识别 tensorflow demo

cnn汉字识别 tensorflow demo的更多相关文章

随机推荐

热门专题