CNN学习（三）—Tensorflow 进行MNIST手写体识别

最新推荐文章于 2024-10-15 15:12:58 发布

原创最新推荐文章于 2024-10-15 15:12:58 发布 · 1.1k 阅读

8 ·

CC 4.0 BY-SA版权

文章标签：

#cnn #tensorflow #mnist手写体数字识别

Python-杂篇同时被 3 个专栏收录

31 篇文章

订阅专栏

TensorFlow 学习

24 篇文章

订阅专栏

机器学习-实践

20 篇文章

订阅专栏

本文构建了一个六层的卷积神经网络（CNN）并应用于MNIST手写数字数据集的训练中，通过详细的代码实现展示了从搭建网络结构、定义损失函数到训练过程的全部细节。

前言

本节，我们牛刀小试一下，使用TensorFlow构建一个简单的六层CNN网络，对MNIST手写体数据集进行训练。

网络结构：

这里写图片描述

代码

__author__ = 'jmh081701'
#coding:utf-8
import  tensorflow as tf
import numpy as np
import pandas as pd
from tensorflow.examples.tutorials.mnist import input_data
# Load the MNIST data set from the local 'MNIST_data' directory with one-hot
# encoded labels. According to the original author's notes,
# mnist.train.images has shape (55000, 784) and mnist.train.labels has shape
# (55000, 10); mnist.test holds the test split. The flat 784-value rows have
# to be reshaped into conv2d's 4-D input layout before use.
mnist = input_data.read_data_sets('MNIST_data', one_hot=True)

# Graph inputs. The leading dimension is None so that the number of samples
# per feed is decided at run time.
# imageX: flattened input images, 784 values per sample.
imageX = tf.placeholder(tf.float32, [None, 784])
# labelY: one-hot labels matching imageX, 10 classes per sample.
labelY = tf.placeholder(tf.float32, [None, 10])
# Dropout keep-probability input, currently disabled:
# keep_prob = tf.placeholder(tf.float32)
with tf.name_scope('C1'):
    # C1 convolution weights: 5x5 kernels, 1 input channel, 32 output
    # channels (i.e. 32 kernels), plus one bias per output channel.
    c1_kernel_init = tf.truncated_normal([5, 5, 1, 32], stddev=0.1)
    W_C1 = tf.Variable(c1_kernel_init, dtype=tf.float32)
    c1_bias_init = tf.constant(0.1, dtype=tf.float32, shape=[32])
    b_C1 = tf.Variable(c1_bias_init)

    # conv2d wants a 4-D input, so turn each flat 784-value row back into a
    # 28x28 single-channel image; -1 lets the batch size be inferred.
    X = tf.reshape(imageX, [-1, 28, 28, 1])

    # conv2d arguments:
    #   input:   [batch, height, width, channels]
    #   filter:  [filter_height, filter_width, in_channels, out_channels]
    #   strides: step taken along each of the four input axes
    conv_C1 = tf.nn.conv2d(X, W_C1, strides=[1, 1, 1, 1], padding='SAME')
    featureMap_C1 = conv_C1 + b_C1
    # C1 convolution done.

with tf.name_scope('f'):
    # Activation applied to the C1 feature maps.
    relu_C1 = tf.nn.relu(featureMap_C1)

with tf.name_scope('S2'):
    # S2: 2x2 max pooling with stride 2 over the two spatial axes.
    s2_window = [1, 2, 2, 1]
    featureMap_S2 = tf.nn.max_pool(
        relu_C1,
        ksize=s2_window,
        strides=s2_window,
        padding='SAME',
    )
with tf.name_scope('C3'):
    # C3 convolution: 5x5 kernels mapping the 32 channels of S2 to 64.
    c3_kernel_init = tf.truncated_normal([5, 5, 32, 64], stddev=0.1)
    W_C3 = tf.Variable(c3_kernel_init)
    c3_bias_init = tf.constant(0.1, dtype=tf.float32, shape=[64])
    b_C3 = tf.Variable(c3_bias_init)
    conv_C3 = tf.nn.conv2d(featureMap_S2, W_C3, strides=[1, 1, 1, 1], padding='SAME')
    featureMap_C3 = conv_C3 + b_C3

with tf.name_scope('f'):
    # Activation applied to the C3 feature maps.
    relu_C3 = tf.nn.relu(featureMap_C3)

with tf.name_scope('S4'):
    # S4: 2x2 max pooling with stride 2 over the two spatial axes.
    s4_window = [1, 2, 2, 1]
    featureMap_S4 = tf.nn.max_pool(
        relu_C3,
        ksize=s4_window,
        strides=s4_window,
        padding='SAME',
    )
# End of the C3 / S4 stage.
with tf.name_scope('flat'):
    # Flatten every sample's S4 output into one row of 7*7*64 values;
    # -1 lets the batch size be inferred.
    fetureMap_flatter = tf.reshape(featureMap_S4, [-1, 7 * 7 * 64])

with tf.name_scope('fullcont'):
    # F5: fully connected layer from 7*7*64 inputs to 1024 ReLU units.
    f5_weight_init = tf.truncated_normal([7 * 7 * 64, 1024], stddev=0.1)
    W_F5 = tf.Variable(f5_weight_init)
    f5_bias_init = tf.constant(0.1, dtype=tf.float32, shape=[1024])
    b_F5 = tf.Variable(f5_bias_init)
    pre_activation_F5 = tf.matmul(fetureMap_flatter, W_F5) + b_F5
    out_F5 = tf.nn.relu(pre_activation_F5)
    # Dropout on the F5 output, currently disabled:
    # out_F5_drop = tf.nn.dropout(out_F5, keep_prob)
# Fully connected layer done.
with tf.name_scope('output'):
    # Output layer: 1024 F5 activations -> 10 class scores.
    W_OUTPUT=tf.Variable(tf.truncated_normal([1024,10],stddev=0.1))
    b_OUTPUT=tf.Variable(tf.constant(0.1,tf.float32,shape=[10]))
    # Keep the un-normalised scores (logits) as their own tensor so the loss
    # can be computed from them directly.
    logits=tf.matmul(out_F5,W_OUTPUT)+b_OUTPUT
    # Class probabilities, used for prediction.
    predictY=tf.nn.softmax(logits)

# Cross-entropy loss, summed over every sample in the fed batch.
# The previous form, -sum(labelY*log(softmax(...))), evaluates log(0) as soon
# as one predicted probability underflows to zero, which turns the loss into
# NaN. The fused op computes the same quantity from the logits in a
# numerically stable way. The outer reduce_mean of the old expression acted
# on an already-scalar sum and was a no-op, so reduce_sum alone keeps the
# loss on the same scale as before.
loss=tf.reduce_sum(tf.nn.softmax_cross_entropy_with_logits(labels=labelY,logits=logits))
# Both summaries are registered under the name 'loss', as before.
tf.summary.histogram('loss',loss)
tf.summary.scalar('loss',loss)
# Training step: minimise the loss with the Adam optimizer.
learning_rate = 1e-4
optimizer = tf.train.AdamOptimizer(learning_rate=learning_rate)
train_op = optimizer.minimize(loss)
# Predicted class index per sample: position of the largest probability.
# tf.argmax / tf.cast replace the deprecated tf.arg_max / tf.to_float aliases.
y_pred=tf.argmax(predictY,1)
# True where the predicted index equals the index of the one-hot label.
bool_pred=tf.equal(tf.argmax(labelY,1),y_pred)

# Accuracy: fraction of samples in the fed batch that were classified
# correctly (this is the correct-rate, not the error rate).
right_rate=tf.reduce_mean(tf.cast(bool_pred,tf.float32))

# Saver used by load_model / save_model below. It is created after the
# optimizer so that the variables the optimizer adds are part of the
# checkpoint as well.
saver=tf.train.Saver()
def load_model(sess,dir,modelname):
    """Restore the checkpoint named *modelname* from *dir* into *sess*.

    Nothing is restored (and nothing is printed) when *dir* holds no
    checkpoint state, so a first run simply keeps the freshly initialised
    variables.

    Args:
        sess: session whose variables are overwritten by the checkpoint.
        dir: directory containing the checkpoint files.
        modelname: checkpoint file prefix, as passed to save_model.
    """
    import os

    ckpt=tf.train.get_checkpoint_state(dir)
    if ckpt and ckpt.model_checkpoint_path:
        print("*"*30)
        print("load lastest model......")
        # Build the path with os.path.join instead of a hard-coded ".\\"
        # fragment: the old form only resolved on Windows and did not match
        # the prefix written by save_model.
        saver.restore(sess,os.path.join(dir,modelname))
        print("*"*30)

def save_model(sess,dir,modelname):
    """Save the variables of *sess* as checkpoint *modelname* inside *dir*.

    Args:
        sess: session holding the variables to save.
        dir: target directory; it is created when it does not exist yet.
        modelname: checkpoint file prefix.
    """
    import os

    # Create the directory up front so the first save of a fresh run does not
    # fail after training has already been done.
    if not os.path.isdir(dir):
        os.makedirs(dir)
    # os.path.join yields the same prefix as dir+modelname when dir already
    # ends with a separator, and a correct one when it does not.
    saver.save(sess,os.path.join(dir,modelname))
# Checkpoint directory and checkpoint file prefix.
# The path literal is kept exactly as written: it is a raw string, so the
# doubled backslashes are literal characters (a raw string cannot end with a
# single backslash).
dir=r"C:\\Users\\jmh081701\\Documents\\TempWorkStation\\python\\tensorflow\\cnnmodel\\"
modelname="cnnmodel"
with tf.Session() as sess:
    init =tf.global_variables_initializer()
    sess.run(init)
    step=1
    # Early stopping: accuracy is accumulated over sameMAX consecutive
    # evaluations; training stops when the latest accuracy matches the mean
    # of that window, i.e. accuracy has stopped moving.
    sameMAX=10
    sameStep=0
    accSum=0
    # Accuracy is measured on 1000 test images, so 1e-3 is one image. Exact
    # float equality against a mean would practically never hold.
    plateau_tol=1e-3
    # Number of 100-sample batches that make up one pass over the training set.
    batch_epoch=mnist.train.num_examples//100
    # Resume from an existing checkpoint if there is one.
    load_model(sess,dir,modelname)

    writer=tf.summary.FileWriter(".//cnngrahph",tf.get_default_graph())
    merged=tf.summary.merge_all()
    try:
        while True:
            if(step%batch_epoch==0):
                # Once per pass over the training set: evaluate instead of train.
                test_img,test_lab=mnist.test.next_batch(1000)
                #test_img=mnist.test.images
                #test_lab=mnist.test.labels
                acc=sess.run(right_rate,{imageX:test_img,labelY:test_lab})
                # Log the accuracy as a plain summary value. Calling
                # tf.summary.histogram here added a new op to the graph on
                # every evaluation and the op was never run, so nothing was
                # ever written.
                acc_summary=tf.Summary(value=[tf.Summary.Value(tag='rightrate',simple_value=float(acc))])
                writer.add_summary(acc_summary,step)
                print({"!!!!!!!!!!!!!!testing:"+str(step):acc})
                accSum=accSum+acc
                # Count this evaluation. Without the increment the window
                # test below ran on every evaluation and compared acc with
                # acc/sameMAX, which only matches when acc is 0.
                sameStep=sameStep+1
                if(sameStep==sameMAX):
                    if(abs(acc-accSum/sameMAX)<plateau_tol):
                        print({step:acc})
                        break
                    # Not converged yet: start a new window.
                    accSum=0
                    sameStep=0
                step=step+1
                save_model(sess,dir,modelname)
                continue
            image_batch,label_batch=mnist.train.next_batch(100)
            # Only evaluate the merged summaries on the steps that are
            # actually written out (every 20th batch).
            log_summary=(step%20==0)
            fetches=[loss,train_op]
            if log_summary:
                fetches.append(merged)
            results=sess.run(fetches,feed_dict={imageX:image_batch,labelY:label_batch})
            print(step,results[0])
            if log_summary:
                writer.add_summary(results[2],step)
            step=step+1
        save_model(sess,dir,modelname)
        # Final accuracy on the complete test set.
        print(sess.run([right_rate],feed_dict={imageX:mnist.test.images,labelY:mnist.test.labels}))
    finally:
        # Flush and release the event file even when training is interrupted.
        writer.close()
# NOTE: when randomly initialising the parameters, the standard deviation must
# not be too large, otherwise computing the log easily produces NaN.

运行结果

···
547 17.2985
548 10.7501
549 22.6312
{'!!!!!!!!!!!!!!testing:550': 0.95200002}
551 14.7252
552 6.515
553 8.9048
554 7.67524
···
1098 11.3033
1099 8.11119
{'!!!!!!!!!!!!!!testing:1100': 0.977}
1101 8.80489
1102 6.89097
···
···
第一轮跑完后，正确率就达到了95.2%；
第二轮跑完后，正确率达到97.7%；
到第10轮时，正确率可达99.0%以上。