三种方法实现MNIST 手写数字识别

MNIST数据集下载：

import tensorflow as tf

from tensorflow.examples.tutorials.mnist import input_data

# Read the MNIST data sets, using "MNIST_data/" as the data directory.
mnist = input_data.read_data_sets("MNIST_data/", one_hot=True) # one_hot: one-hot encoding, i.e. exactly one position of each label is 1 and all the others are 0

1 使用逻辑回归：

import tensorflow as tf

# 导入数据集

#from tensorflow.examples.tutorials.mnist import input_data

# Softmax (multinomial logistic) regression on MNIST.
# `input_data` is the module imported earlier in this file.
mnist = input_data.read_data_sets("MNIST_data/", one_hot=True)

# Number of examples per gradient step.
batch_size = 50

# Inputs: x holds flattened images (784 values each), y the one-hot labels
# (10 classes). The leading None lets any batch size be fed.
x = tf.placeholder(tf.float32, [None, 784])
y = tf.placeholder(tf.float32, [None, 10])

# Model parameters: [batch, 784] x W[784, 10] + b[10] -> [batch, 10].
W = tf.Variable(tf.zeros([784, 10]))
b = tf.Variable(tf.zeros([10]))

# Unnormalised class scores, and the softmax probabilities used for prediction.
logits = tf.matmul(x, W) + b
pred = tf.nn.softmax(logits)

# Cross-entropy loss. It is computed from the logits rather than as
# -sum(y * log(softmax)): the hand-written form yields NaN as soon as a
# probability underflows to 0, and the fused op is what the other two
# scripts in this file use.
cost = tf.reduce_mean(
    tf.nn.softmax_cross_entropy_with_logits(logits=logits, labels=y))

# Plain gradient descent with learning rate 0.01.
optimizer = tf.train.GradientDescentOptimizer(0.01).minimize(cost)

# Accuracy: fraction of examples whose most probable class matches the label.
# Built with the rest of the graph instead of inside the session.
correct = tf.equal(tf.argmax(pred, 1), tf.argmax(y, 1))
accuracy = tf.reduce_mean(tf.cast(correct, tf.float32))

# Op that initialises all variables.
init = tf.global_variables_initializer()

with tf.Session() as sess:
    sess.run(init)

    # Batches per epoch; constant, so computed once outside the epoch loop.
    total_batch = mnist.train.num_examples // batch_size

    for epoch in range(25):
        avg_cost = 0.
        for _ in range(total_batch):
            batch_xs, batch_ys = mnist.train.next_batch(batch_size)
            # One run performs the update and returns the loss it was taken
            # on, avoiding a second forward pass over the same batch.
            _, batch_cost = sess.run([optimizer, cost],
                                     {x: batch_xs, y: batch_ys})
            # Accumulate the mean loss over the epoch.
            avg_cost += batch_cost / total_batch

        # Report every fifth epoch.
        if (epoch+1) % 5 == 0:
            print("Epoch:", '%04d' % (epoch+1), "cost=", "{:.9f}".format(avg_cost))

    print("运行完成")

    # Accuracy on the full test set.
    print("正确率:", sess.run(accuracy, {x: mnist.test.images, y: mnist.test.labels}))

结果：

Extracting MNIST_data/train-images-idx3-ubyte.gz

Extracting MNIST_data/train-labels-idx1-ubyte.gz

Extracting MNIST_data/t10k-images-idx3-ubyte.gz

Extracting MNIST_data/t10k-labels-idx1-ubyte.gz

Epoch: 0005 cost= 0.394426425

Epoch: 0010 cost= 0.344705163

Epoch: 0015 cost= 0.323814137

Epoch: 0020 cost= 0.311426675

Epoch: 0025 cost= 0.302971779

运行完成

正确率: 0.9188

2 使用神经网络：

import tensorflow as tf

import numpy as np

from tensorflow.examples.tutorials.mnist import input_data

def init_weights(shape):
    """Return a new tf.Variable of `shape` filled with random-normal values (stddev 0.01)."""
    initial_values = tf.random_normal(shape, stddev=0.01)
    return tf.Variable(initial_values)

def model(X, w_h, w_o):
    """Build a one-hidden-layer perceptron and return its output scores.

    X is multiplied by w_h and passed through a sigmoid; the result is then
    multiplied by w_o. No softmax is applied here, because the loss used with
    this model applies it to the returned logits.
    """
    hidden_pre_activation = tf.matmul(X, w_h)
    hidden = tf.nn.sigmoid(hidden_pre_activation)
    logits = tf.matmul(hidden, w_o)
    return logits

# Train and evaluate the one-hidden-layer perceptron on MNIST.
mnist = input_data.read_data_sets("MNIST_data/", one_hot=True)
trX, trY = mnist.train.images, mnist.train.labels
teX, teY = mnist.test.images, mnist.test.labels

# Number of training examples per gradient step.
batch_size = 128

# Inputs: flattened images (784 values) and one-hot labels (10 classes).
X = tf.placeholder("float", [None, 784])
Y = tf.placeholder("float", [None, 10])

# Weights: 784 inputs -> 625 hidden units -> 10 output classes.
w_h = init_weights([784, 625])
w_o = init_weights([625, 10])

# Logits for the current batch.
py_x = model(X, w_h, w_o)

# Mean softmax cross-entropy, minimised with gradient descent (learning rate 0.05).
cost = tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(logits=py_x, labels=Y))
train_op = tf.train.GradientDescentOptimizer(0.05).minimize(cost)

# Predicted class = index of the largest logit.
predict_op = tf.argmax(py_x, 1)

# True test classes; constant, so computed once outside the epoch loop.
test_classes = np.argmax(teY, axis=1)

# Launch the graph in a session.
with tf.Session() as sess:
    # Variables must be initialised before use.
    tf.global_variables_initializer().run()

    for i in range(100):
        # Step through the whole training set, including the final partial
        # batch. The previous zip-of-ranges pairing stopped at the last full
        # multiple of the batch size, and since the data is not shuffled the
        # same trailing examples were never trained on. Slicing past the end
        # of the array simply yields the shorter remainder.
        for start in range(0, len(trX), batch_size):
            end = start + batch_size
            sess.run(train_op, feed_dict={X: trX[start:end], Y: trY[start:end]})

        # Epoch index and accuracy on the full test set.
        print(i, np.mean(test_classes ==
                         sess.run(predict_op, feed_dict={X: teX})))

结果：（原文未给出本节的运行结果）

3 使用卷积神经网络：

import tensorflow as tf

import numpy as np

from tensorflow.examples.tutorials.mnist import input_data

# Number of training examples fed to each training step.
batch_size = 128

# Number of test examples sampled for each per-epoch accuracy report.
test_size = 256

def init_weights(shape):
    """Create a tf.Variable of the given shape, initialised from a normal distribution with stddev 0.01."""
    random_init = tf.random_normal(shape, stddev=0.01)
    weights = tf.Variable(random_init)
    return weights

def model(X, w, w2, w3, w4, w_o, p_keep_conv, p_keep_hidden):
    """Build the convolutional network and return its output logits.

    Three conv -> ReLU -> 2x2 max-pool stages (kernels w, w2, w3) are followed
    by a fully connected ReLU layer (w4) and a linear output layer (w_o).
    Dropout with keep probability p_keep_conv is applied after the first two
    stages and after flattening the third; p_keep_hidden is used after the
    fully connected layer.

    The shapes noted in the comments assume 28x28x1 inputs and the kernel
    shapes this file passes in.
    """
    unit_strides = [1, 1, 1, 1]
    pool_window = [1, 2, 2, 1]

    def conv_relu_pool(inputs, kernel):
        # Same-padded convolution, ReLU, then 2x2 max-pooling with stride 2.
        convolved = tf.nn.conv2d(inputs, kernel,
                                 strides=unit_strides, padding='SAME')
        activated = tf.nn.relu(convolved)
        return tf.nn.max_pool(activated, ksize=pool_window,
                              strides=pool_window, padding='SAME')

    stage1 = conv_relu_pool(X, w)                    # (?, 14, 14, 32)
    stage1 = tf.nn.dropout(stage1, p_keep_conv)

    stage2 = conv_relu_pool(stage1, w2)              # (?, 7, 7, 64)
    stage2 = tf.nn.dropout(stage2, p_keep_conv)

    stage3 = conv_relu_pool(stage2, w3)              # (?, 4, 4, 128)

    # Flatten to the input width expected by the fully connected weights.
    flat_width = w4.get_shape().as_list()[0]
    flattened = tf.reshape(stage3, [-1, flat_width])  # (?, 2048)
    flattened = tf.nn.dropout(flattened, p_keep_conv)

    hidden = tf.nn.relu(tf.matmul(flattened, w4))
    hidden = tf.nn.dropout(hidden, p_keep_hidden)

    # Linear output layer; softmax is left to the loss function.
    return tf.matmul(hidden, w_o)

# Train and evaluate the convolutional network on MNIST.
mnist = input_data.read_data_sets("MNIST_data/", one_hot=True)
trX, trY = mnist.train.images, mnist.train.labels
teX, teY = mnist.test.images, mnist.test.labels

# Reshape the flat images into 28x28 single-channel inputs for conv2d.
trX = trX.reshape(-1, 28, 28, 1)  # 28x28x1 input img
teX = teX.reshape(-1, 28, 28, 1)  # 28x28x1 input img

X = tf.placeholder("float", [None, 28, 28, 1])
Y = tf.placeholder("float", [None, 10])

w = init_weights([3, 3, 1, 32])       # 3x3x1 conv, 32 outputs
w2 = init_weights([3, 3, 32, 64])     # 3x3x32 conv, 64 outputs
w3 = init_weights([3, 3, 64, 128])    # 3x3x64 conv, 128 outputs
w4 = init_weights([128 * 4 * 4, 625]) # FC 128 * 4 * 4 inputs, 625 outputs
w_o = init_weights([625, 10])         # FC 625 inputs, 10 outputs (labels)

# Dropout keep probabilities, fed at run time so that training and
# evaluation can use different values.
p_keep_conv = tf.placeholder("float")
p_keep_hidden = tf.placeholder("float")

# Logits for the current batch.
py_x = model(X, w, w2, w3, w4, w_o, p_keep_conv, p_keep_hidden)

# Mean softmax cross-entropy, minimised with RMSProp.
cost = tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(logits=py_x, labels=Y))
train_op = tf.train.RMSPropOptimizer(0.001, 0.9).minimize(cost)

# Predicted class = index of the largest logit.
predict_op = tf.argmax(py_x, 1)

# Launch the graph in a session.
with tf.Session() as sess:
    # Variables must be initialised before use.
    tf.global_variables_initializer().run()

    for i in range(10):
        # Step through the whole training set, including the final partial
        # batch. The previous zip-of-ranges pairing stopped at the last full
        # multiple of batch_size, and since the data is not shuffled the same
        # trailing examples were never trained on. Slicing past the end of the
        # array simply yields the shorter remainder.
        for start in range(0, len(trX), batch_size):
            end = start + batch_size
            sess.run(train_op, feed_dict={X: trX[start:end], Y: trY[start:end],
                                          p_keep_conv: 0.8, p_keep_hidden: 0.5})

        # Evaluate on a random sample of test_size test examples.
        test_indices = np.arange(len(teX))
        np.random.shuffle(test_indices)
        test_indices = test_indices[0:test_size]

        # Dropout is disabled (keep probability 1.0) for evaluation. Y is not
        # fed because predict_op does not depend on the labels.
        print(i, np.mean(np.argmax(teY[test_indices], axis=1) ==
                         sess.run(predict_op, feed_dict={X: teX[test_indices],
                                                         p_keep_conv: 1.0,
                                                         p_keep_hidden: 1.0})))

结果：

0 0.9453125

1 0.9765625

2 0.9921875

3 0.98828125

4 0.984375

5 0.9921875

6 0.984375

7 0.9921875

8 0.98828125

9 0.99609375

三种方法实现MNIST 手写数字识别的更多相关文章

【TensorFlow-windows】(三) 多层感知器进行手写数字识别（mnist）
主要内容: 1.基于多层感知器的mnist手写数字识别(代码注释) 2.该实现中的函数总结平台: 1.windows 10 64位 2.Anaconda3-4.2.0-Windows-x86_64. ...
基于tensorflow的MNIST手写数字识别（二）--入门篇
http://www.jianshu.com/p/4195577585e6 基于tensorflow的MNIST手写字识别(一)--白话卷积神经网络模型基于tensorflow的MNIST手写数字识 ...
Android+TensorFlow+CNN+MNIST 手写数字识别实现
Android+TensorFlow+CNN+MNIST 手写数字识别实现 SkySeraph 2018 Email:skyseraph00#163.com 更多精彩请直接访问SkySeraph个人站 ...
Tensorflow之MNIST手写数字识别：分类问题（1）
一.MNIST数据集读取 one hot 独热编码独热编码是一种稀疏向量,其中:一个向量设为1,其他元素均设为0.独热编码常用于表示拥有有限个可能值的字符串或标识符优点: 1.将离散特征的取值扩展 ...
基于TensorFlow的MNIST手写数字识别-初级
一:MNIST数据集下载地址 MNIST是一个包含很多手写数字图片的数据集,一共4个二进制压缩文件分别是test set images,test set labels,training se ...
mnist手写数字识别——深度学习入门项目（tensorflow+keras+Sequential模型）
前言今天记录一下深度学习的另外一个入门项目——<mnist数据集手写数字识别>,这是一个入门必备的学习案例,主要使用了tensorflow下的keras网络结构的Sequential模型 ...
Pytorch入门——手把手教你MNIST手写数字识别
MNIST手写数字识别教程要开始带组内的小朋友了,特意出一个Pytorch教程来指导一下 [!] 这里是实战教程,默认读者已经学会了部分深度学习原理,若有不懂的地方可以先停下来查查资料目录 MNI ...
TensorFlow——MNIST手写数字识别
MNIST手写数字识别 MNIST数据集介绍和下载:http://yann.lecun.com/exdb/mnist/ 一.数据集介绍: MNIST是一个入门级的计算机视觉数据集下载下来的数据集 ...
Tensorflow实现MNIST手写数字识别
之前我们讲了神经网络的起源.单层神经网络.多层神经网络的搭建过程.搭建时要注意到的具体问题.以及解决这些问题的具体方法.本文将通过一个经典的案例:MNIST手写数字识别,以代码的形式来为大家梳理一遍神 ...

随机推荐

php 连接mysql 主机 localhost，显示 No such file or directory
打开 php.ini文件,找到这1行 mysql.default_socket 然后将它修改为 mysql.default_socket=/path/to/mysql.sock /path/to/my ...
python 获取年月日时分秒获取当前时间 datetime函数
import datetime#取当前时间print(datetime.datetime.now())#取年print(datetime.datetime.now().year)#取月print(da ...
Web响应的提高
想象一下,如果用户在页面上触发一个点击事件,结果反应延迟比较明显,这将是一个令人沮丧的事情.而造成这个问题的原因就是响应延迟. 浏览器UI 线程大家都知道浏览器的UI线程,大多数浏览器都是一个独立的 ...
七牛云-C#SDK-上传-前期准备
1.创建一个asp.net core MVC 程序(这里随便) 这是一个空的程序 2.创建UploadController 3.添加引用 Install-Package Newtonsoft.Json ...
gulp 安装与使用
一.Gulp 是基于node.js 流(stream)的一个前端自动化构建工具,可以使用它构建自动化工作流程,简化我们工作量,让我们把重点放在功能的开发上,从而提高我们的开发效率和工作质量我们可以用 ...
Core Data could not fulfill a fault
做项目的时候在iOS4系统遇到过这样一个crash,console显示的错误信息是"Core Data could not fulfill a fault". 字面意思是什么?&q ...
Spring随笔-bean装配-自动装配
Spring提供了三种装配方式 1.XML文件进行显式装配 2.java中进行显示装配 3.自动化装配 1.自动化装配的两种实现方式 1.组件扫描:Spring会自动发现应用上下文中创建的bean 2 ...
Typora--终于找到一个能够解决将csdn文章同步到hexo的完美编辑器（解决csdn图片防盗链导致无法直接复制文章的问题）。
文章目录需求背景新宠告诉我,我的名字叫什么?大声点我听不见~ 页面神奇之处看得见的优点如何设置项目根目录如何显示图片? 于是最终操作流程个人博客:https://mmmmmm.me ...
记录一次像github开源项目提交pull request（Hexo Next）
文章目录背景 fork到自己github 像往常一样的操作克隆到本地与上游建立连接创建分支修改项目代码收尾工作提交pull request 个人博客:https://mmmmmm.me ...
20140421 常量指针与指针常量； const指针； reinterpret_cast ；const_cast作用
1.reinterpret_cast<type_id>(表达式)的作用: type-id 必须是一个指针.引用.算术类型.函数指针或者成员指针.它可以把一个指针转换成一个整数,也可以把一个 ...

三种方法实现MNIST 手写数字识别

三种方法实现MNIST 手写数字识别的更多相关文章

随机推荐

热门专题