Softmax回归（使用theano）

 # coding:utf8

 import numpy as np

 import cPickle

 import theano

 import os

 import theano.tensor as T

 class SoftMax:
     """Softmax (multinomial logistic) regression trained with Theano.

     Attributes:
         MAXT: maximum number of training epochs.
         step: gradient-descent learning rate.
         landa: weight-decay coefficient applied to ``0.5 * sum(theta ** 2)``.
         theta: model parameters of shape (n_features, n_classes).  After
             ``process_train`` this is a Theano shared variable; after
             ``load_theta`` it is whatever object the pickle file contained
             (presumably the ndarray written by ``process_train``).
     """

     def __init__(self, MAXT=50, step=0.15, landa=0):
         self.MAXT = MAXT
         self.step = step
         # Original author's note: the weight-decay term did not improve
         # accuracy in this experiment, hence the default of 0.
         self.landa = landa
         # Filled in by process_train() or load_theta().
         self.theta = None

     def load_theta(self, datapath):
         """Load previously pickled parameters from ``datapath``.

         NOTE(security): unpickling can execute arbitrary code; only load
         files from a trusted source.
         """
         with open(datapath, 'rb') as f:
             self.theta = cPickle.load(f)

     @staticmethod
     def _batch_layout(n_samples, batch_size):
         """Return ``(batch_size, n_batches)`` for ``n_samples`` rows.

         The batch size is clamped to the number of samples so that small
         data sets still yield one batch.  Samples beyond
         ``n_batches * batch_size`` are not visited (floor division).

         Raises:
             ValueError: if there are no samples or ``batch_size`` < 1.
         """
         if n_samples <= 0:
             raise ValueError("at least one sample is required")
         if batch_size <= 0:
             raise ValueError("batch_size must be a positive integer")
         batch_size = min(batch_size, n_samples)
         return batch_size, n_samples // batch_size

     @staticmethod
     def _as_shared(data, label):
         """Wrap ``data``/``label`` in Theano shared variables.

         Labels are stored as floatX and cast back to int32 symbolically;
         this follows the Theano tutorial idiom for keeping shared data in
         floatX.
         """
         shared_x = theano.shared(
             np.asarray(data, dtype=theano.config.floatX))
         shared_y = theano.shared(
             np.asarray(label, dtype=theano.config.floatX))
         return shared_x, T.cast(shared_y, 'int32')

     def _theta_value(self):
         """Return the current parameters as a NumPy array.

         Raises:
             ValueError: if no parameters have been trained or loaded.
         """
         theta = getattr(self, 'theta', None)
         if theta is None:
             raise ValueError(
                 "no parameters: call process_train() or load_theta() first")
         # A Theano shared variable exposes get_value(); a plain array
         # (e.g. loaded from a pickle) does not.
         get_value = getattr(theta, 'get_value', None)
         if get_value is not None:
             return get_value()
         return np.asarray(theta)

     def process_train(self, data, label, typenum, batch_size=500):
         """Fit the model with minibatch gradient descent.

         Args:
             data: 2-D array-like, one sample per row.
             label: 1-D array-like of integer class indices, one per sample.
             typenum: number of classes.
             batch_size: rows per minibatch (clamped to the sample count).

         Returns:
             The trained parameters as an ndarray of shape
             (n_features, typenum).  They are also pickled to
             ``data/softmax.pkl`` unless that file already exists.

         Raises:
             ValueError: on empty input, a non-positive ``batch_size`` or
                 mismatching ``data``/``label`` lengths.
         """
         data = np.asarray(data, dtype=theano.config.floatX)
         label = np.asarray(label)
         if label.shape[0] != data.shape[0]:
             raise ValueError("data and label must have the same length")
         valuenum = data.shape[1]
         batch_size, batches = self._batch_layout(data.shape[0], batch_size)
         data, label = self._as_shared(data, label)

         x = T.matrix('x')
         y = T.ivector('y')
         index = T.lscalar()
         theta = theano.shared(
             value=np.zeros((valuenum, typenum), dtype=theano.config.floatX),
             name='theta', borrow=True)
         hx = T.nnet.softmax(T.dot(x, theta))
         # Mean negative log-likelihood of the true class plus weight decay.
         cost = (-T.mean(T.log(hx)[T.arange(y.shape[0]), y])
                 + 0.5 * self.landa * T.sum(theta ** 2))
         g_theta = T.grad(cost, theta)
         updates = [(theta, theta - self.step * g_theta)]
         train_model = theano.function(
             inputs=[index], outputs=cost, updates=updates,
             givens={
                 x: data[index * batch_size: (index + 1) * batch_size],
                 y: label[index * batch_size: (index + 1) * batch_size],
             },
             allow_input_downcast=True)

         lastcostJ = np.inf
         epoch = 0
         while epoch < self.MAXT:
             epoch += 1
             # Costs are collected per epoch so the stopping test compares
             # this epoch's mean with the previous epoch's mean rather than
             # with a running average over the whole training history.
             epoch_costs = [train_model(i) for i in range(batches)]
             mean_cost = np.mean(epoch_costs)
             if mean_cost >= lastcostJ:
                 print("costJ is increasing !!!")
                 break
             lastcostJ = mean_cost
             print(('epoch %i, minibatch %i/%i,averange cost is %f') %
                   (epoch, batches, batches, lastcostJ))

         self.theta = theta
         trained = theta.get_value()

         # Persist the parameters once; an existing file is never overwritten.
         save_path = 'data/softmax.pkl'
         if not os.path.exists(save_path):
             save_dir = os.path.dirname(save_path)
             if not os.path.isdir(save_dir):
                 os.makedirs(save_dir)
             with open(save_path, 'wb') as f:
                 cPickle.dump(trained, f)
         return trained

     def process_test(self, data, label, batch_size=500):
         """Print and return the mean misclassification rate on ``data``.

         Args:
             data: 2-D array-like, one sample per row.
             label: 1-D array-like of integer class indices.
             batch_size: rows per minibatch (clamped to the sample count).

         Returns:
             Mean of the per-minibatch error rates, in [0, 1].

         Raises:
             ValueError: if the model has no parameters yet, on empty input
                 or on a non-positive ``batch_size``.
         """
         if getattr(self, 'theta', None) is None:
             raise ValueError(
                 "no parameters: call process_train() or load_theta() first")
         label = np.asarray(label)
         batch_size, batches = self._batch_layout(label.shape[0], batch_size)
         data, label = self._as_shared(data, label)

         x = T.matrix('x')
         y = T.ivector('y')
         index = T.lscalar()
         hx = T.nnet.softmax(T.dot(x, self.theta))
         predict = T.argmax(hx, axis=1)
         errors = T.mean(T.neq(predict, y))
         test_model = theano.function(
             inputs=[index], outputs=errors,
             givens={
                 x: data[index * batch_size: (index + 1) * batch_size],
                 y: label[index * batch_size: (index + 1) * batch_size],
             },
             allow_input_downcast=True)

         test_losses = [test_model(i) for i in range(batches)]
         test_score = np.mean(test_losses)
         print(('minibatch %i/%i, test error of model %f %%') %
               (batches, batches, test_score * 100.))
         return test_score

     def h(self, x):
         """Return class probabilities for ``x`` using NumPy only.

         Args:
             x: array-like of shape (n_samples, n_features); a single 1-D
                 sample is treated as one row.

         Returns:
             ndarray of shape (n_samples, n_classes) whose rows sum to 1.
         """
         scores = np.dot(np.atleast_2d(x), self._theta_value())
         # Subtracting the row maximum leaves the softmax unchanged but
         # keeps exp() from overflowing.
         scores = scores - np.max(scores, axis=1, keepdims=True)
         m = np.exp(scores)
         # keepdims makes the row sums broadcast across the class axis.
         return m / np.sum(m, axis=1, keepdims=True)

     def predict(self, x):
         """Return the most probable class index for every row of ``x``."""
         return np.argmax(self.h(x), axis=1)

 if __name__ == '__main__':
     # Train on the training split of mnist.pkl and report the error on the
     # validation split.  The test split is unpacked but not used here.
     # NOTE(security): unpickling can execute arbitrary code; only use a
     # trusted mnist.pkl.
     with open('mnist.pkl', 'rb') as f:
         training_data, validation_data, test_data = cPickle.load(f)

     # Element [0] of each split holds the inputs and [1] the labels; every
     # input is flattened to a 784-element vector.
     data = np.array([np.reshape(x, 784) for x in training_data[0]])
     vdata = np.array([np.reshape(x, 784) for x in validation_data[0]])

     softmax = SoftMax()
     softmax.process_train(data, training_data[1], 10)
     softmax.process_test(vdata, validation_data[1])
     # Output recorded by the author:
     # minibatch 20/20, test error of model 7.530000 %

Softmax回归（使用theano）的更多相关文章

Softmax回归
Reference: http://ufldl.stanford.edu/wiki/index.php/Softmax_regression http://deeplearning.net/tutor ...
Softmax回归（Softmax Regression）
转载请注明出处:http://www.cnblogs.com/BYRans/ 多分类问题在一个多分类问题中,因变量y有k个取值,即.例如在邮件分类问题中,我们要把邮件分为垃圾邮件.个人邮件.工作邮件 ...
DeepLearning之路（二）SoftMax回归
Softmax回归 1. softmax回归模型 softmax回归模型是logistic回归模型在多分类问题上的扩展(logistic回归解决的是二分类问题). 对于训练集,有. 对于给定的测试 ...
Machine Learning 学习笔记 (3) —— 泊松回归与Softmax回归
本系列文章允许转载,转载请保留全文! [请先阅读][说明&总目录]http://www.cnblogs.com/tbcaaa8/p/4415055.html 1. 泊松回归 (Poisson ...
Softmax 回归原理介绍
考虑一个多分类问题,即预测变量y可以取k个离散值中的任何一个.比如一个邮件分类系统将邮件分为私人邮件,工作邮件和垃圾邮件.由于y仍然是一个离散值,只是相对于二分类的逻辑回归多了一些类别.下面将根据多项 ...
UFLDL教程（四）之Softmax回归
关于Andrew Ng的machine learning课程中,有一章专门讲解逻辑回归(Logistic回归),具体课程笔记见另一篇文章. 下面,对Logistic回归做一个简单的小结: 给定一个待分 ...
机器学习 —— 基础整理（五）线性回归；二项Logistic回归；Softmax回归及其梯度推导；广义线性模型
本文简单整理了以下内容: (一)线性回归 (二)二分类:二项Logistic回归 (三)多分类:Softmax回归 (四)广义线性模型闲话:二项Logistic回归是我去年入门机器学习时学的第一个模 ...
LR多分类推广 - Softmax回归*
LR是一个传统的二分类模型,它也可以用于多分类任务,其基本思想是:将多分类任务拆分成若干个二分类任务,然后对每个二分类任务训练一个模型,最后将多个模型的结果进行集成以获得最终的分类结果.一般来说,可以 ...
Logistic回归（逻辑回归）和softmax回归
一.Logistic回归 Logistic回归(Logistic Regression,简称LR)是一种常用的处理二类分类问题的模型. 在二类分类问题中,把因变量y可能属于的两个类分别称为负类和正类, ...
手写数字识别 ----Softmax回归模型官方案例注释（基于Tensorflow,Python）
# 手写数字识别 ----Softmax回归模型 # regression import os import tensorflow as tf from tensorflow.examples.tut ...

随机推荐

三极管的妙用之C118自动刷机
首先咱们要搞清楚咱们自动刷机的原理,不谈修改固件那么高深的东西,简单的就是控制开机键. 使用继电器来控制基本上算是上个世纪的想法吧,之前博主也做过,做出来的感觉其实也很不错,就像是一个收藏品.因为继电 ...
<xliff:g>标签
摘要: 这是Android4.3Mms源码中的strings.xml的一段代码: <!--Settings item desciption for integer auto-delete sms ...
【LeetCode OJ】Longest Consecutive Sequence
Problem Link: http://oj.leetcode.com/problems/longest-consecutive-sequence/ This problem is a classi ...
React Native 组件之Image
Image组件类似于iOS中UIImage控件,该组件可以通过多种方式加载图片资源. 使用方式,加载方式有如下几种: /** * Sample React Native App * https://g ...
Weblogic项目部署及数据源配置
号线项目总结: weblogic项目配置: 把工作区放到磁盘上,建立weblogic域在安装的weblogic服务器的开始项里选择进入weblogic域的建立. 建立完域后用Myeclipse打开 ...
第四部分：python性能技巧
4.1 查询操作为主时,选择字典结构比list结构效率更高 4.2 取list的交集.并集.差集时,可借助set数据结构如listintersection = list(set(lista)& ...
[转]国内良心DNS汇集
http://www.changbizi.net/archives/664.html 长鼻子实验室湖北电信的DNS服务器真是烂到掉渣,曾经有一年我给他们的售后打电话到人家都记住我的手机号码,但是DN ...
12. Integer to Roman
Given an integer, convert it to a roman numeral. Input is guaranteed to be within the range from 1 t ...
Sprint第二个冲刺（第三天）
一.Sprint 计划会议: 今天我们召开了第二个Sprint的第三次会议,会议上我们把各自完成的情况进行了一次总结,现在主界面和美化按钮.增添图片的功能已经完成了,Doing里面的其他 ...
javabean实现serializable有什么用？为什么数据库持久就Bean实现这个接口？
Java的"对象序列化"能让你将一个实现了Serializable接口的对象转换成一组byte,这样日后要用这个对象时候,你就能把这些byte数据恢复出来,并据此重新构建那个对象了 ...

Softmax回归（使用theano）

Softmax回归（使用theano）的更多相关文章

随机推荐

热门专题