Softmax回归（使用theano）

 # coding:utf8

 import numpy as np

 import cPickle

 import theano

 import os

 import theano.tensor as T

 class SoftMax:
     """Multinomial logistic (softmax) regression trained with Theano.

     The weights live in ``self.theta`` with shape (n_features, n_classes);
     the model has no bias term.  After ``process_train`` the attribute is a
     Theano shared variable; after ``load_theta`` it is whatever object the
     pickle file contained (``process_train`` pickles a NumPy array).
     """

     def __init__(self, MAXT=50, step=0.15, landa=0):
         """Store the training hyper-parameters.

         MAXT  -- maximum number of passes (epochs) over the training set.
         step  -- learning rate of the gradient-descent update.
         landa -- coefficient of the L2 weight-decay term added to the cost.
         """
         self.MAXT = MAXT
         self.step = step
         # Original author's note: weight decay did not improve accuracy here.
         self.landa = landa
         # Filled in by process_train() or load_theta().
         self.theta = None

     def load_theta(self, datapath):
         """Load previously saved weights from the pickle file *datapath*."""
         # NOTE(security): unpickling can execute arbitrary code; only load
         # files that come from a trusted source.
         with open(datapath, 'rb') as f:
             self.theta = cPickle.load(f)

     @staticmethod
     def _count_batches(n_samples, batch_size):
         """Return the number of complete mini-batches, rejecting zero."""
         if batch_size <= 0:
             raise ValueError('batch_size must be positive, got %r'
                              % (batch_size,))
         # Floor division: a trailing partial batch is ignored.
         batches = n_samples // batch_size
         if batches == 0:
             raise ValueError('need at least batch_size=%d samples, got %d'
                              % (batch_size, n_samples))
         return batches

     def _theta_array(self):
         """Return the weights as a NumPy array regardless of how stored."""
         theta = getattr(self, 'theta', None)
         if theta is None:
             raise ValueError('theta is not set; call process_train() or '
                              'load_theta() first')
         # A Theano shared variable exposes its contents via get_value().
         if hasattr(theta, 'get_value'):
             return theta.get_value()
         return np.asarray(theta)

     def process_train(self, data, label, typenum, batch_size=500):
         """Fit the weights by mini-batch gradient descent.

         data       -- 2-D array-like, one sample per row.
         label      -- 1-D array-like of integer class indices, one per row.
         typenum    -- number of classes.
         batch_size -- rows per mini-batch; rows beyond the last complete
                       batch are not used.

         Training runs for at most ``self.MAXT`` epochs and stops early as
         soon as the mean cost of an epoch is not lower than that of the
         previous epoch.  The trained weights are stored in ``self.theta``
         and pickled to ``data/softmax.pkl`` unless that file already
         exists (the ``data`` directory is created when missing).

         Returns the trained weights as a NumPy array.
         Raises ValueError when fewer than ``batch_size`` samples are given.
         """
         data = np.asarray(data, dtype=theano.config.floatX)
         valuenum = data.shape[1]
         batches = self._count_batches(data.shape[0], batch_size)

         data = theano.shared(data)
         # Labels are stored as floatX and cast back to int32 in the graph.
         label = T.cast(
             theano.shared(np.asarray(label, dtype=theano.config.floatX)),
             'int32')

         x = T.matrix('x')
         y = T.ivector('y')
         index = T.lscalar()

         theta = theano.shared(
             value=np.zeros((valuenum, typenum), dtype=theano.config.floatX),
             name='theta', borrow=True)
         hx = T.nnet.softmax(T.dot(x, theta))
         # Mean negative log-likelihood plus the weight-decay term.
         cost = (-T.mean(T.log(hx)[T.arange(y.shape[0]), y])
                 + 0.5 * self.landa * T.sum(theta ** 2))
         g_theta = T.grad(cost, theta)
         updates = [(theta, theta - self.step * g_theta)]

         train_model = theano.function(
             inputs=[index], outputs=cost, updates=updates,
             givens={
                 x: data[index * batch_size: (index + 1) * batch_size],
                 y: label[index * batch_size: (index + 1) * batch_size],
             },
             allow_input_downcast=True)

         lastcostJ = np.inf
         epoch = 0
         while epoch < self.MAXT:
             epoch += 1
             # Costs are collected per epoch so the comparison below is
             # between consecutive epochs, not between running averages
             # over the whole training history.
             epoch_cost = np.mean([train_model(i) for i in range(batches)])
             if epoch_cost >= lastcostJ:
                 print("costJ is increasing !!!")
                 break
             lastcostJ = epoch_cost
             print(('epoch %i, minibatch %i/%i,averange cost is %f') %
                   (epoch, batches, batches, lastcostJ))

         self.theta = theta
         weights = theta.get_value()
         # An existing model file is deliberately left untouched.
         if not os.path.exists('data/softmax.pkl'):
             if not os.path.isdir('data'):
                 os.makedirs('data')
             with open("data/softmax.pkl", 'wb') as f:
                 cPickle.dump(weights, f)
         return weights

     def process_test(self, data, label, batch_size=500):
         """Print and return the classification error rate on a data set.

         data       -- 2-D array-like, one sample per row.
         label      -- 1-D array-like of integer class indices.
         batch_size -- rows per mini-batch; rows beyond the last complete
                       batch are not evaluated.

         Returns the mean error over the mini-batches as a fraction in
         [0, 1]; the printed value is the same number as a percentage.
         Raises ValueError when the weights are not set or when fewer than
         ``batch_size`` labels are given.
         """
         if getattr(self, 'theta', None) is None:
             raise ValueError('theta is not set; call process_train() or '
                              'load_theta() first')
         batches = self._count_batches(np.asarray(label).shape[0], batch_size)

         data = theano.shared(np.asarray(data, dtype=theano.config.floatX))
         label = T.cast(
             theano.shared(np.asarray(label, dtype=theano.config.floatX)),
             'int32')

         x = T.matrix('x')
         y = T.ivector('y')
         index = T.lscalar()

         hx = T.nnet.softmax(T.dot(x, self.theta))
         predict = T.argmax(hx, axis=1)
         errors = T.mean(T.neq(predict, y))

         test_model = theano.function(
             inputs=[index], outputs=errors,
             givens={
                 x: data[index * batch_size: (index + 1) * batch_size],
                 y: label[index * batch_size: (index + 1) * batch_size],
             },
             allow_input_downcast=True)

         test_score = np.mean([test_model(i) for i in range(batches)])
         print(('minibatch %i/%i, test error of model %f %%') %
               (batches, batches, test_score * 100.))
         return test_score

     def h(self, x):
         """Return the class probabilities for the sample(s) *x*.

         x -- a single sample (1-D) or one sample per row (2-D).

         The result has one probability per class along the last axis and
         each sample's probabilities sum to 1.
         """
         logits = np.dot(x, self._theta_array())
         # Subtracting the per-sample maximum leaves the softmax unchanged
         # but keeps exp() from overflowing on large logits.
         logits = logits - np.max(logits, axis=-1, keepdims=True)
         m = np.exp(logits)
         # keepdims makes the sums broadcast per sample (row-wise).
         return m / np.sum(m, axis=-1, keepdims=True)

     def predict(self, x):
         """Return the index of the most probable class for each sample."""
         return np.argmax(self.h(x), axis=-1)

 if __name__ == '__main__':
     # Demo: train on the training split of mnist.pkl and report the error
     # on the validation split.  The test split is loaded but not used.
     # NOTE(security): unpickling can execute arbitrary code; only use an
     # mnist.pkl obtained from a trusted source.
     with open('mnist.pkl', 'rb') as f:
         training_data, validation_data, test_data = cPickle.load(f)

     # Flatten every sample to a 784-element vector, one sample per row.
     data = np.array([np.reshape(x, 784) for x in training_data[0]])
     vdata = np.array([np.reshape(x, 784) for x in validation_data[0]])

     softmax = SoftMax()
     softmax.process_train(data, training_data[1], 10)
     softmax.process_test(vdata, validation_data[1])
     # Output reported by the original author:
     # minibatch 20/20, test error of model 7.530000 %

Softmax回归（使用theano）的更多相关文章

Softmax回归
Reference: http://ufldl.stanford.edu/wiki/index.php/Softmax_regression http://deeplearning.net/tutor ...
Softmax回归（Softmax Regression）
转载请注明出处:http://www.cnblogs.com/BYRans/ 多分类问题 在一个多分类问题中,因变量y有k个取值,即 $y \in \{1, 2, \dots, k\}$.例如在邮件分类问题中,我们要把邮件分为垃圾邮件、个人邮件、工作邮件 ...
DeepLearning之路（二）SoftMax回归
Softmax回归 1. softmax回归模型 softmax回归模型是logistic回归模型在多分类问题上的扩展(logistic回归解决的是二分类问题). 对于训练集 $\{(x^{(1)}, y^{(1)}), \dots, (x^{(m)}, y^{(m)})\}$,有 $y^{(i)} \in \{1, 2, \dots, k\}$. 对于给定的测试 ...
Machine Learning 学习笔记 (3) —— 泊松回归与Softmax回归
本系列文章允许转载,转载请保留全文! [请先阅读][说明&总目录]http://www.cnblogs.com/tbcaaa8/p/4415055.html 1. 泊松回归 (Poisson ...
Softmax 回归原理介绍
考虑一个多分类问题,即预测变量y可以取k个离散值中的任何一个.比如一个邮件分类系统将邮件分为私人邮件,工作邮件和垃圾邮件.由于y仍然是一个离散值,只是相对于二分类的逻辑回归多了一些类别.下面将根据多项 ...
UFLDL教程（四）之Softmax回归
关于Andrew Ng的machine learning课程中,有一章专门讲解逻辑回归(Logistic回归),具体课程笔记见另一篇文章. 下面,对Logistic回归做一个简单的小结: 给定一个待分 ...
机器学习 —— 基础整理（五）线性回归；二项Logistic回归；Softmax回归及其梯度推导；广义线性模型
本文简单整理了以下内容: (一)线性回归 (二)二分类:二项Logistic回归 (三)多分类:Softmax回归 (四)广义线性模型闲话:二项Logistic回归是我去年入门机器学习时学的第一个模 ...
LR多分类推广 - Softmax回归*
LR是一个传统的二分类模型,它也可以用于多分类任务,其基本思想是:将多分类任务拆分成若干个二分类任务,然后对每个二分类任务训练一个模型,最后将多个模型的结果进行集成以获得最终的分类结果.一般来说,可以 ...
Logistic回归（逻辑回归）和softmax回归
一.Logistic回归 Logistic回归(Logistic Regression,简称LR)是一种常用的处理二类分类问题的模型. 在二类分类问题中,把因变量y可能属于的两个类分别称为负类和正类, ...
手写数字识别 ----Softmax回归模型官方案例注释（基于Tensorflow,Python）
# 手写数字识别 ----Softmax回归模型 # regression import os import tensorflow as tf from tensorflow.examples.tut ...

随机推荐

2014年3月份第2周51Aspx源码发布详情
MVC+EF某钢电子交易平台源码 2014-3-10 [VS2012]功能介绍:本源码是一套完整的电子交易平台系统,完全基于ASP.NET MVC+EF三层构架,开发环境为Visual Studio ...
bistu新生-1005
#include "stdio.h"#include "string.h"int main(){ char ku[]={'0','1','2','3','4', ...
Emacs常用命令
1.离开Emacs 挂起Emacs C-z 退出Emacs C-x C-c 2.文件打开文件 C-x C-f 保存文件 C-x C-s 保存所有的文件 C-x s 将一个文件的内容插入到当前buff ...
第一课~Django~简介
Django是一个可以使Web开发工作者的开发工作愉快并且高效的Web框架. 使用Django, 你能够以最小的代价构建和维护高质量的Web应用. 从好的方面来看, Web开发激动人心并且富有 ...
Google protobuf
个人理解: 定义.proto文件就是指明消息里包含的成员和类型,protoc会compile成相应的java文件包含interface和implementation class,然后在构建messag ...
IOS 作业项目(4)步步完成画图程序(中续)
一,程序布局整理前言://1,程序启动//2,程序流程框架//3,程序界面一致//4,程序界面功能, //这里只做页面的固定功能, //在首次创建界面时,我们会指定好固定事件触发前的固定方法 //至 ...
HDU 3038
http://acm.hdu.edu.cn/showproblem.php?pid=3038 题意:[1-n]的区间,有m个询问,每个询问表示[a,b]的和是s,问一共有多少组矛盾 sum[i]表示i ...
Selenium - 实现网页元素拖拽
Drag and Drop, 使用鼠标实现元素拖拽的操作貌似很复杂, 在Selenium中, 借助OpenQA.Selenium.Interactions.Actions类库中提供的方法, 实现起来还 ...
jQuery对象与DOM对象之间的转换
刚开始学习jQuery,可能一时会分不清楚哪些是jQuery对象,哪些是DOM对象.至于DOM对象不多解释,我们接触的太多了,下面重点介绍一下jQuery,以及两者相互间的转换. 什么是jQuery对 ...
性能测试之－wrk(转)
转载地址:http://zjumty.iteye.com/blog/2221040 测试先行是软件系统质量保证的有效手段. 在单元测试方面, 我们有非常成熟的 xUnit 方案. 在集成测试方面, 我 ...

Softmax回归（使用theano）

Softmax回归（使用theano）的更多相关文章

随机推荐

热门专题