原文地址：http://www.jianshu.com/p/311141f2047d

问题描述

程序实现

13-15

# coding: utf-8

import numpy as np

import numpy.random as random

import matplotlib.pyplot as plt

def sign(x):
    """Return +1 when the scalar *x* is non-negative, otherwise -1.

    Zero is mapped to +1.
    """
    return 1 if x >= 0 else -1

def gen_data(num_data=1000, noise=0.1):
    """Generate a noisy two-dimensional classification data set.

    Points are drawn uniformly from [-1, 1] x [-1, 1] and labelled with the
    sign of ``x1**2 + x2**2 - 0.6`` (a zero value is labelled +1).  The labels
    of a randomly chosen subset of the samples are then flipped.

    Args:
        num_data: number of samples to generate (defaults to 1000).
        noise: fraction of samples whose label is flipped (defaults to 0.1).
            ``ceil(num_data * noise)`` samples are flipped.

    Returns:
        A tuple ``(dataX, dataY)`` where ``dataX`` has shape ``(num_data, 3)``
        with columns ``[1, x1, x2]`` and ``dataY`` has shape ``(num_data, 1)``
        holding labels in ``{-1.0, +1.0}``.

    Raises:
        ValueError: if ``noise`` is not within ``[0, 1]``.
    """
    if not 0 <= noise <= 1:
        raise ValueError("noise must be within [0, 1]")

    # Draw order (x1, x2, permutation) is kept so a fixed seed consumes the
    # random stream in the same sequence as before.
    x1 = random.uniform(-1, 1, num_data)
    x2 = random.uniform(-1, 1, num_data)
    id_array = random.permutation(num_data)

    # Noise-free target for every sample at once.
    labels = np.where(x1 ** 2 + x2 ** 2 - 0.6 >= 0, 1.0, -1.0)

    # The first entries of the permutation select the samples to corrupt;
    # the indices are unique, so each selected label is flipped exactly once.
    num_flipped = int(np.ceil(num_data * noise))
    labels[id_array[:num_flipped]] *= -1

    # Design matrix with a leading constant column for the bias term.
    dataX = np.ones((num_data, 3))
    dataX[:, 1] = x1
    dataX[:, 2] = x2
    dataY = labels.reshape((num_data, 1))
    return dataX, dataY

def w_lin(dataX, dataY):
    """Return the least-squares linear-regression weights for (dataX, dataY).

    The solution is ``pinv(dataX) @ dataY``.  Using the pseudo-inverse rather
    than explicitly inverting ``dataX^T dataX`` keeps the function usable when
    the design matrix is rank-deficient (e.g. duplicated feature columns), in
    which case the minimum-norm least-squares solution is returned.

    Args:
        dataX: design matrix of shape ``(num_data, num_dim)``.
        dataY: targets of shape ``(num_data, 1)``.

    Returns:
        Weight matrix of shape ``(num_dim, 1)``.
    """
    return np.dot(np.linalg.pinv(dataX), dataY)

def pred(dataX, wLIN):
    """Classify every row of *dataX* with the linear model *wLIN*.

    The score ``dataX @ wLIN`` is thresholded at zero in one vectorized step:
    non-negative scores map to +1 and negative scores to -1.

    Args:
        dataX: feature matrix of shape ``(num_data, num_dim)``.
        wLIN: weight matrix of shape ``(num_dim, 1)``.

    Returns:
        Float array with the same shape as ``dataX @ wLIN`` whose entries are
        ``+1.0`` or ``-1.0``.
    """
    scores = np.dot(dataX, wLIN)
    return np.where(scores >= 0, 1.0, -1.0)

def zero_one_cost(pred, dataY):
    """Return the 0/1 error: mismatching entries divided by the row count.

    Args:
        pred: predicted labels.
        dataY: reference labels; its first dimension is the denominator.
    """
    mismatches = np.not_equal(pred, dataY)
    return mismatches.sum() / len(dataY)

def feat_transform(dataX):
    """Append second-order features to a ``[1, x1, x2]`` design matrix.

    The returned matrix keeps every original column and adds, in this order,
    ``x1 * x2``, ``x1 ** 2`` and ``x2 ** 2`` computed from columns 1 and 2.
    """
    # Width-one slices stay two-dimensional, so no reshaping is needed.
    first = dataX[:, 1:2]
    second = dataX[:, 2:3]
    return np.concatenate(
        (dataX, first * second, first ** 2, second ** 2), axis=1)

if __name__ == "__main__":

    def _save_hist(values, x_label, title, file_name):
        """Draw a histogram of *values* on a new figure and save it."""
        plt.figure()
        plt.hist(values)
        plt.xlabel(x_label)
        plt.ylabel("frequency")
        plt.title(title)
        plt.savefig(file_name)

    # Problem 13: in-sample 0/1 error of linear regression on the raw
    # features, repeated over 1000 freshly generated data sets.
    ein_history = []
    for _ in range(1000):
        dataX, dataY = gen_data()
        wLIN = w_lin(dataX, dataY)
        ein_history.append(zero_one_cost(pred(dataX, wLIN), dataY))

    print("the average Ein over 1000 experiments: ", sum(ein_history) / len(ein_history))
    _save_hist(ein_history, "zero_one Ein", "13", "13.png")

    # Problems 14-15: fit on second-order features, then measure the error on
    # an independently generated test set.
    weight_rows = []
    eout_history = []
    for _ in range(1000):
        # train
        dataX, dataY = gen_data()
        dataX = feat_transform(dataX)
        wLIN = w_lin(dataX, dataY)
        weight_rows.append(wLIN[:, 0].tolist())

        # test
        testX, testY = gen_data()
        testX = feat_transform(testX)
        eout_history.append(zero_one_cost(pred(testX, wLIN), testY))

    # Weight vector of the run that achieved the smallest test error.
    best_run = eout_history.index(min(eout_history))
    print(weight_rows[best_run])

    W = np.array(weight_rows)

    # show w3
    print("the average w3 over 1000 experiments: ", np.average(W, axis=0)[3])
    _save_hist(W[:, 3].tolist(), "w3", "14", "14.png")

    # show Eout
    print("the average Eout over 1000 experiments: ", sum(eout_history) / len(eout_history))
    _save_hist(eout_history, "Eout", "15", "15.png")

18-20

# coding: utf-8

import numpy as np

def sigmoid(x):
    """Return the logistic function ``1 / (1 + exp(-x))`` of *x*.

    The value is computed as ``exp(-log(1 + exp(-x)))`` through
    ``np.logaddexp`` so that large-magnitude inputs saturate to 0 or 1
    instead of overflowing.  Works element-wise on NumPy arrays as well as on
    scalars.

    Args:
        x: a scalar or a NumPy array.

    Returns:
        The logistic value(s), as a NumPy float or an array shaped like *x*.
    """
    return np.exp(-np.logaddexp(0.0, -x))

def read_data(dataFile):
    """Load a whitespace-separated numeric data file.

    Every non-blank line holds the feature values followed by the label.  A
    constant ``1.0`` is prepended to each row as the bias feature.  Blank
    lines are skipped so that a trailing newline or an empty separator line
    does not produce a ragged row.

    Args:
        dataFile: path of the file to read.

    Returns:
        A tuple ``(dataX, dataY)``: ``dataX`` has shape
        ``(num_data, num_features + 1)`` including the leading bias column,
        and ``dataY`` has shape ``(num_data, 1)``.

    Raises:
        ValueError: if the file contains no data rows or a field is not a
            valid float.
    """
    data_list = []
    with open(dataFile, 'r') as f:
        # Stream the file line by line instead of loading it all at once.
        for line in f:
            fields = line.split()
            if not fields:
                continue
            data_list.append([1.0] + [float(field) for field in fields])

    if not data_list:
        raise ValueError("no data rows found in " + str(dataFile))

    dataArray = np.array(data_list)
    # Width-one slice keeps the label column two-dimensional.
    dataX = dataArray[:, :-1]
    dataY = dataArray[:, -1:]
    return dataX, dataY

def gradient_descent(w, dataX, dataY, eta):
    """Perform one batch gradient-descent step for logistic regression.

    The gradient is the average over all samples of
    ``sigmoid(-y_n * w^T x_n) * (-y_n * x_n)``.

    Args:
        w: current weights, shape ``(num_dim, 1)``.
        dataX: feature matrix, shape ``(num_data, num_dim)``.
        dataY: labels, shape ``(num_data, 1)``.
        eta: learning rate.

    Returns:
        The updated weights, shape ``(num_dim, 1)``; *w* is not modified.

    Raises:
        ValueError: if the shape of *w* does not match *dataX* or *w* is not
            a single column.
    """
    # Explicit checks instead of ``assert`` so they survive ``python -O``.
    if w.shape[0] != dataX.shape[1]:
        raise ValueError("wrong shape!")
    if w.ndim != 2 or w.shape[1] != 1:
        raise ValueError("wrong shape of w!")

    num_dim = dataX.shape[1]
    neg_yx = -dataY * dataX
    margins = -dataY * np.dot(dataX, w)
    # Logistic function of every margin at once, written as
    # exp(-log(1 + exp(-z))) so large |z| saturates instead of overflowing.
    theta = np.exp(-np.logaddexp(0.0, -margins))
    gradient = np.average(neg_yx * theta, axis=0)
    return w - eta * gradient.reshape((num_dim, 1))

def s_gradient_descent(w, dataX, dataY, eta):
    """Perform one stochastic gradient-descent step for logistic regression.

    The step uses the single sample ``(dataX, dataY)``; its gradient is
    ``sigmoid(-y * w^T x) * (-y * x)``.

    Args:
        w: current weights, shape ``(num_dim, 1)``.
        dataX: one sample as a row, shape ``(1, num_dim)``.
        dataY: its label, shape ``(1, 1)``.
        eta: learning rate.

    Returns:
        The updated weights, shape ``(num_dim, 1)``; *w* is not modified.

    Raises:
        ValueError: if any argument does not have the shape described above.
    """
    # Explicit checks instead of ``assert`` so they survive ``python -O``.
    if w.shape[0] != dataX.shape[1]:
        raise ValueError("wrong shape!")
    if w.ndim != 2 or w.shape[1] != 1:
        raise ValueError("wrong shape of w!")
    if dataX.shape[0] != 1:
        raise ValueError("wrong shape of x!")
    if dataY.shape[0] != 1:
        raise ValueError("wrong shape of y!")

    num_dim = dataX.shape[1]
    neg_yx = -dataY * dataX
    margin = -dataY * np.dot(dataX, w)
    # Logistic function written as exp(-log(1 + exp(-z))) so that a large
    # |z| saturates instead of overflowing.
    theta = np.exp(-np.logaddexp(0.0, -margin))
    # Only one row is present, so no averaging over samples is required.
    gradient = (neg_yx * theta)[0]
    return w - eta * gradient.reshape((num_dim, 1))

def pred(wLOG, dataX):
    """Classify every row of *dataX* with the logistic-regression weights.

    A sample is labelled +1 when ``sigmoid(score) >= 0.5`` and -1 otherwise.
    Because the sigmoid is monotonic with ``sigmoid(0) == 0.5`` this is the
    same as testing ``score >= 0``, so the raw score ``dataX @ wLOG`` is
    thresholded directly.  That avoids overflow for large scores and avoids
    storing a fractional probability back into an integer score array, where
    it would be truncated.

    Args:
        wLOG: weight matrix of shape ``(num_dim, 1)``.
        dataX: feature matrix of shape ``(num_data, num_dim)``.

    Returns:
        Float array with the same shape as ``dataX @ wLOG`` whose entries are
        ``+1.0`` or ``-1.0``.
    """
    scores = np.dot(dataX, wLOG)
    return np.where(scores >= 0, 1.0, -1.0)

def zero_one_cost(pred, dataY):
    """Return the fraction of rows whose prediction differs from the label.

    Args:
        pred: predicted labels.
        dataY: reference labels; its first dimension is the denominator.
    """
    wrong = np.not_equal(pred, dataY)
    total = len(dataY)
    return wrong.sum() / total

if __name__ == "__main__":

    def _batch_train(step_size, num_steps):
        """Run batch gradient descent from zero weights on the training set."""
        weights = np.zeros((num_dim, 1))
        for _ in range(num_steps):
            weights = gradient_descent(weights, dataX, dataY, eta=step_size)
        return weights

    def _print_eout(weights):
        """Print the 0/1 error of *weights* on the test set."""
        Eout = zero_one_cost(pred(weights, testX), testY)
        print("the Eout(g) on the test set: ", Eout)

    # train
    dataX, dataY = read_data("hw3_train.dat")
    num_dim = dataX.shape[1]

    # Problem 18: eta = 0.001, 2000 batch updates.
    print("\n18")
    w = _batch_train(0.001, 2000)
    print("the weight vector within g: ", w[:, 0])

    # test (the test set is loaded once and reused by the later problems)
    testX, testY = read_data("hw3_test.dat")
    _print_eout(w)

    # Same step size with ten times as many updates.
    print("\n18.1")
    w = _batch_train(0.001, 20000)
    print("the weight vector within g: ", w[:, 0])
    _print_eout(w)

    # Problem 19: eta = 0.01, 2000 batch updates.
    print("\n19")
    w = _batch_train(0.01, 2000)
    print("the weight vector within g: ", w[:, 0])
    _print_eout(w)

    # Problem 20: stochastic updates, visiting the samples in cyclic order.
    print("\n20")
    w = np.zeros((num_dim, 1))
    num_data = dataX.shape[0]
    for step in range(2000):
        row = step % num_data
        x = dataX[row, :].reshape((1, num_dim))
        y = dataY[row, :].reshape((1, 1))
        w = s_gradient_descent(w, x, y, eta=0.001)
    print("the weight vector within g: ", w[:, 0])
    _print_eout(w)

运行结果及分析

13-15

18-20

对比18和18.1，可知迭代步长较小时，需要较多迭代次数才能达到较优效果。

机器学习基石笔记：Homework #3 LinReg&LogReg相关习题的更多相关文章

机器学习基石笔记：Homework #1 PLA&PA相关习题
原文地址:http://www.jianshu.com/p/5b4a64874650 问题描述程序实现 # coding: utf-8 import numpy as np import matpl ...
机器学习基石笔记：Homework #2 decision stump相关习题
原文地址:http://www.jianshu.com/p/4bc01760ac20 问题描述程序实现 17-18 # coding: utf-8 import numpy as np import ...
机器学习基石笔记：11 Linear Models for Classification、LC vs LinReg vs LogReg、OVA、OVO
原文地址:https://www.jianshu.com/p/6f86290e70f9 一.二元分类的线性模型线性回归后的参数值常用于PLA/PA/Logistic Regression的参数初始化 ...
机器学习基石笔记：Homework #4 Regularization&Validation相关习题
原文地址:https://www.jianshu.com/p/3f7d4aa6a7cf 问题描述程序实现 # coding: utf-8 import numpy as np import math ...
机器学习基石：Homework #0 SVD相关&常用矩阵求导公式
林轩田机器学习基石笔记1—The Learning Problem
机器学习分为四步: When Can Machine Learn? Why Can Machine Learn? How Can Machine Learn? How Can Machine Lear ...
机器学习基石笔记：01 The Learning Problem
原文地址:https://www.jianshu.com/p/bd7cb6c78e5e 什么时候适合用机器学习算法? 存在某种规则/模式,能够使性能提升,比如准确率: 这种规则难以程序化定义,人难以给 ...
机器学习基石笔记：04 Feasibility of Learning
原文地址:https://www.jianshu.com/p/f2f4d509060e 机器学习是设计算法\(A\),在假设集合\(H\)里,根据给定数据集\(D\),选出与实际模式\(f\)最为相近 ...
机器学习基石笔记：03 Types of Learning
原文地址:https://www.jianshu.com/p/86b2a9cef742 一.学习的分类根据输出空间\(Y\):分类(二分类.多分类).回归.结构化(监督学习+输出空间有结构): 根据 ...

随机推荐

.NET Core开源组件:后台任务利器之Hangfire 转载 https://www.cnblogs.com/chenug/p/6655636.html
.NET Core开源组件:后台任务利器之Hangfire 一.简述 Hangfire作为一款高人气且容易上手的分布式后台执行服务,支持多种数据库.在.net core的环境中,由Core自带的D ...
15. Django连接Mysql数据库
安装PyMySQL,打开cmd, pip install PyMySQL 在.../blog/init.py 目录下添加: import pymysql pymysql.install_as_MySQ ...
HDU 6242 Geometry Problem（计算几何 + 随机化）
题目链接:http://acm.hdu.edu.cn/showproblem.php?pid=6242 思路:当 n == 1 时任取一点 p 作为圆心即可. n >= 2 && ...
转 jmeter 等待时间 pacing think time
第一部分:Request之间的等待时间的设置先明确一些概念:1)定时器是在每个sampler(采样器)之前执行的,而不是之后:是的,你没有看错,不管这个定时器的位置放在sampler之后,还是之下, ...
LVM-扩容目录
LVM LVM是一种源自Unix环境,在Linux上广泛应用的逻辑虚拟盘存储方案.借助LVM,可以在保证各个Linux目录分区稳定,又可以实现各目录存储资源灵活分配. 本文主要系统介绍Linux环境下 ...
docker部署一个简单的main.py项目文件
安装docker yum install -y docker 启动docker systemctl start docker 查询可安装的Python版本,默认centos python 2.7 ...
隐式激活Activity
react踩坑
1.列表渲染一定要注意key的唯一性,不然会导致页面只更新部分的bug graphVertexConfigList.data.map((item, index) => { return < ...
shell专用参数变量
termcap - 终端功能数据库
描述 DESCRIPTION termcap 数据库是一个过时 (obsolete) 工具,用来描述以字符为单位的终端和打印机的功能.它之所以被保留,是为了兼容古老的程序:新程序应当使用 termin ...

机器学习基石笔记：Homework #3 LinReg&LogReg相关习题

问题描述

程序实现

13-15

18-20

运行结果及分析

13-15

18-20

机器学习基石笔记：Homework #3 LinReg&LogReg相关习题的更多相关文章

随机推荐

热门专题