机器学习作业（三）多类别分类与神经网络—

题目太长了！下载地址【传送门】

第1题

简述：识别图片上的数字。

 import numpy as np

 import scipy.io as scio

 import matplotlib.pyplot as plt

 import scipy.optimize as op

 #显示图片数据

 def displayData(X):

     m = np.size(X, 0)  #X的行数，即样本数量

     n = np.size(X, 1)  #X的列数，即单个样本大小

     example_width = int(np.round(np.sqrt(n)))  #单张图片宽度

     example_height = int(np.floor(n / example_width))  #单张图片高度

     display_rows = int(np.floor(np.sqrt(m)))  #显示图中，一行多少张图

     display_cols = int(np.ceil(m / display_rows))  #显示图中，一列多少张图片

     pad = 1  #图片间的间隔

     display_array = - np.ones((pad + display_rows * (example_height + pad),

                             pad + display_cols * (example_width + pad)))  #初始化图片矩阵

     curr_ex = 0  #当前的图片计数

     #将每张小图插入图片数组中

     for j in range(0, display_rows):

         for i in range(0, display_cols):

             if curr_ex >= m:

                 break

             max_val = np.max(abs(X[curr_ex, :]))

             jstart = pad + j * (example_height + pad)

             istart = pad + i * (example_width + pad)

             display_array[jstart: (jstart + example_height), istart: (istart + example_width)] = \

                 np.array(X[curr_ex, :]).reshape(example_height, example_width) / max_val

             curr_ex = curr_ex + 1

         if curr_ex >= m:

             break

     display_array = display_array.T

     plt.imshow(display_array,cmap=plt.cm.gray)

     plt.axis('off')

     plt.show()

 #计算hθ(z)

 def sigmoid(z):

     g = 1.0 / (1.0 + np.exp(-z))

     return g

 #计算cost

 def lrCostFunction(theta, X, y, lamb):

     theta = np.array(theta).reshape((np.size(theta), 1))

     m = np.size(y)

     h = sigmoid(np.dot(X, theta))

     J = 1 / m * (-np.dot(y.T, np.log(h)) - np.dot((1 - y.T), np.log(1 - h)))

     theta2 = theta[1:, 0]

     Jadd = lamb / (2 * m) * np.sum(theta2 ** 2)

     J = J + Jadd

     return J.flatten()

 #计算梯度

 def gradient(theta, X, y, lamb):

     theta = np.array(theta).reshape((np.size(theta), 1))

     m = np.size(y)

     h = sigmoid(np.dot(X, theta))

     grad = 1/m*np.dot(X.T, h - y)

     theta[0,0] = 0

     gradadd = lamb/m*theta

     grad = grad + gradadd

     return grad.flatten()

 #θ计算

 def oneVsAll(X, y, num_labels, lamb):

     m = np.size(X, 0)

     n = np.size(X, 1)

     all_theta = np.zeros((num_labels, n+1))

     one = np.ones(m)

     X = np.insert(X, 0, values=one, axis=1)

     for c in range(0, num_labels):

         initial_theta = np.zeros(n+1)

         y_t = (y==c)

         result = op.minimize(fun=lrCostFunction, x0=initial_theta, args=(X, y_t, lamb), method='TNC', jac=gradient)

         all_theta[c, :] = result.x

     return all_theta

 #计算准确率

 def predictOneVsAll(all_theta, X):

     m = np.size(X, 0)

     num_labels = np.size(all_theta, 0)

     p = np.zeros((m, 1))  #用来保存每行的最大值

     g = np.zeros((np.size(X, 0), num_labels))  #用来保存每次分类后的结果（一共分类了10次，每次保存到一列上）

     one = np.ones(m)

     X = np.insert(X, 0, values=one, axis=1)

     for c in range(0, num_labels):

         theta = all_theta[c, :]

         g[:, c] = sigmoid(np.dot(X, theta.T))

     p = g.argmax(axis=1)

     # print(p)

     return p.flatten()

 #加载数据文件

 data = scio.loadmat('ex3data1.mat')

 X = data['X']

 y = data['y']

 y = y%10  #因为数据集是考虑了matlab从1开始，把0的结果保存为了10，这里进行取余，将10变回0

 m = np.size(X, 0)

 rand_indices = np.random.randint(0,m,100)

 sel = X[rand_indices, :]

 displayData(sel)

 #计算θ

 lamb = 0.1

 num_labels = 10

 all_theta = oneVsAll(X, y, num_labels, lamb)

 # print(all_theta)

 #计算预测的准确性

 pred = predictOneVsAll(all_theta, X)

 # np.set_printoptions(threshold=np.inf)

 #在计算这个上遇到了一个坑：

 #pred输出的是[[...]]的形式，需要flatten变成1维向量，y同样用flatten变成1维向量

 acc = np.mean(pred == y.flatten())*100

 print('Training Set Accuracy:',acc,'%')

运行结果：

第2题

简介：使用神经网络实现数字识别（Θ已提供）

 import numpy as np

 import scipy.io as scio

 import matplotlib.pyplot as plt

 import scipy.optimize as op

 #显示图片数据

 def displayData(X):

     m = np.size(X, 0)  #X的行数，即样本数量

     n = np.size(X, 1)  #X的列数，即单个样本大小

     example_width = int(np.round(np.sqrt(n)))  #单张图片宽度

     example_height = int(np.floor(n / example_width))  #单张图片高度

     display_rows = int(np.floor(np.sqrt(m)))  #显示图中，一行多少张图

     display_cols = int(np.ceil(m / display_rows))  #显示图中，一列多少张图片

     pad = 1  #图片间的间隔

     display_array = - np.ones((pad + display_rows * (example_height + pad),

                             pad + display_cols * (example_width + pad)))  #初始化图片矩阵

     curr_ex = 0  #当前的图片计数

     #将每张小图插入图片数组中

     for j in range(0, display_rows):

         for i in range(0, display_cols):

             if curr_ex >= m:

                 break

             max_val = np.max(abs(X[curr_ex, :]))

             jstart = pad + j * (example_height + pad)

             istart = pad + i * (example_width + pad)

             display_array[jstart: (jstart + example_height), istart: (istart + example_width)] = \

                 np.array(X[curr_ex, :]).reshape(example_height, example_width) / max_val

             curr_ex = curr_ex + 1

         if curr_ex >= m:

             break

     display_array = display_array.T

     plt.imshow(display_array,cmap=plt.cm.gray)

     plt.axis('off')

     plt.show()

 #计算hθ(z)

 def sigmoid(z):

     g = 1.0 / (1.0 + np.exp(-z))

     return g

 #实现神经网络

 def predict(theta1, theta2, X):

     m = np.size(X,0)

     p = np.zeros((np.size(X, 0), 1))

     #第二层计算

     one = np.ones(m)

     X = np.insert(X, 0, values=one, axis=1)

     a2 = sigmoid(np.dot(X, theta1.T))

     #第三层计算

     one = np.ones(np.size(a2,0))

     a2 = np.insert(a2, 0, values=one, axis=1)

     a3 = sigmoid(np.dot(a2, theta2.T))

     p = a3.argmax(axis=1) + 1  #y的值为1-10，所以此处0-9要加1

     return p.flatten()

 #读取数据文件

 data = scio.loadmat('ex3data1.mat')

 X = data['X']

 y = data['y']

 m = np.size(X, 0)

 rand_indices = np.random.randint(0,m,100)

 sel = X[rand_indices, :]

 # displayData(sel)

 theta = scio.loadmat('ex3weights.mat')

 theta1 = theta['Theta1']

 theta2 = theta['Theta2']

 #预测准确率

 pred = predict(theta1, theta2, X)

 acc = np.mean(pred == y.flatten())*100

 print('Training Set Accuracy:',acc,'%')

 #识别单张图片

 for i in range(0, m):

     it = np.random.randint(0, m, 1)

     it = it[0]

     displayData(X[it:it+1, :])

     pred = predict(theta1, theta2, X[it:it+1, :])

     print('Neural Network Prediction:', pred)

     print('input q to exit:')

     cin = input()

     if cin == 'q':

         break

神经网络的矩阵表示分析：

运行结果：

机器学习作业（三）多类别分类与神经网络——Python(numpy)实现的更多相关文章

机器学习作业（三）多类别分类与神经网络——Matlab实现
题目太长了!下载地址[传送门] 第1题简述:识别图片上的数字. 第1步:读取数据文件: %% Setup the parameters you will use for this part of t ...
机器学习入门16 - 多类别神经网络 (Multi-Class Neural Networks)
原文链接:https://developers.google.com/machine-learning/crash-course/multi-class-neural-networks/ 多类别分类, ...
機器學習基石(Machine Learning Foundations) 机器学习基石作业三课后习题解答
今天和大家分享coursera-NTU-機器學習基石(Machine Learning Foundations)-作业三的习题解答.笔者在做这些题目时遇到非常多困难,当我在网上寻找答案时却找不到,而林 ...
机器学习实验报告：利用3层神经网络对CIFAR-10图像数据库进行分类
PS:这是6月份时的一个结课项目,当时的想法就是把之前在Coursera ML课上实现过的对手写数字识别的方法迁移过来,但是最后的效果不太好… 2014年 6 月一.实验概述实验采用的是CIFAR ...
Andrew Ng机器学习课程笔记（四）之神经网络
Andrew Ng机器学习课程笔记(四)之神经网络版权声明:本文为博主原创文章,转载请指明转载地址 http://www.cnblogs.com/fydeblog/p/7365730.html 前言 ...
斯坦福深度学习与nlp第四讲词窗口分类和神经网络
http://www.52nlp.cn/%E6%96%AF%E5%9D%A6%E7%A6%8F%E6%B7%B1%E5%BA%A6%E5%AD%A6%E4%B9%A0%E4%B8%8Enlp%E7%A ...
用Python开始机器学习（2：决策树分类算法）
http://blog.csdn.net/lsldd/article/details/41223147 从这一章开始进入正式的算法学习. 首先我们学习经典而有效的分类算法:决策树分类算法. 1.决策树 ...
吴恩达《深度学习》-第一门课 (Neural Networks and Deep Learning)-第三周：浅层神经网络(Shallow neural networks) -课程笔记
第三周:浅层神经网络(Shallow neural networks) 3.1 神经网络概述(Neural Network Overview) 使用符号$ ^{[
基于机器学习和TFIDF的情感分类算法，详解自然语言处理
摘要:这篇文章将详细讲解自然语言处理过程,基于机器学习和TFIDF的情感分类算法,并进行了各种分类算法(SVM.RF.LR.Boosting)对比本文分享自华为云社区<[Python人工智能] ...

随机推荐

clr via c# 程序集加载和反射集(一)
1,程序集加载---弱的程序集可以加载强签名的程序集,但是不可相反.否则引用会报错!(但是,反射是没问题的) //获取当前类的Assembly Assembly.GetEntryAssembly() ...
使用Nginx对.NetCore站点进行反向代理
前言之前的博客我已经在Linux上部署好了.NetCore站点且通过Supervisor对站点进行了进程守护,同时也安装好了Nginx.Nginx的用处非常大,还是简单说下,它最大的功能就是方便我们 ...
NServiceBus 入门到精通（一）
什么是NServiceBus?NServiceBus 是一个用于构建企业级 .NET系统的开源通讯框架.它在消息发布/订阅支持.工作流集成和高度可扩展性等方面表现优异,因此是很多分布式系统基础平台的理 ...
SAP S4HANA如何取到采购订单ITEM里的'条件'选项卡里的条件类型值？
SAP S4HANA如何取到采购订单ITEM里的'条件'选项卡里的条件类型值? 最近在准备一个采购订单行项目的增强的function spec.其中有一段逻辑是取到采购订单行项目条件里某个指定的条件类 ...
Maven 仓库、坐标、常用命令
maven中的仓库需要jar包时,先到本地仓库中找,没有就从中央仓库去下载到本地仓库. 中央仓库很多都在国外,下载速度慢.国内的一些公司在自己的服务器上搭建了maven仓库(中央仓库的镜像),供内部 ...
P3078 [USACO13MAR]Poker Hands S
链接:Miku ---------------- 这道题和线段树有什么关系 --------------- 很简单的贪心,如果一堆牌比左边的大,那么肯定是要加上他的差的反正,顺手出掉就可以了 --- ...
cf936B
题意简述:给出一个有向图,问从s出发是否能找到一条长度为奇数的路径并且路径的端点出度为0,存在就输出路径,如果不存在判断图中是否存在环,存在输出Draw,否则输出lose 题解:类似于DP,将每一个点 ...
leetcode腾讯精选练习之旋转链表（四）
旋转链表题目: 给定一个链表,旋转链表,将链表每个节点向右移动 k 个位置,其中 k 是非负数. 示例 1: 输入: 1->2->3->4->5->NULL, k = ...
# ConfigureAwait常见问题解答
原文: https://devblogs.microsoft.com/dotnet/configureawait-faq/ .NET 在七多年前在语言和类库添加了 async/await .在那个时候 ...
SpringBoot 教程之发送邮件
目录 1. 简介 2. API 3. 配置 4. 实战 5. 示例源码 6. 参考资料 1. 简介 Spring Boot 收发邮件最简便方式是通过 spring-boot-starte ...

机器学习作业（三）多类别分类与神经网络——Python(numpy)实现

机器学习作业（三）多类别分类与神经网络——Python(numpy)实现的更多相关文章

随机推荐

热门专题