



# -*- coding: UTF-8 -*-

import random
import numpy as np
import matplotlib.pyplot as plt #加载数据
def load_exdata(filename):
    """Load a comma-separated file of integers into a list of rows.

    Args:
        filename: Path of the text file to read. Each non-blank line holds
            comma-separated integer values.

    Returns:
        A list with one inner list of ``int`` per non-blank line.

    Raises:
        ValueError: If a field cannot be parsed as an integer.
    """
    data = []
    with open(filename, 'r') as f:
        for line in f:
            if not line.strip():
                # Tolerate blank lines (e.g. a trailing newline at end of file).
                continue
            # int() matches this data set; use another parser if the input
            # file holds a different value type.
            data.append([int(item) for item in line.split(',')])
    return data


data = load_exdata('ex1data2.txt')
# The dtype follows the integer parsing above; change both together if the
# input data is of another type.
data = np.array(data, np.int64)

# Feature scaling
def featureNormalize(X):
    """Standardize every column of ``X`` to zero mean and unit deviation.

    Args:
        X: Two-dimensional array-like of shape (samples, features).

    Returns:
        A tuple ``(X_norm, mu, sigma)`` where ``X_norm`` has the shape of
        ``X`` and ``mu`` / ``sigma`` are arrays of shape (1, features)
        holding the per-column mean and (population) standard deviation.
    """
    X = np.asarray(X, dtype=float)
    mu = X.mean(axis=0, keepdims=True)       # per-column mean
    sigma = X.std(axis=0, keepdims=True)     # per-column standard deviation
    # A constant column has zero deviation; scale it by 1 instead so the
    # division yields 0 rather than NaN.
    sigma[sigma == 0] = 1.0
    X_norm = (X - mu) / sigma
    return X_norm, mu, sigma


# Compute the cost
def computeCost(X, y, theta):
    """Return the halved mean squared error of the linear model ``X.dot(theta)``.

    Args:
        X: Design matrix of shape (m, n).
        y: Target values of shape (m, 1).
        theta: Model parameters of shape (n, 1).

    Returns:
        ``(X.theta - y)^T (X.theta - y) / (2 * m)``; for column-vector ``y``
        and ``theta`` this is an array of shape (1, 1).
    """
    m = y.shape[0]
    residual = X.dot(theta) - y
    # Equivalent to np.sum(residual ** 2) / (2 * m), written as a dot product.
    return residual.T.dot(residual) / (2 * m)


# Gradient descent
def gradientDescent(X, y, theta, alpha, num_iters):
    """Fit linear-regression parameters with batch gradient descent.

    Args:
        X: Design matrix of shape (m, n).
        y: Target values of shape (m, 1).
        theta: Initial parameters of shape (n, 1); not modified in place.
        alpha: Learning rate.
        num_iters: Number of update steps to perform.

    Returns:
        A tuple ``(J_history, theta)``: ``J_history`` has shape
        (num_iters, 1) and stores the cost after every step, ``theta`` is
        the parameter vector after the last step.
    """
    m = y.shape[0]
    # Cost recorded after each update, one row per iteration.
    J_history = np.zeros((num_iters, 1))
    for step in range(num_iters):
        # Gradient of the cost with respect to theta is X^T (X.theta - y) / m.
        theta = theta - (alpha / m) * X.T.dot(X.dot(theta) - y)
        J_history[step] = computeCost(X, y, theta)
    return J_history, theta


# NOTE(review): the numeric value was missing from the source; 10000 is an
# assumed iteration count -- confirm against the intended setting.
iterations = 10000  # number of iterations
alpha = 0.01  # learning rate
# The first two columns are the input features, the third column is the
# target. NOTE(review): the column indices were missing from the source and
# are inferred from the two-element call to predict() below -- confirm.
x = data[:, (0, 1)].reshape((-1, 2))
y = data[:, 2].reshape((-1, 1))
m = y.shape[0]
x, mu, sigma = featureNormalize(x)
# Append a column of ones so the last entry of theta acts as the intercept.
X = np.hstack([x, np.ones((x.shape[0], 1))])
theta = np.zeros((3, 1))
j = computeCost(X, y, theta)
J_history, theta = gradientDescent(X, y, theta, alpha, iterations)
print('Theta found by gradient descent', theta)


def predict(data):
    """Print the model prediction for one sample of raw feature values.

    Args:
        data: Sequence of raw (un-normalized) feature values for a single
            sample, in the same column order as the training features.

    The sample is scaled with the module-level ``mu`` and ``sigma`` and
    evaluated with the module-level ``theta``.
    """
    testx = np.array(data)
    # Broadcasting against the (1, n) statistics yields a (1, n) row.
    testx = (testx - mu) / sigma
    testx = np.hstack([testx, np.ones((testx.shape[0], 1))])
    price = testx.dot(theta)
    # price is a (1, 1) array; extract the scalar explicitly because implicit
    # array-to-scalar conversion in string formatting is deprecated in NumPy.
    print('price is %d ' % (price.item()))


# NOTE(review): the sample values were missing from the source; these are
# assumed placeholders -- confirm.
predict([1650, 3])




# Python code (second version: floating-point data with three input features):

# -*- coding: UTF-8 -*-

import random
import numpy as np
import matplotlib.pyplot as plt #加载数据
def load_exdata(filename):
    """Load a comma-separated file of floating-point values into a list of rows.

    Args:
        filename: Path of the text file to read. Each non-blank line holds
            comma-separated numeric values.

    Returns:
        A list with one inner list of ``float`` per non-blank line.

    Raises:
        ValueError: If a field cannot be parsed as a float.
    """
    data = []
    with open(filename, 'r') as f:
        for line in f:
            if not line.strip():
                # Tolerate blank lines (e.g. a trailing newline at end of file).
                continue
            data.append([float(item) for item in line.split(',')])
    return data


data = load_exdata('testdata.txt')
# The data is floating point.
data = np.array(data, np.float64)

# Feature scaling
def featureNormalize(X):
    """Standardize every column of ``X`` to zero mean and unit deviation.

    Args:
        X: Two-dimensional array-like of shape (samples, features).

    Returns:
        A tuple ``(X_norm, mu, sigma)`` where ``X_norm`` has the shape of
        ``X`` and ``mu`` / ``sigma`` are arrays of shape (1, features)
        holding the per-column mean and (population) standard deviation.
    """
    X = np.asarray(X, dtype=float)
    mu = X.mean(axis=0, keepdims=True)       # per-column mean
    sigma = X.std(axis=0, keepdims=True)     # per-column standard deviation
    # A constant column has zero deviation; scale it by 1 instead so the
    # division yields 0 rather than NaN.
    sigma[sigma == 0] = 1.0
    X_norm = (X - mu) / sigma
    return X_norm, mu, sigma


# Compute the cost
def computeCost(X, y, theta):
    """Return the halved mean squared error of the linear model ``X.dot(theta)``.

    Args:
        X: Design matrix of shape (m, n).
        y: Target values of shape (m, 1).
        theta: Model parameters of shape (n, 1).

    Returns:
        ``(X.theta - y)^T (X.theta - y) / (2 * m)``; for column-vector ``y``
        and ``theta`` this is an array of shape (1, 1).
    """
    m = y.shape[0]
    residual = X.dot(theta) - y
    # Equivalent to np.sum(residual ** 2) / (2 * m), written as a dot product.
    return residual.T.dot(residual) / (2 * m)


# Gradient descent
def gradientDescent(X, y, theta, alpha, num_iters):
    """Fit linear-regression parameters with batch gradient descent.

    Args:
        X: Design matrix of shape (m, n).
        y: Target values of shape (m, 1).
        theta: Initial parameters of shape (n, 1); not modified in place.
        alpha: Learning rate.
        num_iters: Number of update steps to perform.

    Returns:
        A tuple ``(J_history, theta)``: ``J_history`` has shape
        (num_iters, 1) and stores the cost after every step, ``theta`` is
        the parameter vector after the last step.
    """
    m = y.shape[0]
    # Cost recorded after each update, one row per iteration.
    J_history = np.zeros((num_iters, 1))
    for step in range(num_iters):
        # Gradient of the cost with respect to theta is X^T (X.theta - y) / m.
        theta = theta - (alpha / m) * X.T.dot(X.dot(theta) - y)
        J_history[step] = computeCost(X, y, theta)
    return J_history, theta


# NOTE(review): the numeric value was missing from the source; 10000 is an
# assumed iteration count -- confirm against the intended setting.
iterations = 10000  # number of iterations
alpha = 0.01  # learning rate
# Input features: the 1st, 2nd and 3rd values of every row of the data set,
# reshaped into one three-column row per sample.
x = data[:, (0, 1, 2)].reshape((-1, 3))
# Output: the fourth value of every row.
y = data[:, 3].reshape((-1, 1))
m = y.shape[0]
x, mu, sigma = featureNormalize(x)
# Append a column of ones so the last entry of theta acts as the intercept.
X = np.hstack([x, np.ones((x.shape[0], 1))])
# Three features plus the intercept column give four parameters.
theta = np.zeros((4, 1))
j = computeCost(X, y, theta)
J_history, theta = gradientDescent(X, y, theta, alpha, iterations)
print('Theta found by gradient descent', theta)


def predict(data):
    """Print the model prediction for one sample of raw feature values.

    Args:
        data: Sequence of three raw (un-normalized) feature values for a
            single sample, in the same column order as the training features.

    The sample is scaled with the module-level ``mu`` and ``sigma`` and
    evaluated with the module-level ``theta``.
    """
    testx = np.array(data)
    # Broadcasting against the (1, n) statistics yields a (1, n) row.
    testx = (testx - mu) / sigma
    testx = np.hstack([testx, np.ones((testx.shape[0], 1))])
    price = testx.dot(theta)
    # price is a (1, 1) array; extract the scalar explicitly because implicit
    # array-to-scalar conversion in string formatting is deprecated in NumPy.
    print('predit value is %f ' % (price.item()))


# The input sample is three-dimensional.
predict([151.5, 41.3, 58.5])

