python怎樣搭建多層神經網絡?這個問題可能是我們日常工作經常見到的。通過這個問題,希望你能收獲更多。下面是解決這個問題的步驟內容。
成都創新互聯專注于企業營銷型網站建設、網站重做改版、瑯琊網站定制設計、自適應品牌網站建設、H5場景定制、商城網站定制開發、集團公司官網建設、成都外貿網站制作、高端網站制作、響應式網頁設計等建站業務,價格優惠性價比高,為瑯琊等各大城市提供網站開發制作服務。模型的搭建按照自己的想法設計,源碼共7個.py文件,如下圖:
按照創建先后順序,分別是:data.py,layer.py,network.py,activation.py,loss.py,train.py,evaluate.py。data.py用于獲取數據并對數據進行預處理,layer.py創建了一個Layer類,用來表示第L層,network.py抽象了一個網絡類,將傳入的若干層通過計算輸入輸出連接起來,組成一個網絡,data.py用來讀取數據,loss.py明確了交叉熵損失函數和其導數,activation.py分別寫了激活函數relu和sigmoid以及其導函數,train.py創建了層次并組成網絡,然后對數據進行訓練并保存模型,最后evaluate.py用于對測試集進行測試。
網絡分為2大塊,正向傳播和反向傳播:
但是不管是正向還是反向,網絡中的每一層都可以抽象出來,因此創建一個layer類:
正向傳播的L層:
反向傳播的L層:
在寫代碼之前,最重要的是確定每個變量和參數的維度:
正向傳播:
注意:n[L]表示當前層(即第L層)中的神經元個數,n[L-1]表示前一層(即L-1層)的神經元個數,例如在本次程序中,n[0]=12288,n[1]=1000,n[2]=500,n[3]=1
反向傳播:
1. data.py
# coding: utf-8
# 2019/7/20 18:59
import h5py
import numpy as np
def get_train():
    """Load the training images and labels from the cat/non-cat HDF5 file.

    Returns:
        A tuple ``(x_train, y_train)`` of NumPy arrays copied from the
        ``train_set_x`` and ``train_set_y`` datasets of the file.
    """
    # The context manager closes the HDF5 handle as soon as both datasets
    # have been copied into memory; np.array() materialises the data, so the
    # returned arrays stay valid after the file is closed.
    with h5py.File('dataset/train_catvnoncat.h5', 'r') as f:
        x_train = np.array(f['train_set_x'])  # training samples
        y_train = np.array(f['train_set_y'])  # training labels
    return x_train, y_train
def get_test():
    """Load the test images and labels from the cat/non-cat HDF5 file.

    Returns:
        A tuple ``(x_test, y_test)`` of NumPy arrays copied from the
        ``test_set_x`` and ``test_set_y`` datasets of the file.
    """
    # The context manager closes the HDF5 handle as soon as both datasets
    # have been copied into memory; np.array() materialises the data, so the
    # returned arrays stay valid after the file is closed.
    with h5py.File('dataset/test_catvnoncat.h5', 'r') as f:
        x_test = np.array(f['test_set_x'])  # test samples
        y_test = np.array(f['test_set_y'])  # test labels
    return x_test, y_test
def preprocess(X):
    """Flatten every sample into one column of a 2-D matrix.

    Args:
        X: Array whose first axis indexes the samples, e.g. shape
            ``(m, 64, 64, 3)``. Any number of trailing axes is accepted.

    Returns:
        Array of shape ``(features, m)`` where ``features`` is the product
        of the trailing dimensions, e.g. ``(12288, m)`` for the shape above.
        Column ``j`` holds the flattened sample ``X[j]``.
    """
    # NOTE: scaling the pixel values from 0-255 down to 0-1 (X / 255) is not
    # applied here; the values are passed through unchanged.
    # The feature count is computed explicitly (instead of using -1) so that
    # an input with zero samples still reshapes cleanly.
    n_features = int(np.prod(X.shape[1:]))
    # Transpose so that samples run along axis 1, one column per sample.
    return X.reshape(X.shape[0], n_features).T
if __name__ == '__main__':
    # Manual smoke test: print the array shapes, then preview a few samples.
    train_x, train_y = get_train()
    test_x, test_y = get_test()
    for samples, labels in ((train_x, train_y), (test_x, test_y)):
        print(samples.shape, labels.shape)

    from matplotlib import pyplot as plt

    plt.figure()
    # Samples 1..15 fill a 3x5 grid; the subplot position is 1-based and is
    # reused as the sample index.
    for idx in range(1, 16):
        plt.subplot(3, 5, idx)
        plt.imshow(train_x[idx])
        print(train_y[idx])
    plt.show()
2. layer.py
# coding: utf-8
# 2019/7/21 9:22
import numpy as np
class Layer:
    """A single fully connected layer with its own gradient-descent step."""

    def __init__(self, nL, nL_1, activ, activ_deri, learning_rate):
        """Create the layer and randomly initialise its parameters.

        Args:
            nL: Number of neurons in this layer.
            nL_1: Number of neurons in the previous layer.
            activ: Activation function applied to the pre-activation Z.
            activ_deri: Derivative of the activation function, evaluated at Z.
            learning_rate: Step size used when updating W and b.
        """
        self.nL, self.nL_1 = nL, nL_1
        self.g, self.g_d = activ, activ_deri
        self.alpha = learning_rate
        # W is drawn before b so the random stream is consumed in a fixed order.
        self.W = 0.01 * np.random.randn(nL, nL_1)
        self.b = 0.01 * np.random.randn(nL, 1)

    def forward(self, AL_1):
        """Run the forward pass: Z = W.A_prev + b, then A = g(Z).

        The input and Z are cached on the instance for use by ``backward``.

        Args:
            AL_1: Activations of the previous layer; first dimension must
                equal ``nL_1``.

        Returns:
            The activations of this layer, ``g(Z)``.
        """
        self.AL_1 = AL_1
        assert AL_1.shape[0] == self.nL_1
        pre_activation = self.W.dot(AL_1) + self.b
        self.Z = pre_activation
        assert pre_activation.shape[0] == self.nL
        return self.g(pre_activation)

    def backward(self, dAL):
        """Run the backward pass and apply one gradient-descent update.

        Args:
            dAL: Gradient of the cost with respect to this layer's
                activations; first dimension must equal ``nL`` and the
                second dimension is taken as the number of samples.

        Returns:
            The gradient with respect to the previous layer's activations.
        """
        assert dAL.shape[0] == self.nL
        n_samples = dAL.shape[1]

        grad_z = dAL * self.g_d(self.Z)
        assert grad_z.shape[0] == self.nL

        grad_w = grad_z.dot(self.AL_1.T) / n_samples
        assert grad_w.shape == (self.nL, self.nL_1)

        grad_b = grad_z.mean(axis=1, keepdims=True)
        assert grad_b.shape == (self.nL, 1)

        # Computed with the weights as they were during the forward pass,
        # i.e. before the update below touches them.
        grad_prev = self.W.T.dot(grad_z)
        assert grad_prev.shape[0] == self.nL_1

        # Gradient descent, in place.
        self.W -= self.alpha * grad_w
        self.b -= self.alpha * grad_b
        return grad_prev
3. network.py
# coding: utf-8
# 2019/7/21 10:45
import numpy as np
class Network:
    """Chains a sequence of layers into a trainable feed-forward network."""

    def __init__(self, layers, loss, loss_der):
        """Store the layers and the loss function with its derivative.

        Args:
            layers: Ordered sequence of layer objects exposing ``forward``
                and ``backward``.
            loss: Callable ``loss(Y, Y_predict)`` returning per-element losses.
            loss_der: Callable ``loss_der(Y, Y_predict)`` returning the
                gradient fed into the last layer's ``backward``.
        """
        self.layers, self.loss, self.loss_der = layers, loss, loss_der

    def predict(self, X):
        """Feed ``X`` through every layer in order and return the output."""
        activation = X
        for stage in self.layers:
            activation = stage.forward(activation)
        return activation

    def train(self, X, Y, epochs=10):
        """Train on the full batch ``(X, Y)`` for ``epochs`` iterations.

        Each epoch:
          1. runs a forward pass to obtain the prediction,
          2. prints the mean loss against ``Y``,
          3. seeds back-propagation with the loss derivative,
          4. walks the layers last-to-first; each ``backward`` call returns
             the gradient handed to the layer before it.
        """
        for epoch in range(epochs):
            output = self.predict(X)
            cost = np.mean(self.loss(Y, output))
            print('epoch %d:loss=%f' % (epoch, cost))

            grad = self.loss_der(Y, output)
            for stage in reversed(self.layers):
                grad = stage.backward(grad)
4. loss.py
# coding: utf-8
# 2019/7/21 11:34
import numpy as np
def cross_entropy(y, y_predict):
    """Return the element-wise binary cross-entropy loss.

    Args:
        y: True labels.
        y_predict: Predicted probabilities.

    Returns:
        ``-(y*log(p) + (1-y)*log(1-p))`` evaluated element-wise, where ``p``
        is ``y_predict`` clipped to ``[1e-10, 1 - 1e-10]``.
    """
    eps = 1e-10
    # Clipping keeps log() away from 0, which would otherwise produce
    # 0 * log(0) and turn the result into NaN.
    clipped = np.clip(y_predict, eps, 1 - eps)
    positive_term = y * np.log(clipped)
    negative_term = (1 - y) * np.log(1 - clipped)
    return -(positive_term + negative_term)
def cross_entropy_der(y, y_predict):
    """Return the derivative of the binary cross-entropy w.r.t. the prediction.

    Args:
        y: True labels.
        y_predict: Predicted probabilities.

    Returns:
        ``-y/p + (1-y)/(1-p)`` evaluated element-wise, where ``p`` is
        ``y_predict`` clipped to ``[1e-10, 1 - 1e-10]``.
    """
    # Clip with the same bounds cross_entropy uses: a prediction that
    # saturates at exactly 0 or 1 would otherwise divide by zero and inject
    # inf/NaN into back-propagation.
    y_predict = np.clip(y_predict, 1e-10, 1 - 1e-10)
    return -y / y_predict + (1 - y) / (1 - y_predict)
5. activation.py
# coding: utf-8
# 2019/7/21 9:49
import numpy as np
def sigmoid(z):
    """Return the logistic sigmoid ``1 / (1 + exp(-z))`` of ``z``."""
    denominator = 1 + np.exp(-z)
    return 1 / denominator
def sigmoid_der(z):
    """Return the derivative of the logistic sigmoid evaluated at ``z``.

    The derivative is ``exp(-z) / (1 + exp(-z))**2``. It is an even function
    of ``z``, so it is evaluated at ``-|z|``.
    """
    # exp(-|z|) always lies in (0, 1]. Using exp(-z) directly overflows to
    # inf for large negative z and the quotient inf/inf becomes NaN.
    x = np.exp(-np.abs(z))
    return x / ((1 + x) ** 2)
def relu(z):
    """Return the rectified linear unit ``max(0, z)``, element-wise."""
    return np.maximum(0, z)
def relu_der(z):
    """Return the ReLU derivative: 1.0 where ``z >= 0`` and 0.0 elsewhere.

    The result is a float64 array; the value at exactly 0 is taken as 1.
    """
    non_negative = z >= 0
    return non_negative.astype(np.float64)
6. train.py
# coding: utf-8
# 2019/7/21 12:13
import data,layer,loss,network,activation
import pickle,time
# Train on the training set and save the model:
# 1. build the three layers
# 2. assemble the three layers into a network
# 3. load the training data
# 4. preprocess the input X
# 5. train the network for 1000 epochs
# 6. pickle the whole model
if __name__ == '__main__':
    import os

    # Create the output directory up front so that a missing folder is
    # detected before training starts rather than after it has finished.
    os.makedirs('models', exist_ok=True)

    learning_rate = 0.01
    L1 = layer.Layer(1000, 64*64*3, activation.relu, activation.relu_der, learning_rate)
    L2 = layer.Layer(500, 1000, activation.relu, activation.relu_der, learning_rate)
    L3 = layer.Layer(1, 500, activation.sigmoid, activation.sigmoid_der, learning_rate)
    net = network.Network([L1, L2, L3], loss.cross_entropy, loss.cross_entropy_der)

    X, Y = data.get_train()
    X = data.preprocess(X)
    net.train(X, Y, 1000)

    # The file name embeds the current time; ':' and ' ' are replaced so the
    # name is valid on every file system.
    timestamp = time.asctime().replace(':', '_').replace(' ', '-')
    with open('models/model_%s.pickle' % timestamp, 'wb') as f:
        pickle.dump(net, f)
7. evaluate.py
# coding: utf-8
# 2019/7/21 14:17
import data
import pickle
import numpy as np
if __name__ == '__main__':
    model_name = 'model_Sun-Jul-21-14_41_42-2019.pickle'
    # Load the trained model.
    # NOTE: pickle.load can execute arbitrary code embedded in the file;
    # only load model files that were produced locally by train.py.
    with open('models/'+model_name, 'rb') as f:
        net = pickle.load(f)
    # Load and preprocess the test set.
    X, Y = data.get_test()
    X = data.preprocess(X)
    # Predict, then threshold the outputs at 0.5 to obtain 0/1 labels.
    Y_predict = net.predict(X)
    Y_pred_float = (Y_predict > 0.5).astype(np.float64)
    # Accuracy = matching predictions / number of labels. np.sum counts the
    # True entries of the boolean array directly; the former cast through
    # np.int fails on NumPy >= 1.24, where that alias no longer exists.
    accuracy = np.sum(np.equal(Y_pred_float, Y)) / Y.shape[0]
    print('accuracy:', accuracy)
結(jié)果
看完上述內容,你們對python搭建多層神經網絡大概了解了嗎?如果想了解更多相關文章內容,歡迎關注創新互聯行業資訊頻道,感謝各位的閱讀!
另外有需要云服務器可以了解下創新互聯cdcxhl.cn,海內外云服務器15元起步,三天無理由+7*72小時售后在線,公司持有idc許可證,提供“云服務器、裸金屬服務器、高防服務器、香港服務器、美國服務器、虛擬主機、免備案服務器”等云主機租用服務以及企業上云的綜合解決方案,具有“安全穩定、簡單易用、服務可用性高、性價比高”等特點與優勢,專為企業上云打造定制,能夠滿足用戶豐富、多元化的應用場景需求。