Python利用三層神經網絡實現手寫數字分類詳解

Posted on 2021-11-30 by WalkonNet

前言

本文基於三層神經網絡實現手寫數字分類。神經網絡設計是設計複雜深度學習算法應用的基礎，本文將介紹如何設計一個三層神經網絡模型，並利用高級編程語言Python搭建神經網絡的訓練和推斷框架，來實現手寫數字分類的訓練和使用。

本文實驗文檔下載

一、神經網絡組成

一個完整的神經網絡通常由多個基本的網絡層堆疊而成。本實驗中的三層全連接神經網絡由三個全連接層構成，在每兩個全連接層之間會插入ReLU激活函數引入非線性變換，最後使用Softmax層計算交叉熵損失，如下圖所示。因此本實驗中使用的基本單元包括全連接層、ReLU激活函數、Softmax損失函數。

二、代碼實現

1.引入庫

import numpy as np
import struct
import os

2.導入數據集

# Directory holding the MNIST IDX files; joined with the file names below
# when the data set is loaded.
MNIST_DIR = "mnist_data"
# Training images and their labels.
TRAIN_DATA = "train-images-idx3-ubyte"
TRAIN_LABEL = "train-labels-idx1-ubyte"
# Test images and their labels.
TEST_DATA = "t10k-images-idx3-ubyte"
TEST_LABEL = "t10k-labels-idx1-ubyte"

數據集鏈接

數據集下載後一定記得解壓

3.全連接層

class FullyConnectedLayer(object):
    """Fully connected (affine) layer: ``output = input @ weight + bias``.

    ``weight`` has shape (num_input, num_output) and ``bias`` has shape
    (1, num_output); both are created by :meth:`init_param`.
    """

    def __init__(self, num_input, num_output):
        """Record the layer dimensions; parameters are allocated later."""
        self.num_input = num_input
        self.num_output = num_output

    def init_param(self, std=0.01):
        """Draw weights from N(0, std**2) and set the bias to zeros."""
        self.weight = np.random.normal(loc=0, scale=std, size=(self.num_input, self.num_output))
        self.bias = np.zeros([1, self.num_output])

    def forward(self, input):
        """Compute the affine transform and cache ``input`` for backward().

        ``input`` is a 2-D array whose second dimension is num_input; the
        (1, num_output) bias is broadcast over the rows.
        """
        self.input = input
        self.output = np.dot(self.input, self.weight) + self.bias
        return self.output

    def backward(self, top_diff):
        """Compute parameter gradients and return the gradient w.r.t. the input.

        ``top_diff`` is the gradient of the loss w.r.t. this layer's output
        and has the same shape as that output.
        """
        self.d_weight = np.dot(self.input.T, top_diff)
        # The bias is shared by every row of the batch, so its gradient is the
        # sum over the batch axis. Keeping the (1, num_output) shape stops
        # update_param() from broadcasting the bias into a per-row matrix.
        self.d_bias = np.sum(top_diff, axis=0, keepdims=True)
        bottom_diff = np.dot(top_diff, self.weight.T)
        return bottom_diff

    def update_param(self, lr):
        """Apply one gradient-descent step with learning rate ``lr``."""
        self.weight = self.weight - lr * self.d_weight
        self.bias = self.bias - lr * self.d_bias

    def load_param(self, weight, bias):
        """Replace the parameters; shapes must match the current ones."""
        assert self.weight.shape == weight.shape
        assert self.bias.shape == bias.shape
        self.weight = weight
        self.bias = bias

    def save_param(self):
        """Return the ``(weight, bias)`` pair."""
        return self.weight, self.bias

4.ReLU激活函數層

class ReLULayer(object):
    """Element-wise ReLU activation: ``max(x, 0)``."""

    def forward(self, input):
        """Return ``max(input, 0)`` and cache ``input`` for backward()."""
        self.input = input
        output = np.maximum(self.input, 0)
        return output

    def backward(self, top_diff):
        """Pass ``top_diff`` through where the cached input was positive.

        The gradient is zero wherever the input was <= 0.
        """
        # Build a fresh boolean mask instead of writing 0/1 into self.input:
        # that array belongs to the caller (it is whatever was passed to
        # forward()), so mutating it in place would corrupt the caller's data.
        mask = self.input > 0
        bottom_diff = np.multiply(mask, top_diff)
        return bottom_diff

5.Softmax損失層

class SoftmaxLossLayer(object):
    """Softmax activation combined with the cross-entropy loss."""

    def forward(self, input):
        """Return row-wise softmax probabilities for a (batch, classes) array.

        The row maximum is subtracted before exponentiation so that large
        scores do not overflow.
        """
        input_max = np.max(input, axis=1, keepdims=True)
        input_exp = np.exp(input - input_max)
        # keepdims makes the normaliser broadcast for any number of classes
        # (the class count is no longer hard-coded).
        exp_total = np.sum(input_exp, axis=1, keepdims=True)
        self.prob = input_exp / exp_total
        return self.prob

    def get_loss(self, label):
        """Return the mean cross-entropy of the last forward() result.

        ``label`` holds one integer class index per row. The one-hot labels
        and the batch size are cached for backward().
        """
        self.batch_size = self.prob.shape[0]
        rows = np.arange(self.batch_size)
        self.label_onehot = np.zeros_like(self.prob)
        self.label_onehot[rows, label] = 1.0
        # Take the log of the target-class probabilities only. Multiplying
        # the full log-probability matrix by the one-hot mask yields
        # 0 * -inf = nan whenever a non-target probability underflows to 0.
        loss = -np.sum(np.log(self.prob[rows, label])) / self.batch_size
        return loss

    def backward(self):
        """Return the loss gradient w.r.t. the softmax input.

        Requires forward() and get_loss() to have been called first.
        """
        bottom_diff = (self.prob - self.label_onehot) / self.batch_size
        return bottom_diff

6.網絡訓練與推斷模塊

class MNIST_MLP(object):
    """Three-layer fully connected network for MNIST digit classification.

    Typical use: load_data() -> build_model() -> init_model() -> train()
    -> save_model() / load_model() -> evaluate().
    """

    def __init__(self, batch_size=64, input_size=784, hidden1=32, hidden2=16, out_classes=10, lr=0.01, max_epoch=1,print_iter=100):
        """Store the hyper-parameters; no data or layers are created here."""
        self.batch_size = batch_size
        self.input_size = input_size
        self.hidden1 = hidden1
        self.hidden2 = hidden2
        self.out_classes = out_classes
        self.lr = lr
        self.max_epoch = max_epoch
        self.print_iter = print_iter

    def shuffle_data(self):
        """Shuffle the rows of the training set in place."""
        np.random.shuffle(self.train_data)

    def build_model(self):
        """Create the layers: FC -> ReLU -> FC -> ReLU -> FC -> softmax loss."""
        self.fc1 = FullyConnectedLayer(self.input_size, self.hidden1)
        self.relu1 = ReLULayer()
        self.fc2 = FullyConnectedLayer(self.hidden1, self.hidden2)
        self.relu2 = ReLULayer()
        self.fc3 = FullyConnectedLayer(self.hidden2, self.out_classes)
        self.softmax = SoftmaxLossLayer()
        # Only the fully connected layers carry trainable parameters.
        self.update_layer_list = [self.fc1, self.fc2, self.fc3]

    def init_model(self):
        """Initialise the parameters of every trainable layer."""
        for layer in self.update_layer_list:
            layer.init_param()

    def forward(self, input):
        """Run the forward pass and return the class probabilities."""
        h1 = self.fc1.forward(input)
        h1 = self.relu1.forward(h1)
        h2 = self.fc2.forward(h1)
        h2 = self.relu2.forward(h2)
        h3 = self.fc3.forward(h2)
        self.prob = self.softmax.forward(h3)
        return self.prob

    def backward(self):
        """Back-propagate from the softmax loss down to the first layer.

        softmax.get_loss() must have been called for the current batch.
        """
        dloss = self.softmax.backward()
        dh2 = self.fc3.backward(dloss)
        dh2 = self.relu2.backward(dh2)
        dh1 = self.fc2.backward(dh2)
        dh1 = self.relu1.backward(dh1)
        dh1 = self.fc1.backward(dh1)

    def update(self, lr):
        """Apply one gradient step with learning rate ``lr`` to every layer."""
        for layer in self.update_layer_list:
            layer.update_param(lr)

    def load_mnist(self, file_dir, is_images=True):
        """Read an (uncompressed) IDX file into an integer array.

        Args:
            file_dir: path of the IDX file.
            is_images: True for an image file (header: magic, count, rows,
                cols); False for a label file (header: magic, count).

        Returns:
            Array of shape (count, rows * cols) for images, or (count, 1)
            for labels.
        """
        with open(file_dir, 'rb') as bin_file:
            bin_data = bin_file.read()
        if is_images:
            fmt_header = '>iiii'
            _magic, num_images, num_rows, num_cols = struct.unpack_from(fmt_header, bin_data, 0)
        else:
            fmt_header = '>ii'
            _magic, num_images = struct.unpack_from(fmt_header, bin_data, 0)
            num_rows, num_cols = 1, 1
        data_size = num_images * num_rows * num_cols
        # Decode the payload bytes directly instead of unpacking them into a
        # huge tuple of Python ints; astype(int) keeps the default integer
        # dtype that the tuple-based conversion produced.
        raw = np.frombuffer(bin_data, dtype=np.uint8, count=data_size,
                            offset=struct.calcsize(fmt_header))
        mat_data = raw.astype(int).reshape(num_images, num_rows * num_cols)
        return mat_data

    def load_data(self):
        """Load the train/test sets; the label becomes the last column."""
        train_images = self.load_mnist(os.path.join(MNIST_DIR, TRAIN_DATA), True)
        train_labels = self.load_mnist(os.path.join(MNIST_DIR, TRAIN_LABEL), False)
        test_images = self.load_mnist(os.path.join(MNIST_DIR, TEST_DATA), True)
        test_labels = self.load_mnist(os.path.join(MNIST_DIR, TEST_LABEL), False)
        self.train_data = np.append(train_images, train_labels, axis=1)
        self.test_data = np.append(test_images, test_labels, axis=1)

    def load_model(self, param_dir):
        """Load the parameters written by save_model() into the layers."""
        # save_model() stores a dict, which np.save writes as a pickled object
        # array; since NumPy 1.16.3 np.load refuses such files unless
        # allow_pickle=True is passed explicitly.
        # NOTE: unpickling can execute arbitrary code - only load files you trust.
        params = np.load(param_dir, allow_pickle=True).item()
        self.fc1.load_param(params['w1'], params['b1'])
        self.fc2.load_param(params['w2'], params['b2'])
        self.fc3.load_param(params['w3'], params['b3'])

    def save_model(self, param_dir):
        """Save the weights and biases of all three layers with np.save."""
        params = {}
        params['w1'], params['b1'] = self.fc1.save_param()
        params['w2'], params['b2'] = self.fc2.save_param()
        params['w3'], params['b3'] = self.fc3.save_param()
        np.save(param_dir, params)

    def train(self):
        """Train with mini-batch gradient descent for ``max_epoch`` epochs.

        The training set is reshuffled every epoch; a trailing partial batch
        is dropped. The loss is printed every ``print_iter`` batches.
        """
        max_batch = self.train_data.shape[0] // self.batch_size
        for idx_epoch in range(self.max_epoch):
            # Shuffle through self rather than a module-level instance so the
            # class works regardless of what the caller names its object.
            self.shuffle_data()
            for idx_batch in range(max_batch):
                start = idx_batch * self.batch_size
                end = start + self.batch_size
                batch_images = self.train_data[start:end, :-1]
                batch_labels = self.train_data[start:end, -1]
                self.forward(batch_images)
                loss = self.softmax.get_loss(batch_labels)
                self.backward()
                self.update(self.lr)
                if idx_batch % self.print_iter == 0:
                    print('Epoch %d, iter %d, loss: %.6f' % (idx_epoch, idx_batch, loss))

    def evaluate(self):
        """Print the classification accuracy on the test set.

        As before, only whole batches are run through the network. Accuracy
        is averaged over the samples that were actually predicted, so the
        skipped tail no longer counts as a batch of class-0 predictions.
        """
        num_batches = self.test_data.shape[0] // self.batch_size
        num_evaluated = num_batches * self.batch_size
        pred_results = np.zeros([num_evaluated])
        for idx in range(num_batches):
            start = idx * self.batch_size
            end = start + self.batch_size
            prob = self.forward(self.test_data[start:end, :-1])
            pred_results[start:end] = np.argmax(prob, axis=1)
        accuracy = np.mean(pred_results == self.test_data[:num_evaluated, -1])
        print('Accuracy in test set: %f' % accuracy)

7.完整流程

if __name__ == '__main__':
    # Hidden-layer widths and number of training epochs for this run.
    h1 = 128
    h2 = 64
    e = 20
    # The checkpoint name encodes the configuration; it is written after
    # training and read straight back before evaluation.
    model_file = 'mlp-%d-%d-%depoch.npy' % (h1, h2, e)

    mlp = MNIST_MLP(hidden1=h1, hidden2=h2, max_epoch=e)
    mlp.load_data()
    mlp.build_model()
    mlp.init_model()
    mlp.train()
    mlp.save_model(model_file)
    mlp.load_model(model_file)
    mlp.evaluate()

三、代碼debug

pycharm在初次運行時，會在以下代碼報錯：

mlp.load_model('mlp-%d-%d-%depoch.npy' % (h1, h2, e))

ValueError: Object arrays cannot be loaded when allow_pickle=False

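經過上網查看原因後，發現是numpy版本較高引起的：自numpy 1.16.3起，np.load()的allow_pickle參數默認為False，而這裡保存的是一個字典（會以pickle形式寫入的對象數組），讀取時必須允許pickle。更穩妥的做法是在調用處顯式傳入該參數，即 np.load(param_dir, allow_pickle=True).item()，這樣無需修改numpy源碼。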

解決方法：

點擊報錯處，進入源代碼（.py），註釋掉693行：

#if not allow_pickle:
    #raise ValueError("Object arrays cannot be loaded when "
                   #  "allow_pickle=False")
 
    # Now read the actual data.
    if dtype.hasobject:
        # The array contained Python objects. We need to unpickle the data.
        #if not allow_pickle:
            #raise ValueError("Object arrays cannot be loaded when "
                           #  "allow_pickle=False")
        if pickle_kwargs is None:
            pickle_kwargs = {}
        try:
            array = pickle.load(fp, **pickle_kwargs)
        except UnicodeError as err:
            if sys.version_info[0] >= 3:
                # Friendlier error message

四、結果展示

在不改變網絡結構的條件下，我自行調節了一些參數，主要體現在：

if __name__ == '__main__':
    h1, h2, e = 128, 64, 20

class MNIST_MLP(object):
    def __init__(self, batch_size=64, input_size=784, hidden1=32, hidden2=16, out_classes=10, lr=0.01, max_epoch=1,print_iter=100):

為了提高準確率，當然你也可以從其他方面進行修改，以下是我得出的輸出結果：

補充

ValueError: Object arrays cannot be loaded when allow_pickle=False解決方案

在讀.npz文件時報下面錯誤：

# Reproduces the error: listing the archive's member names works, but reading
# the 'data' member raises the ValueError shown in the traceback below.
population_data=np.load("./data/populations.npz")
print(population_data.files)# the archive holds two arrays: data and feature_names
data=population_data['data']
print(data)
print(population_data['feature_names'])

報錯：

['data', 'feature_names']
Traceback (most recent call last):
  File "E:/pycharm file/使用scikit-learn構建模型/構建一元線性模型.py", line 32, in <module>
    data=population_data['data']
  File "E:\pycharm file\venv\lib\site-packages\numpy\lib\npyio.py", line 262, in __getitem__
    pickle_kwargs=self.pickle_kwargs)
  File "E:\pycharm file\venv\lib\site-packages\numpy\lib\format.py", line 692, in read_array
    raise ValueError("Object arrays cannot be loaded when "
ValueError: Object arrays cannot be loaded when allow_pickle=False

報錯為：numpy版本太高，我用的是1.16.3，應該降級為1.16.2

兩種解決方案：

Numpy 1.16.3幾天前發佈了。發行說明中寫道：「函數np.load()和np.lib.format.read_array()採用allow_pickle關鍵字，現在默認為False，以響應CVE-2019-6446 <nvd.nist.gov/vuln/detail/CVE-2019-6446>」。降級到1.16.2對我有幫助，因為錯誤發生在一些library內部。

第一種：點擊報錯處，進入源代碼（.py），註釋掉693行：

#if not allow_pickle:
    #raise ValueError("Object arrays cannot be loaded when "
                   #  "allow_pickle=False")
 
    # Now read the actual data.
    if dtype.hasobject:
        # The array contained Python objects. We need to unpickle the data.
        #if not allow_pickle:
            #raise ValueError("Object arrays cannot be loaded when "
                           #  "allow_pickle=False")
        if pickle_kwargs is None:
            pickle_kwargs = {}
        try:
            array = pickle.load(fp, **pickle_kwargs)
        except UnicodeError as err:
            if sys.version_info[0] >= 3:
                # Friendlier error message

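修改後成功解決了問題，但不建議直接改動numpy源碼：這會讓allow_pickle的安全檢查整體失效，而且升級或重裝numpy後改動就會丟失。如果報錯出現在自己的代碼中，直接在調用處寫 np.load(path, allow_pickle=True) 即可。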

第二種：降級numpy版本

pip install numpy==1.16.2

上述兩種方法都可以成功解決報錯問題

以上就是Python利用三層神經網絡實現手寫數字分類詳解的詳細內容，更多關於Python 的資料請關注WalkonNet其它相關文章！

Python利用三層神經網絡實現手寫數字分類詳解

目錄

前言

一、神經網絡組成

二、代碼實現

1.引入庫

2.導入數據集

3.全連接層

4.ReLU激活函數層

5.Softmax損失層

6.網絡訓練與推斷模塊

三、代碼debug

四、結果展示

補充

推薦閱讀：

發佈留言取消回覆

近期文章

目錄

前言

一、神經網絡組成

二、代碼實現

1.引入庫

2.導入數據集

3.全連接層

4.ReLU激活函數層

5.Softmax損失層

6.網絡訓練與推斷模塊

三、代碼debug

四、結果展示

補充

推薦閱讀：

發佈留言 取消回覆

近期文章

標籤

發佈留言取消回覆