BP Neural Network
Overview
- A BP (back propagation) neural network is a concept proposed in 1986 by a group of scientists led by Rumelhart and McClelland: a multi-layer feed-forward neural network trained with the error back-propagation algorithm, and one of the most widely used neural network models. In their influential book "Perceptrons", Minsky and Papert pointed out that a simple perceptron can only solve linear problems, and that a network able to solve nonlinear problems should contain a hidden layer, but at the time there was no sound theoretical basis for a learning rule for the hidden-layer neurons.
Definitions and Principles
- Basic principle: the error at the output is used to estimate the error of the layer directly preceding the output layer; that estimate is then used to estimate the error of the layer before it, and so on recursively back through the network.
- Structure diagram
- Symbol definitions and related operations. Assume the input layer has n neurons, the hidden layer has p neurons, and the output layer has q neurons.
- Input vector \(x = (x_1, x_2, x_3, \dots, x_n)\)
- Hidden-layer input vector \(hi = (hi_1, hi_2, hi_3, \dots, hi_p)\)
- Hidden-layer output vector \(ho = (ho_1, ho_2, ho_3, \dots, ho_p)\)
- Output-layer input vector \(yi = (yi_1, yi_2, yi_3, \dots, yi_q)\)
- Output-layer output vector \(yo = (yo_1, yo_2, yo_3, \dots, yo_q)\)
- Connection weights between the input layer and the hidden layer \(w_{ih}\)
- Connection weights between the hidden layer and the output layer \(w_{ho}\)
- Thresholds of the hidden-layer neurons \(b_h\)
- Thresholds of the output-layer neurons \(b_o\)
- Training-sample index \(k = 1, 2, 3, \dots, m\) (m samples in total)
- Desired output vector \(d = (d_1, d_2, d_3, \dots, d_q)\)
- Error function \(e=\frac{1}{2} \sum_{o=1}^{q} (d_o(k) - yo_o(k))^2\) (for the k-th input sample)
- Activation function \(f(x)\)
- Momentum factor: when a BP network is trained in batch mode it can get stuck in a local minimum; adding a momentum factor to the weight update helps the back-propagated error signal set the neuron weights moving again so that the network can escape it (see the weight-correction sketch in the derivation below).
- Bias node: a bias node captures an offset that the training data's features alone cannot express. Because the weight from the bias node to each node of the next layer is different, the bias contributes a different offset to each node, so the bias can be regarded as a property of every node except those in the input layer. A sketch of the usual constant-1 implementation follows this list.
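In practice the bias node is usually implemented by appending a constant input of 1 and letting its outgoing weights play the role of the thresholds. A minimal NumPy sketch under that assumption (the sizes and names are illustrative, not part of the definitions):

```python
import numpy as np

n, p = 4, 3                       # example layer sizes (assumption)
rng = np.random.default_rng(0)
x = rng.random(n)                 # original input vector
w = rng.random((n + 1, p)) - 0.5  # weights; the last row belongs to the bias node

x_with_bias = np.append(x, 1.0)   # bias node: constant output of 1
hi = x_with_bias @ w              # equivalent to x @ w[:n] + w[n]
# the row w[n] plays the role of -b_h: it shifts each hidden neuron's net input
```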
- Derivation
- Randomly select the k-th input sample and its corresponding desired output:
\[\displaylines{ x(k) = \{x_1(k), x_2(k), x_3(k), \dots, x_n(k)\} \\ d(k) = \{d_1(k), d_2(k), d_3(k), \dots, d_q(k)\} } \]
- Compute the input and output of each neuron in the hidden layer and the output layer (a NumPy sketch follows the equations):
\[\displaylines{ hi_h(k)=\sum_{i=1}^n w_{ih}\, x_i(k)-b_h \quad h=1,2, \cdots, p \\ ho_h(k)=f\left(hi_h(k)\right) \quad h=1,2, \cdots, p \\ yi_o(k)=\sum_{h=1}^p w_{ho}\, ho_h(k)-b_o \quad o=1,2, \cdots, q \\ yo_o(k)=f\left(yi_o(k)\right) \quad o=1,2, \cdots, q } \]
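A minimal sketch of this forward computation, assuming a sigmoid for \(f\); the layer sizes, random data and array names are placeholders:

```python
import numpy as np


def f(z):
    # activation function f (a sigmoid is assumed here)
    return 1.0 / (1.0 + np.exp(-z))


n, p, q = 4, 3, 2                    # example layer sizes (assumptions)
rng = np.random.default_rng(0)
x_k = rng.random(n)                  # x(k): the k-th input sample
d_k = rng.random(q)                  # d(k): its desired output
w_ih = rng.random((n, p)) - 0.5      # input-to-hidden weights w_ih
w_ho = rng.random((p, q)) - 0.5      # hidden-to-output weights w_ho
b_h, b_o = np.zeros(p), np.zeros(q)  # thresholds b_h, b_o

hi = x_k @ w_ih - b_h                # hi_h(k) = sum_i w_ih x_i(k) - b_h
ho = f(hi)                           # ho_h(k) = f(hi_h(k))
yi = ho @ w_ho - b_o                 # yi_o(k) = sum_h w_ho ho_h(k) - b_o
yo = f(yi)                           # yo_o(k) = f(yi_o(k))
e = 0.5 * np.sum((d_k - yo) ** 2)    # error function e for the k-th sample
```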
- Using the network's desired output and actual output, compute the partial derivative of the error function e with respect to the output-layer weights (a sketch of the resulting \(\delta_o(k)\) follows):
\[\displaylines{ \frac{\partial e}{\partial w_{ho}}=\frac{\partial e}{\partial yi_o} \frac{\partial yi_o}{\partial w_{ho}} \\ \frac{\partial yi_o(k)}{\partial w_{ho}}=\frac{\partial\left(\sum_{h=1}^p w_{ho}\, ho_h(k)-b_o\right)}{\partial w_{ho}}=ho_h(k) \\ \frac{\partial e}{\partial yi_o}=\frac{\partial\left(\frac{1}{2} \sum_{o=1}^q\left(d_o(k)-yo_o(k)\right)^2\right)}{\partial yi_o}=-\left(d_o(k)-yo_o(k)\right) f'\left(yi_o(k)\right) = -\delta_o(k) } \]
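For a sigmoid activation, \(f'(yi_o) = yo_o(1 - yo_o)\), so \(\delta_o(k)\) can be computed directly from the outputs. A small sketch with placeholder values:

```python
import numpy as np

d_k = np.array([1.0, 0.0])   # desired output d(k) (placeholder)
yo = np.array([0.73, 0.21])  # actual output yo(k) (placeholder)

# delta_o(k) = (d_o(k) - yo_o(k)) * f'(yi_o(k)); for a sigmoid, f'(yi_o) = yo_o * (1 - yo_o)
delta_o = (d_k - yo) * yo * (1.0 - yo)
```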
- Use the \(\delta_o(k)\) of each output-layer neuron and the outputs of the hidden-layer neurons to correct the connection weights \(w_{ho}(k)\), where \(\mu\) is the learning rate (a vectorized sketch, with the momentum term, follows):
\[\displaylines{ \Delta w_{ho}(k) = -\mu \frac{\partial e}{\partial w_{ho}} = \mu\,\delta_o(k)\, ho_h(k) \\ w^{N+1}_{ho} = w^{N}_{ho} + \Delta w_{ho}(k) } \]
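The update for all \(h, o\) at once is an outer product; the momentum factor mentioned earlier is added by reusing the previous update. The learning rate, momentum coefficient and placeholder arrays below are assumptions:

```python
import numpy as np

mu, alpha = 0.1, 0.1               # learning rate and momentum factor (assumptions)
ho = np.array([0.5, 0.8, 0.3])     # hidden-layer outputs ho_h(k) (placeholder, p = 3)
delta_o = np.array([0.05, -0.02])  # output-layer deltas delta_o(k) (placeholder, q = 2)
w_ho = np.zeros((3, 2))            # hidden-to-output weights, shape (p, q)
prev_dw_ho = np.zeros((3, 2))      # previous update, reused by the momentum term

dw_ho = mu * np.outer(ho, delta_o) + alpha * prev_dw_ho  # delta_w_ho(k) = mu * delta_o(k) * ho_h(k) (+ momentum)
w_ho += dw_ho                      # w_ho^(N+1) = w_ho^N + delta_w_ho(k)
prev_dw_ho = dw_ho                 # remembered for the next step's momentum term
```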
- Use the output-layer \(\delta_o(k)\), propagated back through \(w_{ho}\), together with the inputs of the input layer to correct the input-to-hidden connection weights \(w_{ih}(k)\) (a matching sketch follows):
\[\displaylines{ \Delta w_{ih}(k) =-\mu \frac{\partial e}{\partial w_{ih}} =-\mu \sum_{o=1}^{q}\frac{\partial e}{\partial yi_o}\frac{\partial yi_o}{\partial ho_h(k)}\cdot\frac{\partial ho_h(k)}{\partial hi_h(k)}\frac{\partial hi_h(k)}{\partial w_{ih}}\\ \frac{\partial e}{\partial yi_o}= -\delta_o(k),\quad \frac{\partial yi_o}{\partial ho_h(k)} = w_{ho},\quad \frac{\partial ho_h(k)}{\partial hi_h(k)} = f'(hi_h(k)),\quad \frac{\partial hi_h(k)}{\partial w_{ih}} = x_i(k)\\ \text{Let } \delta_h(k) = \Big(\sum_{o=1}^{q}\delta_o(k)\, w_{ho}\Big) f'(hi_h(k))\\ \text{so } \Delta w_{ih}(k)=\mu\,\delta_h(k)\, x_i(k) \\ w_{ih}^{N+1}=w_{ih}^N+\mu\, \delta_h(k)\, x_i(k) } \]
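A matching sketch for the hidden layer, again assuming a sigmoid so that \(f'(hi_h) = ho_h(1 - ho_h)\); all sizes and arrays are placeholders:

```python
import numpy as np

mu = 0.1                              # learning rate (assumption)
x_k = np.array([0.2, 0.9, 0.4, 0.7])  # input sample x(k) (placeholder, n = 4)
ho = np.array([0.5, 0.8, 0.3])        # hidden-layer outputs ho_h(k) (placeholder, p = 3)
w_ho = np.full((3, 2), 0.1)           # hidden-to-output weights, shape (p, q)
delta_o = np.array([0.05, -0.02])     # output-layer deltas delta_o(k) (placeholder, q = 2)
w_ih = np.zeros((4, 3))               # input-to-hidden weights, shape (n, p)

# delta_h(k) = (sum_o delta_o(k) w_ho) * f'(hi_h(k)); for a sigmoid, f'(hi_h) = ho_h * (1 - ho_h)
delta_h = (w_ho @ delta_o) * ho * (1.0 - ho)
w_ih += mu * np.outer(x_k, delta_h)   # w_ih^(N+1) = w_ih^N + mu * delta_h(k) * x_i(k)
```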
P.S.: the chain rule is needed when taking these derivatives.
- Global error over all m samples (a sketch follows the formula):
\[E = \frac{1}{2m}\sum_{k=1}^{m}\sum_{o=1}^{q}(d_o(k) - yo_o(k))^2 \]
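Assuming the desired and actual outputs of all samples are stacked row-wise into arrays, the global error can be computed as below (names and shapes are illustrative):

```python
import numpy as np

m, q = 5, 2                          # number of samples and output neurons (assumption)
rng = np.random.default_rng(0)
D = rng.random((m, q))               # desired outputs d_o(k), one row per sample
YO = rng.random((m, q))              # actual outputs yo_o(k), one row per sample

E = np.sum((D - YO) ** 2) / (2 * m)  # E = (1/2m) * sum_k sum_o (d_o(k) - yo_o(k))^2
```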
Code Template
import numpy as np


def sigmoid(x):
    return 1.0 / (1.0 + np.exp(-x))


def derived_sigmoid(x):
    # derivative of the sigmoid expressed in terms of its output: if x = sigmoid(z), then sigmoid'(z) = x * (1 - x)
    return x * (1 - x)


def make_matrix(m, n, fill=0.0):  # m rows, n columns
    a = []
    for i in range(m):
        a.append([fill] * n)
    return np.array(a)
# neural network class with 4 layers (input, two hidden layers, output)
class neuralNetwork:
    # initialize the neural network
    def __init__(self, input_nodes, hidden_nodes, hidden2_nodes, output_nodes, learning_rate=0.1):
        """
        The network consists of four layers: an input layer, two hidden layers and an output layer.
        These layers are defined here.
        :param input_nodes: dimension of the input
        :param hidden_nodes: dimension of the first hidden layer
        :param hidden2_nodes: dimension of the second hidden layer
        :param output_nodes: dimension of the output
        :param learning_rate: the learning rate of the neural network
        """
        self.x_num = input_nodes + 1  # one extra node for the bias
        self.h_num = hidden_nodes
        self.h2_num = hidden2_nodes
        self.y_num = output_nodes
        # initialize the layer vectors
        self.x_vector = np.array([0.0] * self.x_num)
        self.x_vector[0] = 1.0  # the bias node always outputs 1
        self.hi_vector = np.array([0.0] * self.h_num)
        self.ho_vector = np.array([0.0] * self.h_num)
        self.h2i_vector = np.array([0.0] * self.h2_num)
        self.h2o_vector = np.array([0.0] * self.h2_num)
        self.yi_vector = np.array([0.0] * self.y_num)
        self.yo_vector = np.array([0.0] * self.y_num)
        # initialize the weight matrices
        # input layer -> first hidden layer
        self.weight_xh = np.random.random([self.x_num, self.h_num]) - 0.51
        # first hidden layer -> second hidden layer
        self.weight_hh2 = np.random.random([self.h_num, self.h2_num]) - 0.51
        # second hidden layer -> output layer
        self.weight_h2y = np.random.random([self.h2_num, self.y_num]) - 0.51
        # learning rate
        self.lr = learning_rate
        # previous weight updates, reused by the momentum term
        self.input_correction = make_matrix(self.x_num, self.h_num)
        self.hidden_correction = make_matrix(self.h_num, self.h2_num)
        self.output_correction = make_matrix(self.h2_num, self.y_num)
        # momentum factor
        self.m = 0.1
    def forward(self, input_feature):
        """
        Forward pass of the neural network.
        :param input_feature: a single input image, flattened, [784, ]
        """
        if len(input_feature) != self.x_num - 1:
            raise ValueError("input size does not match the number of input nodes")
        # load the input into the input vector (index 0 is the bias node)
        self.x_vector[1:self.x_num] = input_feature
        # input layer -> first hidden layer
        self.hi_vector = np.dot(self.x_vector, self.weight_xh)
        # activate the first hidden layer
        self.ho_vector = sigmoid(self.hi_vector)
        # first hidden layer -> second hidden layer
        self.h2i_vector = np.dot(self.ho_vector, self.weight_hh2)
        self.h2o_vector = sigmoid(self.h2i_vector)
        # second hidden layer -> output layer
        self.yi_vector = np.dot(self.h2o_vector, self.weight_h2y)
        # activate the output layer
        self.yo_vector = sigmoid(self.yi_vector)
        return self.yo_vector
    def backpropagation(self, targets_list):
        """
        Propagate the error backwards and update the weights.
        :param targets_list: one-hot label of a single image, [10, ]
        """
        if len(targets_list) != self.y_num:
            raise ValueError("number of targets does not match the number of output nodes")
        targets = np.array(targets_list)
        # error for this sample
        error = 0.5 * np.dot((targets - self.yo_vector).T,
                             (targets - self.yo_vector))
        # deltas of the output layer and of the two hidden layers
        delta_h2y = (targets - self.yo_vector) * derived_sigmoid(self.yo_vector)
        delta_hh2 = np.dot(delta_h2y, self.weight_h2y.T) * derived_sigmoid(self.h2o_vector)
        delta_xh = np.dot(delta_hh2, self.weight_hh2.T) * derived_sigmoid(self.ho_vector)
        # update the weights: gradient step plus momentum term
        self.weight_h2y += (self.lr * np.dot(delta_h2y.reshape(-1, 1), self.h2o_vector.reshape(1, -1)).T
                            + self.m * self.output_correction)
        self.weight_hh2 += (self.lr * np.dot(delta_hh2.reshape(-1, 1), self.ho_vector.reshape(1, -1)).T
                            + self.m * self.hidden_correction)
        self.weight_xh += (self.lr * np.dot(delta_xh.reshape(-1, 1), self.x_vector.reshape(1, -1)).T
                           + self.m * self.input_correction)
        # remember the current updates for the momentum term of the next step
        self.output_correction = self.lr * np.dot(delta_h2y.reshape(-1, 1), self.h2o_vector.reshape(1, -1)).T
        self.hidden_correction = self.lr * np.dot(delta_hh2.reshape(-1, 1), self.ho_vector.reshape(1, -1)).T
        self.input_correction = self.lr * np.dot(delta_xh.reshape(-1, 1), self.x_vector.reshape(1, -1)).T
        return error
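A hypothetical usage sketch of the template above, training on random stand-in data with MNIST-like dimensions (784-dimensional inputs, 10-way one-hot targets); the data, epoch count and hidden-layer sizes are placeholders, not part of the template:

```python
import numpy as np

# build a network with two hidden layers (sizes are arbitrary choices)
net = neuralNetwork(input_nodes=784, hidden_nodes=64, hidden2_nodes=32,
                    output_nodes=10, learning_rate=0.1)

# stand-in data: 100 random "images" and random one-hot labels
rng = np.random.default_rng(0)
images = rng.random((100, 784))
labels = np.eye(10)[rng.integers(0, 10, size=100)]

for epoch in range(3):                               # a few passes over the stand-in data
    total_error = 0.0
    for img, target in zip(images, labels):
        net.forward(img)                             # forward pass stores the activations
        total_error += net.backpropagation(target)   # backward pass updates the weights
    print(f"epoch {epoch}: mean error {total_error / len(images):.4f}")
```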