import numpy as np
from utils.features import prepare_for_training
from utils.hypothesis import sigmoid, sigmoid_gradient
class MultilayerPerceptron:
    """Fully-connected feed-forward neural network with sigmoid activations.

    ``layers`` lists the unit counts per layer, e.g. ``[784, 25, 10]`` for
    MNIST: 784 inputs, one hidden layer of 25 units, 10 output classes.
    Weights are kept as a dict ``{layer_index: matrix}`` where each matrix is
    ``(out_count, in_count + 1)`` — the ``+1`` column is the bias term.
    Training is plain batch gradient descent over the cross-entropy cost.
    """

    def __init__(self, data, labels, layers, normalize_data=False):
        """Preprocess the data and randomly initialize the weight matrices.

        data           -- (num_examples, num_features) raw feature matrix
        labels         -- (num_examples, 1) integer class labels
        layers         -- layer sizes, e.g. [784, 25, 10]
        normalize_data -- forwarded to prepare_for_training
        """
        # prepare_for_training returns (processed_data, ...); we only need
        # the processed matrix (it prepends the bias column of ones).
        data_processed = prepare_for_training(data, normalize_data=normalize_data)[0]
        self.data = data_processed
        self.labels = labels
        self.layers = layers  # e.g. 784 / 25 / 10
        self.normalize_data = normalize_data
        self.thetas = MultilayerPerceptron.thetas_init(layers)

    def predict(self, data):
        """Return the predicted class index for each example, shape (num_examples, 1)."""
        data_processed = prepare_for_training(data, normalize_data=self.normalize_data)[0]
        num_examples = data_processed.shape[0]
        predictions = MultilayerPerceptron.feedforward_propagation(
            data_processed, self.thetas, self.layers)
        # The class with the highest output activation wins.
        return np.argmax(predictions, axis=1).reshape((num_examples, 1))

    def train(self, max_iterations=1000, alpha=0.1):
        """Run gradient descent; returns (trained thetas dict, cost history list).

        max_iterations -- number of gradient-descent steps
        alpha          -- learning rate
        """
        unrolled_theta = MultilayerPerceptron.thetas_unroll(self.thetas)
        (optimized_theta, cost_history) = MultilayerPerceptron.gradient_descent(
            self.data, self.labels, unrolled_theta, self.layers, max_iterations, alpha)
        self.thetas = MultilayerPerceptron.thetas_roll(optimized_theta, self.layers)
        return self.thetas, cost_history

    @staticmethod
    def thetas_init(layers):
        """Randomly initialize one weight matrix per layer transition.

        For layers [784, 25, 10] this produces two matrices: 25x785 and 10x26
        (the extra column per matrix holds the bias weights — one bias per
        output unit). Values are kept small (uniform in [0, 0.05)).
        """
        num_layers = len(layers)
        thetas = {}
        for layer_index in range(num_layers - 1):
            in_count = layers[layer_index]
            out_count = layers[layer_index + 1]
            # +1 accounts for the bias term; bias count matches the output count.
            thetas[layer_index] = np.random.rand(out_count, in_count + 1) * 0.05
        return thetas

    @staticmethod
    def thetas_unroll(thetas):
        """Flatten the dict of weight matrices into a single 1-D vector."""
        num_theta_layers = len(thetas)
        unrolled_theta = np.array([])
        for theta_layer_index in range(num_theta_layers):
            unrolled_theta = np.hstack((unrolled_theta, thetas[theta_layer_index].flatten()))
        return unrolled_theta

    @staticmethod
    def gradient_descent(data, labels, unrolled_theta, layers, max_iterations, alpha):
        """Batch gradient descent on the unrolled parameter vector.

        Returns (optimized unrolled theta, list of cost values per iteration).
        """
        optimized_theta = unrolled_theta
        cost_history = []
        for _ in range(max_iterations):
            cost = MultilayerPerceptron.cost_function(
                data, labels,
                MultilayerPerceptron.thetas_roll(optimized_theta, layers), layers)
            cost_history.append(cost)
            theta_gradient = MultilayerPerceptron.gradient_step(data, labels, optimized_theta, layers)
            optimized_theta = optimized_theta - alpha * theta_gradient
        return optimized_theta, cost_history

    @staticmethod
    def gradient_step(data, labels, optimized_theta, layers):
        """Compute one unrolled gradient vector via back-propagation."""
        theta = MultilayerPerceptron.thetas_roll(optimized_theta, layers)
        thetas_rolled_gradients = MultilayerPerceptron.back_propagation(data, labels, theta, layers)
        thetas_unrolled_gradients = MultilayerPerceptron.thetas_unroll(thetas_rolled_gradients)
        return thetas_unrolled_gradients

    @staticmethod
    def back_propagation(data, labels, thetas, layers):
        """Back-propagation over all examples; returns per-layer gradient matrices.

        data   -- (num_examples, num_features) matrix; assumes the first column
                  is the bias feature added by prepare_for_training
        labels -- (num_examples, 1) integer class labels
        thetas -- dict of weight matrices as produced by thetas_init
        """
        num_layers = len(layers)
        (num_examples, num_features) = data.shape
        num_label_types = layers[-1]
        deltas = {}
        # Accumulators, one per weight matrix (e.g. 25x785 and 10x26).
        for layer_index in range(num_layers - 1):
            in_count = layers[layer_index]
            out_count = layers[layer_index + 1]
            deltas[layer_index] = np.zeros((out_count, in_count + 1))
        for example_index in range(num_examples):
            layers_inputs = {}
            layers_activations = {}
            # Column vector for this example, bias included (e.g. 785x1).
            layers_activation = data[example_index, :].reshape((num_features, 1))
            layers_activations[0] = layers_activation
            # Forward pass, layer by layer.
            for layer_index in range(num_layers - 1):
                layer_theta = thetas[layer_index]  # current weights: 25x785, then 10x26
                layer_input = np.dot(layer_theta, layers_activation)  # 25x1, then 10x1
                # Prepend the bias unit to the activated output.
                layers_activation = np.vstack((np.array([[1]]), sigmoid(layer_input)))
                layers_inputs[layer_index + 1] = layer_input          # pre-activation
                layers_activations[layer_index + 1] = layers_activation  # post-activation
            # Drop the bias unit from the final activation to get the prediction.
            output_layer_activation = layers_activation[1:, :]
            delta = {}
            # One-hot encode this example's label.
            bitwise_label = np.zeros((num_label_types, 1))
            bitwise_label[labels[example_index][0]] = 1
            # Output-layer error: prediction minus ground truth.
            delta[num_layers - 1] = output_layer_activation - bitwise_label
            # Propagate the error backwards through layers L-1, L-2, ..., 2.
            for layer_index in range(num_layers - 2, 0, -1):
                layer_theta = thetas[layer_index]
                next_delta = delta[layer_index + 1]
                layer_input = layers_inputs[layer_index]
                # Prepend a bias entry so shapes line up with layer_theta.T.
                layer_input = np.vstack((np.array((1)), layer_input))
                delta[layer_index] = np.dot(layer_theta.T, next_delta) * sigmoid_gradient(layer_input)
                # Strip the bias row — it carries no error.
                delta[layer_index] = delta[layer_index][1:, :]
            # Accumulate this example's contribution to each gradient matrix.
            for layer_index in range(num_layers - 1):
                layer_delta = np.dot(delta[layer_index + 1], layers_activations[layer_index].T)
                deltas[layer_index] = deltas[layer_index] + layer_delta  # 25x785, then 10x26
        # Average over all examples.
        for layer_index in range(num_layers - 1):
            deltas[layer_index] = deltas[layer_index] * (1 / num_examples)
        return deltas

    @staticmethod
    def cost_function(data, labels, thetas, layers):
        """Cross-entropy cost of the current thetas over the whole data set."""
        num_layers = len(layers)
        num_examples = data.shape[0]
        num_labels = layers[-1]
        # Forward pass to get the predicted probabilities.
        predictions = MultilayerPerceptron.feedforward_propagation(data, thetas, layers)
        # One-hot encode every label.
        bitwise_labels = np.zeros((num_examples, num_labels))
        for example_index in range(num_examples):
            bitwise_labels[example_index][labels[example_index][0]] = 1
        bit_set_cost = np.sum(np.log(predictions[bitwise_labels == 1]))
        bit_not_set_cost = np.sum(np.log(1 - predictions[bitwise_labels == 0]))
        cost = (-1 / num_examples) * (bit_set_cost + bit_not_set_cost)
        return cost

    @staticmethod
    def feedforward_propagation(data, thetas, layers):
        """Forward pass for a whole batch; returns (num_examples, num_labels) outputs."""
        num_layers = len(layers)
        num_examples = data.shape[0]
        in_layer_activation = data
        # Layer by layer.
        for layer_index in range(num_layers - 1):
            theta = thetas[layer_index]
            out_layer_activation = sigmoid(np.dot(in_layer_activation, theta.T))
            # The raw result is num_examples x 25; prepend the bias column
            # to make it num_examples x 26 for the next layer.
            out_layer_activation = np.hstack((np.ones((num_examples, 1)), out_layer_activation))
            in_layer_activation = out_layer_activation
        # Return the output layer without its bias column.
        return in_layer_activation[:, 1:]

    @staticmethod
    def thetas_roll(unrolled_thetas, layers):
        """Inverse of thetas_unroll: reshape the flat vector back into matrices.

        NOTE(review): the original source was truncated here (the line ended in
        an undefined name `theta`); this body is reconstructed as the exact
        mirror of thetas_unroll/thetas_init and verified by round-trip.
        """
        num_layers = len(layers)
        thetas = {}
        unrolled_shift = 0
        for layer_index in range(num_layers - 1):
            in_count = layers[layer_index]
            out_count = layers[layer_index + 1]
            thetas_width = in_count + 1
            thetas_height = out_count
            thetas_volume = thetas_width * thetas_height
            start_index = unrolled_shift
            end_index = unrolled_shift + thetas_volume
            layer_theta_unrolled = unrolled_thetas[start_index:end_index]
            thetas[layer_index] = layer_theta_unrolled.reshape((thetas_height, thetas_width))
            unrolled_shift = unrolled_shift + thetas_volume
        return thetas
# NOTE(review): removed webpage boilerplate (download-site navigation text)
# that was accidentally captured when this file was extracted; it was not
# part of the program.