DLSys Lab 1
作业要求
笔记
最最经典的 MNIST 数据集,它来啦。课程组提供了 load_mnist
载入数据集,每个 image
为一个一维数组。在 Codeium 的帮助下,先把数据集打印看看:
import matplotlib.pyplot as plt
if __name__ == "__main__":
path = "./dataset/"
train_images, _ = load_mnist(path, kind="train")
# cmap='gray' displays the image in grayscale
plt.imshow(train_images[1].reshape((28, 28)), cmap="Greys")
plt.show()
课程组提供了 3 层神经网络的实现。
import numpy as np
class LinearLayer:
def __init__(self, input_nodes, output_nodes, bias=True):
self.input_nodes = input_nodes
self.output_nodes = output_nodes
self.weight = np.random.normal(
0.0, pow(self.input_nodes, -0.5), (self.output_nodes, self.input_nodes)
)
if bias:
self.bias = np.zeros((self.output_nodes, 1))
else:
self.bias = None
self.inputs = None # input data
self.outputs = None # output data
self.activation_function = lambda x: 1.0 / (1 + np.exp(-x))
self.reverse_activation_function = lambda x: x * (1.0 - x)
def forward(self, inputs):
self.inputs = inputs
wdi = np.dot(self.weight, self.inputs)
if self.bias is not None:
self.outputs = self.activation_function(wdi + self.bias)
else:
self.outputs = self.activation_function(wdi)
return self.outputs
def backpropagation(self, next_grad, learning_rate):
delta_bias = next_grad * self.reverse_activation_function(self.outputs)
delta_weight = np.dot(delta_bias, np.transpose(self.inputs))
curr_grad = np.dot(self.weight.T, next_grad)
self.weight += learning_rate * delta_weight
if self.bias is not None:
self.bias += learning_rate * delta_bias
return curr_grad
def __repr__(self):
return "<LinearLayer: {}->{}>".format(self.input_nodes, self.output_nodes)
# neural network class
class neuralNetwork:
# initialize the neural network
def __init__(self, layers: tuple, learning_rate=0.1):
"""
The network consists of three layers: input layer, hidden layer and output layer.
Here defined these layers.
:param input_nodes: dimension of input
:param hidden_layers: tuple of dimension of hidden nodes
:param output_nodes: dimension of output
:param learning_rate: the learning rate of neural network
"""
print("init neural network")
self.input_nodes = layers[0]
self.output_nodes = layers[-1]
# Some parameters that will be used next
self.lr = learning_rate # learning rate
# init layers
self.layers: list[LinearLayer] = []
for i in range(1, len(layers)):
self.layers.append(LinearLayer(layers[i - 1], layers[i]))
print(self.layers)
def forward(self, input_feature):
"""
Forward the neural network
:param input_feature: single input image, flattened [784, ]
"""
# convert inputs list to 2d array
prev_output = np.array(input_feature, ndmin=2).T
for layer in self.layers:
prev_output = layer.forward(prev_output)
self.final_outputs = prev_output
def backpropagation(self, targets_list):
"""
Propagate backwards
:param targets_list: output onehot code of a single image, [10, ]
"""
targets = np.array(targets_list, ndmin=2).T
# loss
loss = np.sum(np.square(self.final_outputs - targets)) / 2
# output layer error is the (final_outputs - target)
output_loss = targets - self.final_outputs
# backpropagation through the output layer
for i in range(len(self.layers) - 1, -1, -1):
output_loss = self.layers[i].backpropagation(output_loss, self.lr)
return np.sum((targets - self.final_outputs) ** 2)