根据《Python 神经网络编程》([英] 塔里克·拉希德(Tariq Rashid)著,中国工信出版社、人民邮电出版社)进行了初步实践,发现该书是入门的不二之选。
环境:
1、IDE:Sublime Text,配合 Python 的相关插件
2、编译运行环境,推荐使用virtualenv沙盒环境
程序
# neural network class definition
import numpy
import scipy.special
import matplotlib.pyplot as plt
class NeuralNetwork:
    """Three-layer (input, hidden, output) feed-forward neural network.

    Both layers use the sigmoid activation. Training is done one sample at
    a time: each call to ``train`` runs a forward pass, back-propagates the
    output error through the hidden-to-output weights and adjusts both
    weight matrices in place.
    """

    def __init__(self, inputnodes, hiddennodes, outputnodes, learningrate):
        """Create a network with randomly initialised link weights.

        Args:
            inputnodes: number of nodes in the input layer.
            hiddennodes: number of nodes in the hidden layer.
            outputnodes: number of nodes in the output layer.
            learningrate: factor applied to every weight update.
        """
        # number of nodes in each of the input, hidden and output layers
        self.inodes = inputnodes
        self.hnodes = hiddennodes
        self.onodes = outputnodes

        # Link weight matrices: wih has shape (hnodes, inodes) and who has
        # shape (onodes, hnodes), so numpy.dot(weights, column_vector)
        # yields the signals arriving at the next layer.
        # NOTE(review): the standard deviation is derived from the size of
        # the receiving layer (hnodes / onodes); confirm this is the
        # intended initialisation rule.
        self.wih = numpy.random.normal(
            0.0, pow(self.hnodes, -0.5), (self.hnodes, self.inodes))
        self.who = numpy.random.normal(
            0.0, pow(self.onodes, -0.5), (self.onodes, self.hnodes))

        # learning rate
        self.lr = learningrate

        # activation function is the sigmoid function
        self.activation_function = scipy.special.expit

    def _forward(self, inputs_list):
        """Run one forward pass; return (inputs, hidden_outputs, final_outputs).

        All three return values are 2-D column arrays. ``inputs`` is the
        column-vector form of ``inputs_list``.
        """
        # convert the input list to a 2-D column vector
        inputs = numpy.array(inputs_list, ndmin=2).T
        # signals into, then emerging from, the hidden layer
        hidden_outputs = self.activation_function(
            numpy.dot(self.wih, inputs))
        # signals into, then emerging from, the final output layer
        final_outputs = self.activation_function(
            numpy.dot(self.who, hidden_outputs))
        return inputs, hidden_outputs, final_outputs

    def train(self, inputs_list, targets_list):
        """Update the weights in place from a single training example.

        Args:
            inputs_list: input values, one per input node.
            targets_list: desired output values, one per output node.
        """
        inputs, hidden_outputs, final_outputs = self._forward(inputs_list)
        targets = numpy.array(targets_list, ndmin=2).T

        # error is (target - actual)
        output_errors = targets - final_outputs
        # Hidden layer error is output_errors split by the weights and
        # recombined at the hidden nodes. This must use the weights from
        # BEFORE the update below.
        hidden_errors = numpy.dot(self.who.T, output_errors)

        # update the weights for the links between hidden and output layers
        self.who += self.lr * numpy.dot(
            output_errors * final_outputs * (1.0 - final_outputs),
            hidden_outputs.T)
        # update the weights for the links between input and hidden layers
        self.wih += self.lr * numpy.dot(
            hidden_errors * hidden_outputs * (1.0 - hidden_outputs),
            inputs.T)

    def query(self, inputs_list):
        """Return the output-layer signals for ``inputs_list``.

        The result is a 2-D column array with one row per output node.
        """
        _, _, final_outputs = self._forward(inputs_list)
        return final_outputs
if __name__ == '__main__':
    # Train the network on the small MNIST CSV subset, then score it on the
    # test subset. Each CSV record is "<label>,<pixel>,<pixel>,...".
    input_nodes = 784
    hidden_nodes = 100
    output_nodes = 10
    learningrate = 0.3
    nn = NeuralNetwork(input_nodes, hidden_nodes, output_nodes, learningrate)

    # read the training dataset
    with open("mnist_dataset/mnist_train_100.csv", 'r') as training_data_file:
        training_data_list = training_data_file.readlines()

    # go through all records in the training data set
    for record in training_data_list:
        if not record.strip():
            # a blank line (e.g. at end of file) carries no label or pixels
            continue
        # split the record at the ',' commas
        all_values = record.split(',')
        # scale and shift the pixel values from 0..255 into 0.01..1.0
        inputs = (numpy.asarray(all_values[1:], dtype=float)
                  / 255.0 * 0.99) + 0.01
        # create the target output values (all 0.01, except the desired
        # label which is 0.99)
        targets = numpy.zeros(output_nodes) + 0.01
        # all_values[0] is the target label for this record
        targets[int(all_values[0])] = 0.99
        nn.train(inputs, targets)

    # load the mnist test data csv file into a list
    with open("mnist_dataset/mnist_test_10.csv", 'r') as test_data_file:
        test_data_list = test_data_file.readlines()

    # scorecard holds 1 for every correct answer and 0 for every wrong one
    scorecard = []
    for record in test_data_list:
        if not record.strip():
            continue
        all_values = record.split(',')
        correct_label = int(all_values[0])
        print(correct_label, "correct_lable")
        inputs = (numpy.asarray(all_values[1:], dtype=float)
                  / 255.0 * 0.99) + 0.01
        outputs = nn.query(inputs)
        # the index of the highest output value is the network's answer
        label = numpy.argmax(outputs)
        print(label, "network answer")
        scorecard.append(1 if label == correct_label else 0)

    print(scorecard)
    # calculate the performance score: the fraction of correct answers
    scorecard_array = numpy.asarray(scorecard)
    print("performance = ", float(scorecard_array.sum())/scorecard_array.size)

    # Optional: show the last test record as a 28x28 greyscale image.
    # image_array = numpy.asarray(all_values[1:], dtype=float).reshape((28, 28))
    # plt.imshow(image_array, cmap='Greys', interpolation='None')
    # plt.show()
说明:
1、代码逻辑很简单,需要详细的解读请参考书
2、在开发过程中,涉及通过 import 引入的第三方包的使用,如果出现错误,请先在 Python 交互环境下验证,验证正确后再写到程序中
3、比如这一块:# plt.imshow(image_array,cmap='Greys',interpolation='None'),还需要调用 # plt.show() 才能把图像绘制出来