手寫神經網絡Python深度學習

import numpy
import scipy.special
import matplotlib.pyplot as plt
import scipy.misc
import glob
import imageio
import scipy.ndimage

class neuralNetWork:
  def __init__(self,inputnodes,hiddennodes,outputnodes,learningrate):
    self.inodes = inputnodes
    self.hnodes = hiddennodes
    self.onodes = outputnodes

    self.wih = numpy.random.normal(0.0,pow(self.inodes, -0.5),(self.hnodes,self.inodes))
    self.who = numpy.random.normal(0.0,pow(self.hnodes, -0.5),(self.onodes,self.hnodes))
    
    self.lr = learningrate

    self.activation_function = lambda x: scipy.special.expit(x) # 激活函數
    self.inverse_activation_function = lambda x: scipy.special.logit(x) # 反向查詢log激活函數

  def train(self,inputs_list,targets_list):
    inputs = numpy.array(inputs_list,ndmin=2).T
    targets = numpy.array(targets_list,ndmin=2).T

    hidden_inputs = numpy.dot(self.wih,inputs)
    hidden_outputs = self.activation_function(hidden_inputs)

    final_inputs = numpy.dot(self.who,hidden_outputs)
    final_outputs = self.activation_function(final_inputs)

    output_errors = targets - final_outputs
    hidden_errors = numpy.dot(self.who.T,output_errors)

    self.who += self.lr * numpy.dot((output_errors * final_outputs * (1.0 - final_outputs)),numpy.transpose(hidden_outputs))
    self.wih += self.lr * numpy.dot((hidden_errors * hidden_outputs * (1.0 - hidden_outputs)),numpy.transpose(inputs))

  def query(self,inputs_list):
    inputs = numpy.array(inputs_list,ndmin=2).T

    hidden_inputs = numpy.dot(self.wih,inputs)
    hidden_outputs = self.activation_function(hidden_inputs)
    final_inputs = numpy.dot(self.who,hidden_outputs)
    final_outputs = self.activation_function(final_inputs)

    return final_outputs
  def backquery(self, targets_list):
    final_outputs = numpy.array(targets_list, ndmin=2).T
  
    final_inputs = self.inverse_activation_function(final_outputs)
    hidden_outputs = numpy.dot(self.who.T, final_inputs)
    
    hidden_outputs -= numpy.min(hidden_outputs)
    hidden_outputs /= numpy.max(hidden_outputs)
    hidden_outputs *= 0.98
    hidden_outputs += 0.01

    hidden_inputs = self.inverse_activation_function(hidden_outputs)
    inputs = numpy.dot(self.wih.T, hidden_inputs)
    inputs -= numpy.min(inputs)
    inputs /= numpy.max(inputs)
    inputs *= 0.98
    inputs += 0.01
    
    return inputs
  

input_nodes = 784
hidden_nodes = 200
output_nodes = 10
learing_rate = 0.1
n = neuralNetWork(input_nodes,hidden_nodes,output_nodes,learing_rate)

train_data_file = open('mnist_train.csv', 'r')
train_data_list = train_data_file.readlines()
train_data_file.close()

epochs = 5
for e in range(epochs):
  for record in train_data_list:
    all_values = record.split(',')
    #image_array = numpy.asfarray(all_values[1:]).reshape((28,28))
    #plt.imshow(image_array,cmap='Greys',interpolation='None')
    #plt.show()
    inputs = (numpy.asfarray(all_values[1:])/255.0 *0.99)+0.01
    targets = numpy.zeros(output_nodes) + 0.01
    targets[int(all_values[0])] = 0.99
    n.train(inputs,targets)

    #手寫字體傾斜10度做爲測試數據
    inputs_plusx_img = scipy.ndimage.interpolation.rotate(inputs.reshape(28,28), 10, cval=0.01, order=1, reshape=False)
    n.train(inputs_plusx_img.reshape(784), targets)
    inputs_minusx_img = scipy.ndimage.interpolation.rotate(inputs.reshape(28,28), -10, cval=0.01, order=1, reshape=False)
    n.train(inputs_minusx_img.reshape(784), targets)


test_data_file = open('mnist_test.csv', 'r')
test_data_list = test_data_file.readlines()
test_data_file.close()
# all_values = test_data_list[0].split(',')

# # image_array = numpy.asfarray(all_values[1:]).reshape((28,28))
# # plt.imshow(image_array,cmap='Greys',interpolation='None')
# # plt.show()

# output = n.query((numpy.asfarray(all_values[1:])/ 255.0 * 0.99)+0.01)


scorecard = []
for record in test_data_list:
  all_values = record.split(',')
  correct_label = int(all_values[0])
  #print(correct_label,'correct_label')
  inputs = (numpy.asfarray(all_values[1:])/255.0 *0.99)+0.01
  outputs = n.query(inputs)
  label = numpy.argmax(outputs)
  #print(label,'network answer')
  if (label == correct_label):
    scorecard.append(1)
  else:
    scorecard.append(0)
scorecard_array = numpy.asarray(scorecard)
print("performance = ",scorecard_array.sum() / scorecard_array.size)

# 識別本身手寫字
our_own_dataset = []

for image_file_name in glob.glob('2828_my_own_?.png'):
  label = int(image_file_name[-5:-4])
  
  print ("loading ... ", image_file_name)
  img_array = imageio.imread(image_file_name, as_gray=True)
  img_data  = 255.0 - img_array.reshape(784)
  
  img_data = (img_data / 255.0 * 0.99) + 0.01
  print(numpy.min(img_data))
  print(numpy.max(img_data))
  
  record = numpy.append(label,img_data)
  our_own_dataset.append(record)

item = 2
plt.imshow(our_own_dataset[item][1:].reshape(28,28), cmap='Greys', interpolation='None')
correct_label = our_own_dataset[item][0]
inputs = our_own_dataset[item][1:]

outputs = n.query(inputs)
print (outputs)

label = numpy.argmax(outputs)
print("network says ", label)
if (label == correct_label):
    print ("match!")
else:
    print ("no match!")

# 反向生成圖像
label = 0
targets = numpy.zeros(output_nodes) + 0.01
targets[label] = 0.99
print(targets)

image_data = n.backquery(targets)

plt.imshow(image_data.reshape(28,28), cmap='Greys', interpolation='None')
相關文章
相關標籤/搜索