-
Notifications
You must be signed in to change notification settings - Fork 551
/
Copy pathmnist_ann.py
101 lines (86 loc) · 3.3 KB
/
mnist_ann.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
# -*- coding: utf-8 -*-
"""MNIST_ANN.ipynb
Automatically generated by Colaboratory.
Original file is located at
https://colab.research.google.com/drive/1IYoctAFrXbyWW_H6FZ2W2QD8heZnMvi-
"""
# Description: This program classifies the MNIST handwritten digit images
# as a number 0 - 9
# Install packages
pip install tensorflow keras numpy mnist matplotlib
#import the packages / dependecies
import numpy as np
import mnist # Get data set from
from keras.models import Sequential #ANN architecture
from keras. layers import Dense # The layers in the ANN
from keras.utils import to_categorical
import matplotlib.pyplot as plt # Graph
#Load the data set
train_images = mnist.train_images() # training data of images
train_labels = mnist.train_labels() # training data of the labels
test_images = mnist. test_images() # testing data images
test_labels = mnist.test_labels() # testing data labels
#Normalize the images
#Normalize the pixel values from [0, 255] to [-0.5 to 0.5]
#This make the network easier to train
train_images = (train_images / 255) - 0.5
test_images = (test_images/ 255) - 0.5
#Flatten the images. Flatten each 28 x 28 image into a 784= 28^2
#dimensional vector and pass into the neural network
train_images = train_images.reshape((-1, 784))
test_images = test_images.reshape((-1,784))
#print the new image shape
print(train_images.shape) #60,000 rows and 784 cols
print(test_images.shape) #10,000 rows and 784 cols
#Build the ANN model
#With 3 layers, 2 with 64 neurons and activation function = relu
# and 1 layer with 10 neurons with activation function= softmax
model = Sequential()
model.add(Dense(64, activation='relu', input_dim=784))
model.add(Dense(64, activation='relu'))
model.add(Dense(10, activation='softmax'))
#Compile the model
# loss measures how well the model did on training, and then tries to improve on
# it using the optimizer
model.compile(
optimizer= 'adam',
loss = 'categorical_crossentropy', #loss function for classes > 2
metrics = ['accuracy']
)
#Train the model
model.fit(
train_images, #The training data images
to_categorical(train_labels),#The trainind data labels, label data only returns a single digit representing the class of each label Ex: train_labels = 2,to_categorical(2)= [0,0,1,0,0,0,0,0,0,0]
epochs=5, #Number of iterations over the entire data set to train on
batch_size = 3 #The number of samples per gradient update for training
)
#Evaluate the model
model.evaluate(
test_images,
to_categorical(test_labels)
)
#save the model to disk
model.save_weights('model.h5')
# Load the model from disk later using:
# Build the model.
#model = Sequential([
# Dense(64, activation='relu', input_shape=(784,)),
# Dense(64, activation='relu'),
# Dense(10, activation='softmax'),
#])
# model.load_weights('model.h5')
#Make predictions
# Predict on the first 5 test images.
# Keep in mind that the output of our network is 10 probabilities,
# so we'll use np.argmax()to turn those into actual digits
predictions = model.predict(test_images[:5])
#print(predictions)
print (np.argmax(predictions, axis =1))
print(test_labels[:5])
import matplotlib.pyplot as plt
for i in range(0,5):
first_image = test_images[i]
first_image = np.array(first_image, dtype='float')
pixels = first_image.reshape((28, 28))
plt.imshow(pixels, cmap='gray')
plt.show()