import numpy as np # mathematical and scientific functions
import matplotlib.pyplot as plt # visualization

# format matplotlib options
# IPython magic (valid only inside Jupyter/IPython): draw figures inline below the cell
%matplotlib inline
# use a 20 pt default font size for the text in all following figures
plt.rcParams.update({'font.size': 20})

import keras.backend # information on the backend that keras is using
from keras.utils import np_utils # functions to wrangle label vectors
from keras.models import Sequential # the basic deep learning model
from keras.layers import Dense, Flatten, Convolution2D, MaxPooling2D # important CNN layers
from keras.models import load_model # to load a pre-saved model (may require hdf libraries installed)

from keras.datasets import mnist # the MNIST dataset
from keras.datasets import fashion_mnist # the Fashion-MNIST dataset

Using TensorFlow backend.


# report the name of the numerical backend keras is running on
backend_name = keras.backend.backend()
print(backend_name)

tensorflow


# load MNIST (downloaded on first use) and unpack the two (images, labels) pairs
train_split, test_split = mnist.load_data()
X_train, y_train = train_split
X_test, y_test = test_split

Downloading data from https://s3.amazonaws.com/img-datasets/mnist.npz
11493376/11490434 [==============================] - 6s 0us/step


# report the shapes of the training and test image arrays
shape_report = (
    ('The dimensions of X_train are:', X_train.shape),
    ('The dimensions of X_test are:', X_test.shape),
)
for heading, shape in shape_report:
    print(heading, shape, sep='\n')

The dimensions of X_train are:
(60000, 28, 28)
The dimensions of X_test are:
(10000, 28, 28)


# report the element type of the training and test image arrays
dtype_report = (
    ('The variable type of X_train is:', X_train.dtype),
    ('The variable type of X_test is:', X_test.dtype),
)
for heading, dtype in dtype_report:
    print(heading, dtype, sep='\n')

The variable type of X_train is:
uint8
The variable type of X_test is:
uint8


# display the first training image in grayscale
first_image = X_train[0]
plt.figure()
plt.imshow(first_image, cmap='gray')
plt.show()


# show the first ten training images side by side in a single row
plt.figure(figsize=(20, 20))
for position, image in enumerate(X_train[:10], start=1):
    plt.subplot(1, 10, position)  # subplot indices are 1-based
    plt.imshow(image, cmap='gray')
    plt.axis('off')
plt.show()


# label stored for the first training image
first_label = y_train[0]
print(first_label)

5


# show the first ten training images in one row, each titled with its label
plt.figure(figsize=(20, 20))
first_ten = zip(X_train[:10], y_train[:10])
for position, (image, label) in enumerate(first_ten, start=1):
    plt.subplot(1, 10, position)  # subplot indices are 1-based
    plt.imshow(image, cmap='gray')
    plt.title(label)
    plt.axis('off')
plt.show()


# show a 10x10 grid of training images: row d holds example images of digit d
plt.figure(figsize=(20,20))
for d in range(0,10): # loop over the digits 0 through 9
    digit_indices = np.where(y_train==d)[0] # positions of every image labeled d, computed once per digit
    for k, index in enumerate(digit_indices[:10]): # choose (up to) 10 example images for each digit
        plt.subplot(10,10,d*10+k+1) # select the current subplot
        plt.imshow(X_train[index,:,:],cmap='gray') # plot the image
        plt.axis('off')
plt.show() # render the figure explicitly, as the other plotting cells do


# give every 28x28 image an explicit trailing channel axis of length 1
X_train = np.reshape(X_train, (len(X_train), 28, 28, 1))
X_test = np.reshape(X_test, (len(X_test), 28, 28, 1))


# report the image array shapes again after adding the channel axis
shape_report = (
    ('The dimensions of X_train are:', X_train.shape),
    ('The dimensions of X_test are:', X_test.shape),
)
for heading, shape in shape_report:
    print(heading, shape, sep='\n')

The dimensions of X_train are:
(60000, 28, 28, 1)
The dimensions of X_test are:
(10000, 28, 28, 1)


# plot the first ten training images exactly as stored, i.e. each image is
# handed to imshow with its trailing channel axis still attached
plt.figure(figsize=(20, 20))
for position, image in enumerate(X_train[:10], start=1):
    plt.subplot(1, 10, position)
    plt.imshow(image, cmap='gray')
    plt.axis('off')
plt.show()


# plot the first ten training images after dropping their length-1 axes,
# so that imshow receives a plain 2-D array
plt.figure(figsize=(20, 20))
for position, image in enumerate(X_train[:10], start=1):
    plt.subplot(1, 10, position)
    plt.imshow(np.squeeze(image), cmap='gray')
    plt.axis('off')
plt.show()


# report the smallest and largest intensity in each image array
train_low, train_high = X_train.min(), X_train.max()
test_low, test_high = X_test.min(), X_test.max()
print('The range of X_train is ['+str(train_low)+','+str(train_high)+']')
print('The range of X_test is ['+str(test_low)+','+str(test_high)+']')

The range of X_train is [0,255]
The range of X_test is [0,255]


# convert the images to float32 and divide by 255 (the maximum raw intensity)
X_train = X_train.astype('float32') / 255
X_test = X_test.astype('float32') / 255


# report the intensity range again after rescaling
train_low, train_high = X_train.min(), X_train.max()
test_low, test_high = X_test.min(), X_test.max()
print('The range of X_train is ['+str(train_low)+','+str(train_high)+']')
print('The range of X_test is ['+str(test_low)+','+str(test_high)+']')

The range of X_train is [0.0,1.0]
The range of X_test is [0.0,1.0]


# report the shapes of the training and test label vectors
shape_report = (
    ('The dimensions of y_train are:', y_train.shape),
    ('The dimensions of y_test are:', y_test.shape),
)
for heading, shape in shape_report:
    print(heading, shape, sep='\n')

The dimensions of y_train are:
(60000,)
The dimensions of y_test are:
(10000,)


# show the labels of the first ten training images
first_ten_labels = y_train[:10]
print('The first ten entries of y_train are:', first_ten_labels, sep='\n')

The first ten entries of y_train are:
[5 0 4 1 9 2 1 3 1 4]


# one-hot encode the integer labels into 10 columns (one per digit class)
Y_train, Y_test = (
    np_utils.to_categorical(labels, 10) for labels in (y_train, y_test)
)


# report the shapes of the one-hot label matrices
shape_report = (
    ('The dimensions of Y_train are:', Y_train.shape),
    ('The dimensions of Y_test are:', Y_test.shape),
)
for heading, shape in shape_report:
    print(heading, shape, sep='\n')

The dimensions of Y_train are:
(60000, 10)
The dimensions of Y_test are:
(10000, 10)


# compare the original integer labels with their one-hot encoded rows
print('The first ten entries of y_train (original label vector) are:')
print(y_train[0:10])
# the full one-hot rows are printed here (no argmax is taken), so the message says so
print('The first ten entries of Y_train (one-hot label vector) are:')
print(Y_train[0:10,:])

The first ten entries of y_train (original label vector) are:
[5 0 4 1 9 2 1 3 1 4]
The argmax of the first ten entries of Y_train (one-hot label vector) are:
[[0. 0. 0. 0. 0. 1. 0. 0. 0. 0.]
 [1. 0. 0. 0. 0. 0. 0. 0. 0. 0.]
 [0. 0. 0. 0. 1. 0. 0. 0. 0. 0.]
 [0. 1. 0. 0. 0. 0. 0. 0. 0. 0.]
 [0. 0. 0. 0. 0. 0. 0. 0. 0. 1.]
 [0. 0. 1. 0. 0. 0. 0. 0. 0. 0.]
 [0. 1. 0. 0. 0. 0. 0. 0. 0. 0.]
 [0. 0. 0. 1. 0. 0. 0. 0. 0. 0.]
 [0. 1. 0. 0. 0. 0. 0. 0. 0. 0.]
 [0. 0. 0. 0. 1. 0. 0. 0. 0. 0.]]


# recover integer labels from the one-hot rows and compare them with the originals
print('The first ten entries of y_train (original label vector) are:')
print(y_train[0:10])
# the column index of the largest entry in each one-hot row is printed, so the message says "argmax"
print('The argmax of the first ten entries of Y_train (one-hot label vector) are:')
print(np.argmax(Y_train[0:10,:],axis=1))

The first ten entries of y_train (original label vector) are:
[5 0 4 1 9 2 1 3 1 4]
The first ten entries of Y_train (one-hot label vector) are:
[5 0 4 1 9 2 1 3 1 4]


# model1: two 3x3 convolutions (32 filters each) -> 2x2 max pooling -> flatten
# -> 128-unit dense layer -> 10-unit softmax output (one unit per digit class)
model1 = Sequential([
    Convolution2D(32, (3, 3), activation='relu', input_shape=(28, 28, 1), data_format='channels_last'),
    Convolution2D(32, (3, 3), activation='relu', data_format='channels_last'),
    MaxPooling2D(pool_size=(2, 2), data_format='channels_last'),
    Flatten(),
    Dense(128, activation='relu'),
    Dense(10, activation='softmax'),
])


# configure training: categorical cross-entropy against the one-hot labels,
# the Adam optimizer, and accuracy as the reported metric
model1.compile(
    loss='categorical_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
)


# train for one epoch in mini-batches of 64 images, with a progress bar
model1.fit(x=X_train, y=Y_train, batch_size=64, epochs=1, verbose=1)

Epoch 1/1
60000/60000 [==============================] - 145s 2ms/step - loss: 0.1403 - accuracy: 0.9602

<keras.callbacks.callbacks.History at 0x16b6e9170c8>


# model2: same layer stack, compile settings and training call as model1,
# built as a separate model
model2_layers = [
    Convolution2D(32, (3, 3), activation='relu', input_shape=(28, 28, 1), data_format='channels_last'),
    Convolution2D(32, (3, 3), activation='relu', data_format='channels_last'),
    MaxPooling2D(pool_size=(2, 2), data_format='channels_last'),
    Flatten(),
    Dense(128, activation='relu'),
    Dense(10, activation='softmax'),
]
model2 = Sequential(model2_layers)

model2.compile(
    loss='categorical_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
)

model2.fit(x=X_train, y=Y_train, batch_size=64, epochs=1, verbose=1)

Epoch 1/1
60000/60000 [==============================] - 103s 2ms/step - loss: 0.1444 - accuracy: 0.9560

<keras.callbacks.callbacks.History at 0x16b6f514748>


model2 = Sequential() # NOTE(review): this cell looks like a deliberate error demonstration (section 3.5.1) - confirm before "fixing" it
model2.add(Convolution2D(32, (3, 3), activation='relu', input_shape=(28,28,1), data_format='channels_first')) # 'channels_first' does not match the data, which was reshaped with the channel axis last (28,28,1)
model2.add(Convolution2D(32, (3, 3), activation='relu', data_format='channels_first'))
model2.add(MaxPooling2D(pool_size=(2,2),data_format='channels_first'))
model2.add(Flatten())
model2.add(Dense(128, activation='relu'))
model2.add(Dense(10, activation='softmax'))

model2.compile(loss='categorical_crossentropy', optimizer='adam',metrics=['accuracy'])

model2.fit(X_train, Y_train, batch_size=64, epochs=1, verbose=1) # not reached in the recorded run: the first add() call above already raised

---------------------------------------------------------------------------
AttributeError                            Traceback (most recent call last)
<ipython-input-28-4b1bdaf93886> in <module>
      1 model2 = Sequential()
----> 2 model2.add(Convolution2D(32, (3, 3), activation='relu', input_shape=(28,28,1), data_format='channels_first'))
      3 model2.add(Convolution2D(32, (3, 3), activation='relu', data_format='channels_first'))
      4 model2.add(MaxPooling2D(pool_size=(2,2),data_format='channels_first'))
      5 model2.add(Flatten())

~\anaconda3\envs\aiworkshop1\lib\site-packages\keras\engine\sequential.py in add(self, layer)
    164                     # and create the node connecting the current layer
    165                     # to the input layer we just created.
--> 166                     layer(x)
    167                     set_inputs = True
    168             else:

~\anaconda3\envs\aiworkshop1\lib\site-packages\keras\backend\tensorflow_backend.py in symbolic_fn_wrapper(*args, **kwargs)
     73         if _SYMBOLIC_SCOPE.value:
     74             with get_graph().as_default():
---> 75                 return func(*args, **kwargs)
     76         else:
     77             return func(*args, **kwargs)

~\anaconda3\envs\aiworkshop1\lib\site-packages\keras\engine\base_layer.py in __call__(self, inputs, **kwargs)
    487             # Actually call the layer,
    488             # collecting output(s), mask(s), and shape(s).
--> 489             output = self.call(inputs, **kwargs)
    490             output_mask = self.compute_mask(inputs, previous_mask)
    491 

~\anaconda3\envs\aiworkshop1\lib\site-packages\keras\layers\convolutional.py in call(self, inputs)
    169                 padding=self.padding,
    170                 data_format=self.data_format,
--> 171                 dilation_rate=self.dilation_rate)
    172         if self.rank == 3:
    173             outputs = K.conv3d(

~\anaconda3\envs\aiworkshop1\lib\site-packages\keras\backend\tensorflow_backend.py in conv2d(x, kernel, strides, padding, data_format, dilation_rate)
   3699     data_format = normalize_data_format(data_format)
   3700 
-> 3701     x, tf_data_format = _preprocess_conv2d_input(x, data_format)
   3702 
   3703     padding = _preprocess_padding(padding)

~\anaconda3\envs\aiworkshop1\lib\site-packages\keras\backend\tensorflow_backend.py in _preprocess_conv2d_input(x, data_format, force_transpose)
   3572     tf_data_format = 'NHWC'
   3573     if data_format == 'channels_first':
-> 3574         if not _has_nchw_support() or force_transpose:
   3575             x = tf.transpose(x, (0, 2, 3, 1))  # NCHW -> NHWC
   3576         else:

~\anaconda3\envs\aiworkshop1\lib\site-packages\keras\backend\tensorflow_backend.py in _has_nchw_support()
    520     """
    521     explicitly_on_cpu = _is_current_explicit_device('cpu')
--> 522     gpus_available = len(_get_available_gpus()) > 0
    523     return (not explicitly_on_cpu and gpus_available)
    524 

~\anaconda3\envs\aiworkshop1\lib\site-packages\keras\backend\tensorflow_backend.py in _get_available_gpus()
    504             _LOCAL_DEVICES = [x.name for x in devices]
    505         else:
--> 506             _LOCAL_DEVICES = tf.config.experimental_list_devices()
    507     return [x for x in _LOCAL_DEVICES if 'device:gpu' in x.lower()]
    508 

AttributeError: module 'tensorflow_core._api.v2.config' has no attribute 'experimental_list_devices'


model2 = Sequential() # NOTE(review): this cell looks like a deliberate error demonstration (section 3.5.1) - confirm before "fixing" it
model2.add(Convolution2D(32, (3, 3), activation='relu', input_shape=(28,28,1), data_format='channels_last'))
model2.add(Convolution2D(32, (3, 3), activation='relu', data_format='channels_last'))
model2.add(MaxPooling2D(pool_size=(2,2),data_format='channels_last'))
#model2.add(Flatten()) # Flatten is left out here, so the Dense layers below receive the un-flattened pooling output
model2.add(Dense(128, activation='relu'))
model2.add(Dense(10, activation='softmax'))

model2.compile(loss='categorical_crossentropy', optimizer='adam',metrics=['accuracy'])

model2.fit(X_train, Y_train, batch_size=64, epochs=1, verbose=1) # recorded run fails here: the output layer expects 4-dimensional targets, but Y_train is (60000, 10)

---------------------------------------------------------------------------
ValueError                                Traceback (most recent call last)
<ipython-input-29-b42bce916ce9> in <module>
      9 model2.compile(loss='categorical_crossentropy', optimizer='adam',metrics=['accuracy'])
     10 
---> 11 model2.fit(X_train, Y_train, batch_size=64, epochs=1, verbose=1)

~\anaconda3\envs\aiworkshop1\lib\site-packages\keras\engine\training.py in fit(self, x, y, batch_size, epochs, verbose, callbacks, validation_split, validation_data, shuffle, class_weight, sample_weight, initial_epoch, steps_per_epoch, validation_steps, validation_freq, max_queue_size, workers, use_multiprocessing, **kwargs)
   1152             sample_weight=sample_weight,
   1153             class_weight=class_weight,
-> 1154             batch_size=batch_size)
   1155 
   1156         # Prepare validation data.

~\anaconda3\envs\aiworkshop1\lib\site-packages\keras\engine\training.py in _standardize_user_data(self, x, y, sample_weight, class_weight, check_array_lengths, batch_size)
    619                 feed_output_shapes,
    620                 check_batch_axis=False,  # Don't enforce the batch size.
--> 621                 exception_prefix='target')
    622 
    623             # Generate sample-wise weight values given the `sample_weight` and

~\anaconda3\envs\aiworkshop1\lib\site-packages\keras\engine\training_utils.py in standardize_input_data(data, names, shapes, check_batch_axis, exception_prefix)
    133                         ': expected ' + names[i] + ' to have ' +
    134                         str(len(shape)) + ' dimensions, but got array '
--> 135                         'with shape ' + str(data_shape))
    136                 if not check_batch_axis:
    137                     data_shape = data_shape[1:]

ValueError: Error when checking target: expected dense_6 to have 4 dimensions, but got array with shape (60000, 10)


model2 = Sequential() # NOTE(review): this cell looks like a deliberate error demonstration (section 3.5.1) - confirm before "fixing" it
model2.add(Convolution2D(32, (3, 3), activation='relu', input_shape=(28,28,1), data_format='channels_last'))
model2.add(Convolution2D(32, (3, 3), activation='relu', data_format='channels_last'))
model2.add(MaxPooling2D(pool_size=(2,2),data_format='channels_last'))
model2.add(Flatten())
model2.add(Dense(128, activation='relu'))
model2.add(Dense(128, activation='softmax')) # output layer has 128 units, but the one-hot labels in Y_train have only 10 columns

model2.compile(loss='categorical_crossentropy', optimizer='adam',metrics=['accuracy'])

model2.fit(X_train, Y_train, batch_size=64, epochs=1, verbose=1) # recorded run fails here: target shape (10,) does not match the expected (128,)

---------------------------------------------------------------------------
ValueError                                Traceback (most recent call last)
<ipython-input-30-2e1393361a52> in <module>
      9 model2.compile(loss='categorical_crossentropy', optimizer='adam',metrics=['accuracy'])
     10 
---> 11 model2.fit(X_train, Y_train, batch_size=64, epochs=1, verbose=1)

~\anaconda3\envs\aiworkshop1\lib\site-packages\keras\engine\training.py in fit(self, x, y, batch_size, epochs, verbose, callbacks, validation_split, validation_data, shuffle, class_weight, sample_weight, initial_epoch, steps_per_epoch, validation_steps, validation_freq, max_queue_size, workers, use_multiprocessing, **kwargs)
   1152             sample_weight=sample_weight,
   1153             class_weight=class_weight,
-> 1154             batch_size=batch_size)
   1155 
   1156         # Prepare validation data.

~\anaconda3\envs\aiworkshop1\lib\site-packages\keras\engine\training.py in _standardize_user_data(self, x, y, sample_weight, class_weight, check_array_lengths, batch_size)
    619                 feed_output_shapes,
    620                 check_batch_axis=False,  # Don't enforce the batch size.
--> 621                 exception_prefix='target')
    622 
    623             # Generate sample-wise weight values given the `sample_weight` and

~\anaconda3\envs\aiworkshop1\lib\site-packages\keras\engine\training_utils.py in standardize_input_data(data, names, shapes, check_batch_axis, exception_prefix)
    143                             ': expected ' + names[i] + ' to have shape ' +
    144                             str(shape) + ' but got array with shape ' +
--> 145                             str(data_shape))
    146     return data
    147 

ValueError: Error when checking target: expected dense_8 to have shape (128,) but got array with shape (10,)


# model3: same stack as model1 except that the output layer uses 'tanh'
# instead of 'softmax'.
# NOTE(review): this looks like the tutorial's deliberate "silent error"
# example (section 3.5.2) - confirm before changing the activation.
model3 = Sequential([
    Convolution2D(32, (3, 3), activation='relu', input_shape=(28, 28, 1), data_format='channels_last'),
    Convolution2D(32, (3, 3), activation='relu', data_format='channels_last'),
    MaxPooling2D(pool_size=(2, 2), data_format='channels_last'),
    Flatten(),
    Dense(128, activation='relu'),
    Dense(10, activation='tanh'),
])

model3.compile(
    loss='categorical_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
)

model3.fit(x=X_train, y=Y_train, batch_size=64, epochs=1, verbose=1)

Epoch 1/1
60000/60000 [==============================] - 110s 2ms/step - loss: 8.0835 - accuracy: 0.1009

<keras.callbacks.callbacks.History at 0x16b71d1de88>


# model4: same stack as model1, but compiled with 'binary_crossentropy'
# instead of 'categorical_crossentropy'.
# NOTE(review): this looks like the tutorial's deliberate "silent error"
# example (section 3.5.2) - confirm before changing the loss.
model4 = Sequential([
    Convolution2D(32, (3, 3), activation='relu', input_shape=(28, 28, 1), data_format='channels_last'),
    Convolution2D(32, (3, 3), activation='relu', data_format='channels_last'),
    MaxPooling2D(pool_size=(2, 2), data_format='channels_last'),
    Flatten(),
    Dense(128, activation='relu'),
    Dense(10, activation='softmax'),
])

model4.compile(
    loss='binary_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
)

model4.fit(x=X_train, y=Y_train, batch_size=64, epochs=1, verbose=1)

Epoch 1/1
60000/60000 [==============================] - 108s 2ms/step - loss: 0.0251 - accuracy: 0.9915

<keras.callbacks.callbacks.History at 0x16b71e73dc8>


# evaluate model1 on the held-out MNIST test images and print the result
score = model1.evaluate(x=X_test, y=Y_test, verbose=1)
print(score)

10000/10000 [==============================] - 7s 682us/step
[0.04841461051488295, 0.9836999773979187]


# names of the values returned by model1.evaluate, in order
metric_labels = model1.metrics_names
print(metric_labels)

['loss', 'accuracy']


# run model1 on every test image; each output row holds one value per class
Y_predict = model1.predict(x=X_test, verbose=1)

10000/10000 [==============================] - 7s 681us/step


# shape of the prediction matrix
prediction_shape = Y_predict.shape
print(prediction_shape)

(10000, 10)


# raw network outputs for the first ten test images
first_ten_outputs = Y_predict[:10]
print(first_ten_outputs)

[[4.05177758e-08 7.43065387e-09 2.37806557e-06 2.58250338e-06
  1.32016120e-10 6.64513600e-09 6.50171193e-12 9.99993682e-01
  6.94475716e-07 5.78243203e-07]
 [1.32357775e-06 8.71970027e-04 9.99126256e-01 5.49216530e-08
  6.64163308e-11 3.73077036e-09 1.32753513e-07 2.21830199e-09
  3.57962051e-07 1.14670252e-10]
 [1.79842009e-05 9.98999059e-01 5.65366936e-05 1.32168325e-05
  6.44273678e-05 1.28859028e-05 1.01682672e-05 7.75526569e-04
  4.35361144e-05 6.71234602e-06]
 [9.99958873e-01 3.54211949e-08 9.94088714e-06 8.73126549e-09
  3.90109278e-07 3.95757098e-07 2.31599006e-05 6.50946845e-07
  5.35008394e-06 1.46342552e-06]
 [5.83880501e-06 6.28110342e-07 5.05188427e-06 3.39747743e-07
  9.99858856e-01 8.84693065e-08 2.88095930e-06 1.05900563e-05
  5.37548749e-06 1.10328197e-04]
 [7.17639432e-06 9.98586416e-01 9.56198073e-06 1.58115131e-06
  4.67288082e-05 1.08867607e-06 1.44783314e-06 1.32461940e-03
  1.69964169e-05 4.56649468e-06]
 [1.40812929e-07 8.77150342e-06 2.12768646e-05 1.91419222e-05
  3.51276517e-01 7.10015942e-04 1.34696995e-06 9.68216409e-05
  4.54874605e-01 1.92991406e-01]
 [4.10326662e-09 3.42933930e-07 9.80323193e-07 1.17285090e-05
  2.24219402e-04 1.33342022e-04 3.50651312e-08 8.88734803e-07
  6.77975011e-04 9.98950481e-01]
 [1.26563573e-05 2.65104583e-09 5.87654597e-07 4.32099547e-08
  3.93154920e-07 9.84957039e-01 8.30869284e-03 3.97608204e-08
  6.70878543e-03 1.16976953e-05]
 [1.21137347e-07 1.99952876e-09 1.36449376e-06 1.15867590e-06
  6.39622682e-04 2.09732275e-06 6.38211084e-09 5.66185452e-04
  4.46928432e-03 9.94320154e-01]]


# the same ten outputs rounded to two decimals for readability
print(Y_predict[:10].round(2))

[[0.   0.   0.   0.   0.   0.   0.   1.   0.   0.  ]
 [0.   0.   1.   0.   0.   0.   0.   0.   0.   0.  ]
 [0.   1.   0.   0.   0.   0.   0.   0.   0.   0.  ]
 [1.   0.   0.   0.   0.   0.   0.   0.   0.   0.  ]
 [0.   0.   0.   0.   1.   0.   0.   0.   0.   0.  ]
 [0.   1.   0.   0.   0.   0.   0.   0.   0.   0.  ]
 [0.   0.   0.   0.   0.35 0.   0.   0.   0.45 0.19]
 [0.   0.   0.   0.   0.   0.   0.   0.   0.   1.  ]
 [0.   0.   0.   0.   0.   0.98 0.01 0.   0.01 0.  ]
 [0.   0.   0.   0.   0.   0.   0.   0.   0.   0.99]]


# predicted class = index of the largest output in each row
y_predict = np.argmax(Y_predict, axis=-1)


# predicted labels for the first ten test images
print(y_predict[:10])

[7 2 1 0 4 1 8 9 5 9]


# accuracy computed by hand: fraction of test images whose predicted label
# equals the true label
is_correct = y_predict == y_test
my_acc = np.mean(is_correct)
print('My accuracy computation says:', my_acc, sep='\n')

My accuracy computation says:
0.9837


# put the true and predicted labels of the first ten test images side by side
label_report = (
    ('Actual labels are:', y_test[:10]),
    ('Predicted labels are:', y_predict[:10]),
)
for heading, labels in label_report:
    print(heading, labels, sep='\n')

Actual labels are:
[7 2 1 0 4 1 4 9 5 9]
Predicted labels are:
[7 2 1 0 4 1 8 9 5 9]


# indices of the test images whose predicted label differs from the true label
incorrect_labels = np.flatnonzero(y_predict != y_test)
num_incorrect = incorrect_labels.size
print('There are '+str(num_incorrect)+' incorrectly classified images')

There are 163 incorrectly classified images


# show the first misclassified test images in a 3x3 grid, each titled with
# its true label and the label the model predicted
plt.figure(figsize=(15,15))
for k, index in enumerate(incorrect_labels[:9]): # at most 9 examples fill the 3x3 grid; fewer are drawn if fewer images were misclassified
    plt.subplot(3,3,k+1) # select the current subplot
    plt.imshow(np.squeeze(X_test[index,:,:]),cmap='gray') # plot the image
    plt.title('Actual:'+str(y_test[index])+' Predicted:'+str(y_predict[index]))
    plt.axis('off')
plt.show() # render the figure explicitly, as the other plotting cells do


# evaluate model3 (tanh output layer) on the MNIST test set
score = model3.evaluate(x=X_test, y=Y_test, verbose=1)
print(score)

# predicted class = index of the largest output in each row
Y_predict = model3.predict(x=X_test, verbose=1)
y_predict = np.argmax(Y_predict, axis=-1)

# accuracy computed by hand for comparison with the value keras reported
my_acc = np.mean(y_predict == y_test)
print('My accuracy computation says:', my_acc, sep='\n')

# inspect the raw outputs of the network
print(Y_predict)

10000/10000 [==============================] - 8s 773us/step
[8.057436024475098, 0.10090000182390213]
10000/10000 [==============================] - 3s 323us/step
My accuracy computation says:
0.1009
[[-0.973072   -0.8842376   0.96776295 ...  0.98423636  0.9954213
   0.9915314 ]
 [-0.9976873  -0.8748546   0.99810606 ...  0.99707055  0.9997076
   0.99870926]
 [-0.90909916 -0.8807202   0.8966731  ...  0.86087024  0.9748953
   0.9491585 ]
 ...
 [-0.98996896 -0.96023846  0.9889787  ...  0.99146676  0.99941707
   0.9986351 ]
 [-0.989946   -0.9145103   0.9892308  ...  0.9919738   0.99909675
   0.99780166]
 [-0.99878985 -0.96146595  0.99856424 ...  0.9987184   0.9999072
   0.9996895 ]]


# evaluate model4 (compiled with binary_crossentropy) on the MNIST test set
score = model4.evaluate(x=X_test, y=Y_test, verbose=1)
print(score)

# predicted class = index of the largest output in each row
Y_predict = model4.predict(x=X_test, verbose=1)
y_predict = np.argmax(Y_predict, axis=-1)

# accuracy computed by hand from the argmax labels.
# NOTE(review): in the recorded run this value is lower than the accuracy
# returned by evaluate(); presumably keras scores the 10 outputs separately
# when the loss is binary_crossentropy - confirm against the keras docs.
my_acc = np.mean(y_predict == y_test)
print('My accuracy computation says:', my_acc, sep='\n')

# inspect the raw outputs of the network
print(Y_predict)

10000/10000 [==============================] - 7s 678us/step
[0.009117328152665869, 0.9967696070671082]
10000/10000 [==============================] - 3s 329us/step
My accuracy computation says:
0.9831
[[5.9873059e-07 3.5044065e-10 1.0003435e-07 ... 9.9999797e-01
  1.1135760e-07 5.5747341e-07]
 [2.1488156e-06 8.6308628e-06 9.9998629e-01 ... 3.1622252e-10
  7.8438552e-07 1.0652504e-10]
 [7.1815870e-05 9.9565083e-01 1.2233267e-03 ... 4.1579080e-04
  2.2510721e-03 1.3366683e-05]
 ...
 [2.7786931e-09 2.8147473e-09 1.9756570e-09 ... 2.9908915e-06
  3.6714137e-05 4.7742269e-05]
 [8.2209077e-08 7.3970114e-09 9.7479913e-10 ... 9.9465547e-09
  1.2571395e-04 2.8228129e-08]
 [1.6427188e-07 8.0722729e-10 3.2076801e-05 ... 7.6732789e-09
  1.1046466e-06 7.8044499e-10]]


# load Fashion-MNIST and apply the same preprocessing used for MNIST:
# trailing channel axis, float32 intensities divided by 255, one-hot labels
(X_train_f, y_train_f), (X_test_f, y_test_f) = fashion_mnist.load_data()

# training split
X_train_f = X_train_f.reshape(len(X_train_f), 28, 28, 1).astype('float32') / 255
Y_train_f = np_utils.to_categorical(y_train_f, 10)

# test split
X_test_f = X_test_f.reshape(len(X_test_f), 28, 28, 1).astype('float32') / 255
Y_test_f = np_utils.to_categorical(y_test_f, 10)

Downloading data from http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz
32768/29515 [=================================] - 0s 5us/step
Downloading data from http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz
26427392/26421880 [==============================] - 21s 1us/step
Downloading data from http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz
8192/5148 [===============================================] - 0s 0us/step
Downloading data from http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz
4423680/4422102 [==============================] - 5s 1us/step


# apply the MNIST-trained model1, unchanged, to the Fashion-MNIST test set
score = model1.evaluate(x=X_test_f, y=Y_test_f, verbose=1)
print(score)

10000/10000 [==============================] - 7s 672us/step
[4.987198582458496, 0.1193000003695488]


# display the first Fashion-MNIST test image and report its class label
plt.figure()
plt.imshow(np.squeeze(X_test_f[0]),cmap='gray')
plt.show()
# the label must come from the Fashion-MNIST label vector (y_test_f);
# y_test holds the MNIST digit labels and belongs to a different image
print('This image is class '+str(y_test_f[0])+' in the Fashion-MNIST dataset')

This image is class 7 in the Fashion-MNIST dataset


# classify the first Fashion-MNIST test image with the MNIST-trained model1;
# the [:1] slice keeps the leading batch axis, giving shape (1, 28, 28, 1)
single_image_batch = X_test_f[:1]
Y_example = model1.predict(x=single_image_batch, verbose=1)
y_example = np.argmax(Y_example)
print(y_example)

1/1 [==============================] - 0s 14ms/step
1


# transfer learning, variant 1: copy model1 (architecture and weights),
# freeze every layer except the last one, and retrain on Fashion-MNIST
mnist_weights = model1.get_weights()
model1_f = keras.models.clone_model(model1)
model1_f.set_weights(mnist_weights)

frozen_layers = model1_f.layers[:-1]  # everything but the output layer
for frozen_layer in frozen_layers:
    frozen_layer.trainable = False

model1_f.compile(
    loss='categorical_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
)

model1_f.fit(x=X_train_f, y=Y_train_f, batch_size=64, epochs=1, verbose=1)

Epoch 1/1
60000/60000 [==============================] - 23s 389us/step - loss: 1.2105 - accuracy: 0.5974s - loss: 1.2147 - accuracy

<keras.callbacks.callbacks.History at 0x16b70101d88>


# evaluate the retrained model on the Fashion-MNIST test set
score = model1_f.evaluate(x=X_test_f, y=Y_test_f, verbose=1)
print(score)

10000/10000 [==============================] - 8s 760us/step
[0.7792962156295776, 0.729200005531311]


# evaluate the retrained model on the original MNIST test set
score = model1_f.evaluate(x=X_test, y=Y_test, verbose=1)
print(score)

10000/10000 [==============================] - 7s 738us/step
[4.2286063625335695, 0.3264999985694885]


# transfer learning, variant 2: copy model1 (architecture and weights),
# freeze every layer except the last two, and retrain on Fashion-MNIST
mnist_weights = model1.get_weights()
model1_f = keras.models.clone_model(model1)
model1_f.set_weights(mnist_weights)

frozen_layers = model1_f.layers[:-2]  # everything but the two final layers
for frozen_layer in frozen_layers:
    frozen_layer.trainable = False

model1_f.compile(
    loss='categorical_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
)

model1_f.fit(x=X_train_f, y=Y_train_f, batch_size=64, epochs=1, verbose=1)

# evaluate the retrained model on the Fashion-MNIST test set
score = model1_f.evaluate(x=X_test_f, y=Y_test_f, verbose=1)
print(score)

Epoch 1/1
60000/60000 [==============================] - 33s 546us/step - loss: 0.4156 - accuracy: 0.8545
10000/10000 [==============================] - 3s 338us/step
[0.32236459945440293, 0.8853999972343445]


# write both trained models to HDF5 files in the current working directory
model1.save(filepath='model1.h5')
model1_f.save(filepath='model1_f.h5')


# read the two saved models back from their HDF5 files
model1 = load_model(filepath='model1.h5')
model1_f = load_model(filepath='model1_f.h5')

Tutorial 3: Deep Learning for Images¶

Laura E. Boucheron, Electrical & Computer Engineering, NMSU¶

October 2020¶

Overview¶

Section 0: Preliminaries¶

A Note on Jupyter Notebooks¶

Section 0.3a Import Necessary Libraries (For users using a local machine)¶

Section 0.3b Build the Conda Environment (For users using the ARS HPC Ceres with JupyterLab)¶

Section 1: The MNIST Dataset¶

1.1 Importing the MNIST dataset¶

Printing out the current backend¶

A note on other standard datasets included in keras¶

1.2 Load training and test data¶

A note on the variable name conventions¶

1.3 Checking dimensionality of the MNIST data variables¶

A note on tensors¶

1.4 Visualizing an MNIST image¶

Your turn: ¶

1.5 MNIST label vectors¶

Your turn: ¶

1.6 A visualization of the digit variation in MNIST¶

Section 2: Data Preprocessing (Dimensionality Wrangling)¶

2.1 Input data dimensionality considerations¶

A note on the importance of dimensionality¶

Your turn: ¶

Your turn: ¶

2.2 Input data intensity scaling considerations¶

Your turn: ¶

Casting the data as float¶

Your turn: ¶

A note on other common data preprocessing methods¶

A note on the use of float32 or float64¶

2.3 Label vector coding¶

2.3.1 Dimensionality of the loaded label vectors¶

2.3.2 A brief introduction to one-hot coding¶

2.3.3 What do labels "mean"?¶

A very important note on the abstractness of labels¶

2.3.4 Converting labels to one-hot coding¶

Your turn: ¶

2.3.5 Converting labels from one-hot coding¶

Section 3: Building a CNN for MNIST¶

3.1 Import necessary keras library functions¶

3.2 Define the model architecture¶

3.3 Compile the model¶

3.4 Train the model¶

3.5 Some Common Errors in Defining, Compiling, and Training the Model¶

3.5.1 Errors that actually report as errors¶

Your turn: ¶

Your turn: ¶

Your turn: ¶

3.5.2 Errors that don't appear to be errors at first¶

Section 4: Testing the Trained CNN¶

4.1 Determining accuracy on test data¶

4.2 Determining the predicted labels¶

4.2.1 Determining the one-hot labels¶

4.2.2 Determining the numerical class labels¶

4.2.3 Comparing the predicted labels to the ground truth¶

4.2.4 Investigate errors in classification¶

Your turn: ¶

Section 5: Transfer Learning¶

5.1 Applying the MNIST Network Directly to Fashion-MNIST¶

5.2 Adapting the MNIST Model for Fashion-MNIST (Transfer Learning)¶

Your turn: ¶

Your turn: ¶

Your turn: ¶

Section 6: Saving Trained Models¶