# fashionRecognitionCNN.py
# Trains and evaluates a Keras CNN on the Fashion-MNIST CSV data set.
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import matplotlib.image as mpimg
import seaborn as sns
np.random.seed(2)
from sklearn.metrics import accuracy_score
from sklearn.metrics import classification_report
from sklearn.model_selection import train_test_split
from sklearn.metrics import confusion_matrix
import itertools
from keras.utils.np_utils import to_categorical # convert to one-hot-encoding
from keras.models import Sequential
from keras.layers import Dense, Dropout, Flatten, Conv2D, MaxPool2D
from keras.optimizers import RMSprop
from keras.preprocessing.image import ImageDataGenerator
from keras.callbacks import ReduceLROnPlateau
import time
# Remember when the run began: `seconds` is the raw epoch timestamp and
# `time_start` is its human-readable form as produced by time.ctime().
seconds = time.time()
time_start = time.ctime(seconds)
print("start time:", time_start, "\n")
def getData(path):
    """Read the CSV file at ``path`` and return its contents as a pandas DataFrame."""
    return pd.read_csv(path)
def fashion_Recognition_CNN_Model(input_shape=(28, 28, 1), num_classes=10):
    """Build the (uncompiled) CNN used to classify the fashion images.

    Architecture:
        [[Conv2D -> relu] * 2 -> MaxPool2D -> Dropout] * 2
        -> Flatten -> Dense -> Dropout -> softmax output

    Args:
        input_shape: Shape of a single input sample passed to the first
            convolution. Defaults to ``(28, 28, 1)``, the value that was
            previously hard-coded.
        num_classes: Number of units in the final softmax layer.
            Defaults to ``10``, the value that was previously hard-coded.

    Returns:
        A keras ``Sequential`` model. It is not compiled here; the caller
        chooses the optimizer, loss and metrics.
    """
    model = Sequential()

    # First convolutional stage: two 5x5 convolutions with 32 filters each.
    # 'same' padding keeps the spatial size unchanged through the convolutions.
    model.add(Conv2D(filters=32, kernel_size=(5, 5), padding='same',
                     activation='relu', input_shape=input_shape))
    model.add(Conv2D(filters=32, kernel_size=(5, 5), padding='same',
                     activation='relu'))
    model.add(MaxPool2D(pool_size=(2, 2)))
    model.add(Dropout(0.25))

    # Second convolutional stage: two 3x3 convolutions with 64 filters each.
    model.add(Conv2D(filters=64, kernel_size=(3, 3), padding='same',
                     activation='relu'))
    model.add(Conv2D(filters=64, kernel_size=(3, 3), padding='same',
                     activation='relu'))
    model.add(MaxPool2D(pool_size=(2, 2), strides=(2, 2)))
    model.add(Dropout(0.25))

    # Classifier head: flatten the feature maps, one hidden dense layer with
    # dropout, then one softmax unit per class.
    model.add(Flatten())
    model.add(Dense(256, activation="relu"))
    model.add(Dropout(0.5))
    model.add(Dense(num_classes, activation="softmax"))
    return model
# Confusion-matrix plotting helper
def plot_confusion_matrix(cm, classes,
                          normalize=False,
                          title='Confusion matrix',
                          cmap=plt.cm.Blues,
                          filename="confusion_matrix.png"):
    """Draw a confusion matrix as an annotated heat map and save it to disk.

    The heat map is drawn with the pyplot state-machine API, i.e. on whatever
    figure/axes is current when the function is called, and is then written
    to ``filename``. The figure is not shown and not closed.

    Args:
        cm: 2-D confusion matrix (rows are true labels, columns are predicted
            labels, matching the axis labels set below).
        classes: Sequence of tick labels, one per class.
        normalize: If True, each row is divided by its row total before
            plotting, so both the colours and the cell annotations show
            per-true-class fractions.
        title: Title placed above the plot.
        cmap: Matplotlib colour map used for the heat map.
        filename: Path the figure is saved to. Defaults to
            ``"confusion_matrix.png"``, the previously hard-coded value.
    """
    cm = np.asarray(cm)

    # Normalise BEFORE drawing so the colours agree with the annotated values.
    if normalize:
        row_totals = cm.sum(axis=1, keepdims=True)
        # Rows without any samples stay at 0 instead of turning into NaN.
        cm = np.divide(cm.astype('float'), row_totals,
                       out=np.zeros(cm.shape, dtype=float),
                       where=row_totals != 0)

    # Integer counts are printed as-is; fractional values with two decimals.
    cell_format = 'd' if np.issubdtype(cm.dtype, np.integer) else '.2f'

    plt.imshow(cm, interpolation='nearest', cmap=cmap)
    plt.title(title)
    plt.colorbar()
    tick_marks = np.arange(len(classes))
    plt.xticks(tick_marks, classes, rotation=45)
    plt.yticks(tick_marks, classes)

    # Cells darker than half of the maximum get white text for contrast.
    thresh = cm.max() / 2.
    for i, j in itertools.product(range(cm.shape[0]), range(cm.shape[1])):
        plt.text(j, i, format(cm[i, j], cell_format),
                 horizontalalignment="center",
                 color="white" if cm[i, j] > thresh else "black")

    plt.tight_layout()
    plt.ylabel('True label')
    plt.xlabel('Predicted label')
    plt.savefig(filename)
# ---- Data loading and preparation ----
dataset = getData("./FashionMNIST_Train_Test.csv")

# Hold out 20% of the rows as the test set (fixed seed for repeatability).
Train_Dataset, Test_dataset = train_test_split(dataset, test_size=0.2, random_state=2)

# The 'label' column is the target; every other column is a feature.
Y_train, X_train = Train_Dataset['label'], Train_Dataset.drop(columns=['label'])
Y_test, X_test = Test_dataset['label'], Test_dataset.drop(columns=['label'])
print("X_train ,X_test ,Y_train ,Y_test :",X_train.shape,X_test.shape,Y_train.shape,Y_test.shape,"\n")

# Turn each flat feature row into a 28 x 28 x 1 array (height, width, depth).
X_train = X_train.values.reshape(-1, 28, 28, 1)
X_test = X_test.values.reshape(-1, 28, 28, 1)
print("After Reshaping (28*28*1) : ",X_train.shape,X_test.shape,"\n")

# Scale the features by 1/255 (original note: the CNN converges faster on
# [0..1] data than on [0..255] data).
X_train, X_test = X_train / 255.0, X_test / 255.0

# One-hot encode the labels (ex : 2 -> [0,0,1,0,0,0,0,0,0,0]).
# NOTE: `Y_Test` (capital T) holds the one-hot test labels, while `Y_test`
# keeps the original integer labels; both are used further down.
Y_train = to_categorical(Y_train, num_classes=10)
Y_Test = to_categorical(Y_test, num_classes=10)

# Carve 10% of the training data off as a validation set for fitting.
X_train, X_val, Y_train, Y_val = train_test_split(X_train, Y_train, test_size=0.1, random_state=2)
print("Dataset shape after train and validation set split : X_train, Y_train, X_validation, Y_validation :",X_train.shape,Y_train.shape,X_val.shape,Y_val.shape,"\n")

# Human-readable names for the ten class labels, plus a lookup table.
class_labels = list(range(10))
class_names = ['T-shirt', 'Trouser', 'Pullover', 'Dress', 'Coat', 'Sandal', 'Shirt', 'Sneaker', 'Bag', 'Ankle boot']
articles = pd.DataFrame({'class_labels': class_labels, 'class_names': class_names})

# To eyeball a sample image: plt.imshow(X_train[6][:,:,0]); plt.show()
# ---- Model construction and training ----
model = fashion_Recognition_CNN_Model()

# Define the optimizer. `learning_rate` is the current name of the argument
# formerly spelled `lr`.
optimizer = RMSprop(learning_rate=0.001, rho=0.9, epsilon=1e-08, decay=0.0)

# Compile the model. The "accuracy" metric is what produces the 'accuracy' /
# 'val_accuracy' entries read from the training history later in the script.
model.compile(optimizer=optimizer, loss="categorical_crossentropy", metrics=["accuracy"])

# Learning-rate annealer: halve the learning rate (factor=0.5) when the
# validation accuracy has not improved for 3 epochs, never going below 1e-5.
# The monitored key must match the metric name used above ('val_accuracy').
learning_rate_reduction = ReduceLROnPlateau(monitor='val_accuracy',
                                            patience=3,
                                            verbose=1,
                                            factor=0.5,
                                            min_lr=0.00001)

# Number of passes over the training data. The original author's note suggests
# raising this (e.g. to 30) for higher accuracy; that figure is not verified here.
epochs = 10
batch_size = 128

# The annealer only takes effect when it is handed to fit() as a callback.
history = model.fit(X_train, Y_train, batch_size=batch_size, epochs=epochs,
                    validation_data=(X_val, Y_val),
                    callbacks=[learning_rate_reduction])
print("\n","****************MODEL EVALUATION ************************\n")
# Score the trained model on the held-out test set; `Y_Test` is the one-hot
# encoded version of the test labels.
test_loss, test_acc = model.evaluate(X_test, Y_Test)
print("Accuracy on test data :",test_acc,"\n")

# Report the wall-clock time at which training and evaluation finished.
seconds = time.time()
time_stop = time.ctime(seconds)
print("\n","stop time:", time_stop,"\n")

# Per-class scores from the softmax output layer for every test sample.
Y_pred = model.predict(X_test)
# Collapse each row of scores to the index of its largest entry, i.e. the
# predicted integer class label (the inverse of one-hot encoding).
Y_pred_classes = Y_pred.argmax(axis=1)

# Compare the predictions with the integer test labels in `Y_test`.
accuracy = accuracy_score(Y_test, Y_pred_classes)
confusion_mtx = confusion_matrix(Y_test, Y_pred_classes)
print('Accuracy: %f' % accuracy)
prediction_res = pd.Series(Y_pred_classes, name="Label")

# Classification report: `Y_test` is a pandas Series, so hand its underlying
# 1-D array to classification_report together with the readable class names.
Y_Test_as_arrary = Y_test.array
print(classification_report(Y_Test_as_arrary, Y_pred_classes, target_names=class_names))
# ---- Training and validation curves ----
# Top panel: loss per epoch; bottom panel: accuracy per epoch.
fig, ax = plt.subplots(2, 1)
ax[0].plot(history.history['loss'], color='b', label="Training loss")
ax[0].plot(history.history['val_loss'], color='r', label="validation loss")
legend = ax[0].legend(loc='best', shadow=True)
ax[1].plot(history.history['accuracy'], color='b', label="Training accuracy")
ax[1].plot(history.history['val_accuracy'], color='r', label="Validation accuracy")
legend = ax[1].legend(loc='best', shadow=True)
fig.savefig("Loss_Accuracy.png")
# Close the curves figure so it is no longer the current pyplot figure;
# otherwise the confusion matrix below would be drawn on top of the
# accuracy panel instead of on a fresh figure.
plt.close(fig)

# ---- Confusion matrix ----
# Use the readable class names as tick labels, as in the classification report.
plot_confusion_matrix(confusion_mtx, classes=class_names)