forked from Matuzas77/MNIST-0.17
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathmain.py
More file actions
101 lines (68 loc) · 4.24 KB
/
main.py
File metadata and controls
101 lines (68 loc) · 4.24 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
import tensorflow as tf
import numpy as np
from tensorflow.keras import optimizers
from sklearn.metrics import accuracy_score
from tensorflow.keras.datasets import mnist
(x_train, y_train), (x_test, y_test) = mnist.load_data()
x_train, x_test = np.array(x_train, np.float32), np.array(x_test, np.float32)
x_train, x_test = x_train / 255-0.5, x_test / 255-0.5
y_train=tf.keras.utils.to_categorical(y_train,10)
y_test=tf.keras.utils.to_categorical(y_test,10)
x_train=np.expand_dims(x_train,axis=-1)
x_test=np.expand_dims(x_test,axis=-1)
def squeeze_excite_block2D(filters,input): # squeeze and exite is a good thing
se = tf.keras.layers.GlobalAveragePooling2D()(input)
se = tf.keras.layers.Reshape((1, filters))(se)
se = tf.keras.layers.Dense(filters//32, activation='relu')(se)
se = tf.keras.layers.Dense(filters, activation='sigmoid')(se)
se = tf.keras.layers.multiply([input, se])
return se
datagen = tf.keras.preprocessing.image.ImageDataGenerator(rotation_range=10, width_shift_range=0.1, shear_range=10,
height_shift_range=0.1, zoom_range=0.2)
datagen.fit(x_train)
datagen2 = tf.keras.preprocessing.image.ImageDataGenerator()
datagen2.fit(x_test)
def make_model():
s = tf.keras.Input(shape=x_train.shape[1:])
x = tf.keras.layers.Conv2D(128,(3,3),activation='relu',padding='same')(s)
x = tf.keras.layers.Conv2D(128,(3,3),activation='relu',padding='same')(x)
x = tf.keras.layers.Conv2D(128,(3,3),activation='relu',padding='same')(x)
x = tf.keras.layers.BatchNormalization()(x)
x = squeeze_excite_block2D(128,x)
x = tf.keras.layers.Conv2D(128,(3,3),activation='relu',padding='same')(x)
x = tf.keras.layers.Conv2D(128,(3,3),activation='relu',padding='same')(x)
x = tf.keras.layers.Conv2D(128,(3,3),activation='relu',padding='same')(x)
x = tf.keras.layers.BatchNormalization()(x)
x = squeeze_excite_block2D(128,x)
x = tf.keras.layers.AveragePooling2D(2)(x)
x = tf.keras.layers.Conv2D(128,(3,3),activation='relu',padding='same')(x)
x = tf.keras.layers.Conv2D(128,(3,3),activation='relu',padding='same')(x)
x = tf.keras.layers.Conv2D(128,(3,3),activation='relu',padding='same')(x)
x = tf.keras.layers.BatchNormalization()(x)
x = squeeze_excite_block2D(128,x)
x = tf.keras.layers.AveragePooling2D(2)(x)
x = tf.keras.layers.concatenate([tf.keras.layers.GlobalMaxPooling2D()(x),
tf.keras.layers.GlobalAveragePooling2D()(x)])
x = tf.keras.layers.Dense(10,activation='softmax',use_bias=False,
kernel_regularizer=tf.keras.regularizers.l1(0.00025))(x) # this make stacking better
return tf.keras.Model(inputs=s, outputs=x)
batch_size=32
supermodel=[]
for i in range(3):
np.random.seed(i)
model=make_model()
model.compile(optimizer=optimizers.Adam(lr=0.001), loss='categorical_crossentropy',metrics=['accuracy'])
model.fit_generator(datagen.flow(x_train, y_train, batch_size=batch_size,shuffle=True),
steps_per_epoch=len(x_train) / batch_size, epochs=13,verbose=0)
model.compile(optimizer=optimizers.Adam(lr=0.0001), loss='categorical_crossentropy',metrics=['accuracy'])
model.fit_generator(datagen.flow(x_train, y_train, batch_size=batch_size,shuffle=True),
steps_per_epoch=len(x_train) / batch_size, epochs=3,verbose=0)
model.compile(optimizer=optimizers.Adam(lr=0.00001), loss='categorical_crossentropy',metrics=['accuracy'])
model.fit_generator(datagen.flow(x_train, y_train, batch_size=batch_size,shuffle=True),
steps_per_epoch=len(x_train) / batch_size, epochs=3,verbose=0)
model.fit(x_train, y_train, batch_size=batch_size,shuffle=True, epochs=1,verbose=0)
model.save("model"+str(i))
supermodel.append(model)
print(i,'acc:',accuracy_score(np.argmax(y_test,axis=1),np.argmax(model.predict(x_test),axis=1)))
P=np.asarray([a.predict(x_test) for a in supermodel])
accuracy_score(np.argmax(y_test,axis=1),np.argmax(np.mean(P,axis=0),axis=1)) # 20 models stack accurasy