machine-learning/Autoencoder/image_encoder.py at master · adminho/machine-learning · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
import time
import datetime
import random

import numpy as np
import matplotlib.pyplot as plt

from keras.models import Model
from keras.models import Sequential
from keras.layers.core import Dense
from keras.datasets import mnist

#np.random.seed(137)  # for reproducibility
def plotExampleImg(title,imageData, decodedData, Ydigits):
	fig, ax = plt.subplots(2, 10, figsize=(10, 2))
	plt.gcf().canvas.set_window_title(title)
	#fig.set_facecolor('#FFFFFF')
	for num in range(0,10):
		numberImg = imageData[np.where(Ydigits == num)[0]]
		imgDecoded = decodedData[np.where(Ydigits == num)[0]]
		#Return random integers from 0 (inclusive) to high (exclusive).
		randomIndex = np.random.randint(0, numberImg.shape[0])
		#axList[num].imshow(numberImg[randomIndex], cmap=plt.cm.gray)
		plt.gray()
		ax[0][num].imshow(numberImg[randomIndex])
		ax[0][num].set_axis_off()
		ax[1][num].imshow(imgDecoded[randomIndex])
		ax[1][num].set_axis_off()

	plt.show()


# n_input = 784 # MNIST data input (img shape: 28*28)
def build_neural_network(input_len):
	model = Sequential()
	model.add(Dense(input_dim=input_len, units=256 , activation='relu'))
	model.add(Dense(256, activation='relu'))
	# now model.output_shape == (None, 256)
	# note: `None` is the batch dimension.
	#
	model.add(Dense(128, activation='relu'))
	#now model.output_shape == (None, 128)
	#
	model.add(Dense(256, activation='relu'))
	model.add(Dense(256, activation='relu'))
	#now model.output_shape == (None, 256)

	model.add(Dense(input_len))
	#print(model.summary())

	# algorithim to train models use RMSProp
	# For a mean squared error regression problem
	model.compile(optimizer='rmsprop',
              loss='mse',
			  metrics=['accuracy'])
	return model

def trainModel(model, Xtrain, epochs=20):
	global_start_time = time.time()
	model.fit(Xtrain, Xtrain, batch_size=256, nb_epoch=epochs, verbose=0)
	sec = datetime.timedelta(seconds=int(time.time() - global_start_time))
	print ('Training duration : ', str(sec))

	# evaluate all training set after trained
	scores = model.evaluate(Xtrain, Xtrain, verbose=0)
	print("Evalute model: %s = %.4f" % (model.metrics_names[0] ,scores[0]))
	print("Evalute model: %s = %.4f" % (model.metrics_names[1] ,scores[1]*100))

	return model


if __name__ == "__main__":
	# Get MNIST Datasets
	(X_train, _), (X_test, Y_test) = mnist.load_data()
	_, heigh, width = X_train.shape
	total_pixel = heigh * width

	X_train = np.reshape(X_train, (-1, heigh * width))
	X_test = np.reshape(X_test, (-1, heigh * width))

	base_model = build_neural_network(X_train.shape[1])
	base_model = trainModel(base_model, X_train)
	print(base_model.summary())

	encoder_model = Model(inputs=base_model.input, outputs=base_model.get_layer("dense_2").output)
	print(encoder_model.summary())

	random_index = random.randint(0, X_test.shape[0])
	encoded = encoder_model.predict(np.array([X_test[random_index]]), verbose=0)
	print("Encoding digit:", Y_test[random_index])
	print("Encoding (examoke):\n", encoded[0:10])

	X_decoded = base_model.predict(X_test, verbose=0)
	# reshape to [example, heigh, width]
	X_decoded = np.reshape(X_decoded, (-1, heigh, width))
	X_test = np.reshape(X_test, (-1, heigh, width))
	print("Ploting...")
	plotExampleImg("Encoding and Decoding", X_test, X_decoded, Y_test)