machine-learning/src/mlp.py at master · vojtechcima/machine-learning · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
import tensorflow as tf
from tensorflow.examples.tutorials.mnist import input_data


class NeuralNet:
    """Multilayer perceptron for multiclass classification (TensorFlow 1.x).

    The network is a stack of fully connected layers described by ``shape``.
    ``shape[0]`` MUST match the dimension of one data sample and
    ``shape[-1]`` MUST match the number of classes (labels). Every layer
    except the last one is followed by a ReLU; the last layer returns raw,
    unscaled logits.
    """

    def __init__(self, learning_rate, shape, session):
        """Build the graph and initialise its variables.

        :param learning_rate: learning rate handed to the Adam optimizer
        :param shape: sequence of layer sizes, input layer first; at least
            two entries (input and output) are required
        :param session: TensorFlow session used to run every op of the net
        :raises ValueError: if ``shape`` has fewer than two entries
        """
        # Without an input and an output layer no weight matrix exists and
        # feed_forward would have nothing to return, so fail early and
        # clearly instead of deep inside TensorFlow.
        if len(shape) < 2:
            raise ValueError(
                "shape must contain at least an input and an output layer, "
                "got %r" % (shape,))

        self.session = session
        self.learning_rate = learning_rate
        self.shape = shape
        self.weights = self.init_weights()
        self.biases = self.init_biases()

        # Placeholders for inputs and (one-hot sized) labels
        self.x = tf.placeholder(tf.float32, [None, shape[0]])
        self.y_ = tf.placeholder(tf.float32, [None, shape[-1]])

        # Neural network model (logits)
        self.y = self.feed_forward()

        # Define loss J and optimizer
        self.J = tf.reduce_mean(
            tf.nn.softmax_cross_entropy_with_logits(
                logits=self.y, labels=self.y_))
        self.optimizer = tf.train.AdamOptimizer(
            learning_rate=learning_rate).minimize(self.J)

        # Define accuracy calculation: fraction of samples whose largest
        # logit sits at the same index as the largest label entry.
        self.correct_prediction = tf.equal(
            tf.argmax(self.y, 1), tf.argmax(self.y_, 1))
        self.accuracy = tf.reduce_mean(
            tf.cast(self.correct_prediction, tf.float32))

        # Must run after the optimizer is created so that the optimizer's
        # own variables are initialised as well.
        tf.global_variables_initializer().run(session=self.session)

    def train(self, max_iter, data_set, batch_size=50, log_every=10):
        """ Trains the network with mini-batches and prints progress.

        :param max_iter: number of optimizer steps to perform
        :param data_set: object providing ``train.next_batch(n)`` (returning
            an ``(inputs, labels)`` pair), ``test.images`` and
            ``test.labels``
        :param batch_size: number of samples requested per step
        :param log_every: print accuracies every ``log_every`` iterations;
            a falsy value disables the progress output
        """
        for i in range(max_iter):
            batch = data_set.train.next_batch(batch_size)
            batch_feed = {self.x: batch[0], self.y_: batch[1]}
            self.optimizer.run(batch_feed, session=self.session)

            if log_every and i % log_every == 0:
                # "ts" is measured on the batch just trained on, "vs" on
                # the full ``data_set.test`` split.
                batch_accuracy = self.accuracy.eval(
                    batch_feed, session=self.session)
                test_accuracy = self.accuracy.eval(
                    {self.x: data_set.test.images,
                     self.y_: data_set.test.labels},
                    session=self.session)
                print("Iteration: %s, Accuracy (ts): %s, Accuracy (vs): %s" %
                      (i, batch_accuracy, test_accuracy))

    def init_weights(self):
        """ Randomly initializes weight matrices.

        One ``[shape[i], shape[i + 1]]`` matrix is created per pair of
        consecutive layers, drawn from ``tf.random_normal``.

        :return: dict mapping layer index to its weight variable
        """
        layer_pairs = zip(self.shape[:-1], self.shape[1:])
        return {
            i: tf.Variable(tf.random_normal([n_in, n_out]))
            for i, (n_in, n_out) in enumerate(layer_pairs)
        }

    def init_biases(self):
        """ Randomly initializes bias vectors.

        One vector of length ``shape[i + 1]`` is created for every layer
        after the input layer, drawn from ``tf.random_normal``.

        :return: dict mapping layer index to its bias variable
        """
        return {
            i: tf.Variable(tf.random_normal([n_out]))
            for i, n_out in enumerate(self.shape[1:])
        }

    def feed_forward(self):
        """ Creates the neural network representation and workflow.

        :return: UNSCALED output (logits) of the last layer
        """
        last_idx = len(self.shape) - 2
        signal = self.x
        for i in range(last_idx + 1):
            pre_activation = tf.add(
                tf.matmul(signal, self.weights[i]), self.biases[i])
            if i == last_idx:
                # Don't scale the output of the last layer as it's taken
                # care of within the softmax_cross_entropy_with_logits
                # function when calculating the error. This also holds
                # when the first layer is the last one (no hidden layers).
                signal = pre_activation
            else:
                signal = tf.nn.relu(pre_activation)
        return signal


def main():
    """Train a 784-256-256-10 network on MNIST, printing accuracy on the way.

    The MNIST data is read from ``../data/mnist/`` with one-hot labels.
    """
    learning_rate = 0.01
    max_iter = 10000

    # Define network shape as follows:
    #  * the input layer matches the data dimension (784 pixels per image).
    #  * the two hidden layers contain 256 neurons each.
    #  * the last layer contains 10 neurons, which is also the number of
    #    classes.
    # Note: while the dimensions of the first and the last layer must match
    # the dataset parameters, the number of hidden layers and the number of
    # neurons in these layers can be customised and will affect the
    # classification results.
    shape = (784, 256, 256, 10)

    mnist = input_data.read_data_sets("../data/mnist/", one_hot=True)

    # The context manager closes the session even when building the graph
    # or training raises, so its resources are never leaked.
    with tf.Session() as session:
        nn = NeuralNet(learning_rate, shape, session)
        nn.train(max_iter, mnist)

# Run the training demo only when this file is executed as a script, so that
# importing the module has no side effects.
if __name__ == "__main__":
    main()