Commit
Correcting optimization algorithms workflow.
1 parent 59a3990 · commit 2d7ba53
Showing 9 changed files with 299 additions and 460 deletions.
This file was deleted.
This file was deleted.
@@ -3,10 +3,15 @@
 Email: [email protected]
 Docs: https://giangtranml.github.io/ml/conv-net.html
 """
+import sys, os
+sys.path.append("..")
 import numpy as np
 from neural_network.neural_network import NeuralNetwork
 from nn_components.layers import ConvLayer, ActivationLayer, PoolingLayer, FlattenLayer, FCLayer, BatchNormLayer
 from nn_components.losses import CrossEntropy
+from libs.utils import one_hot_encoding, Trainer, preprocess_data, load_dataset_mnist
+from libs.mnist_lib import MNIST
+from optimizations_algorithms.optimizers import SGD, SGDMomentum, RMSProp, Adam
 
 class CNN(NeuralNetwork):
@@ -22,34 +27,134 @@ def __init__(self, optimizer:object, layers:list, loss_func:object=CrossEntropy(
         """
         super().__init__(optimizer, layers, loss_func)
 
-    def _structure(self, layers):
-        """
-        Structure function that initializes convolutional neural network architecture.
-
-        Parameters
-        ----------
-        layers: (list) a list of sequential layers. For convolutional neural network, it should have [ConvLayer, PoolingLayer, FCLayer,
-            ActivationLayer, BatchNormLayer, DropoutLayer]
-        """
-        for layer in layers:
-            if isinstance(layer, (ConvLayer, FCLayer, BatchNormLayer)):
-                layer.initialize_optimizer(self.optimizer)
-        return layers
-
-    def _backward(self, Y, Y_hat, X):
-        """
-        CNN backward propagation.
-
-        Parameters
-        ----------
-        Y: one-hot encoding label.
-            shape = (m, C).
-        Y_hat: output values of forward propagation NN.
-            shape = (m, C).
-        X: training dataset.
-            shape = (m, iW, iH, iC).
-        """
-        dA_prev = self._backward_last(Y, Y_hat)
-        for i in range(len(self.layers)-3, 0, -1):
-            dA_prev = self.layers[i].backward(dA_prev, self.layers[i-1])
-        _ = self.layers[i-1].backward(dA_prev, X)
+
+def main():
+    arch = [
+        ConvLayer(filter_size=(3, 3), filters=6, padding="SAME", stride=1, weight_init="he_normal"),
+        ActivationLayer(activation="relu"),
+        PoolingLayer(filter_size=(2, 2), stride=2, mode="max"),
+
+        ConvLayer(filter_size=(3, 3), filters=16, padding="SAME", stride=1, weight_init="he_normal"),
+        ActivationLayer(activation="relu"),
+        PoolingLayer(filter_size=(2, 2), stride=2, mode="max"),
+
+        ConvLayer(filter_size=(3, 3), filters=32, padding="SAME", stride=1, weight_init="he_normal"),
+        ActivationLayer(activation="relu"),
+        PoolingLayer(filter_size=(2, 2), stride=2, mode="max"),
+
+        FlattenLayer(),
+
+        FCLayer(num_neurons=128, weight_init="he_normal"),
+        ActivationLayer(activation="relu"),
+
+        FCLayer(num_neurons=64, weight_init="he_normal"),
+        ActivationLayer(activation="relu"),
+
+        FCLayer(num_neurons=10, weight_init="he_normal"),
+        ActivationLayer(activation="softmax")
+    ]
+
+    print("Train MNIST dataset by CNN with pure Python: Numpy.")
+    weight_path = "cnn_weights.pkl"
+    training_phase = weight_path not in os.listdir(".")
+    load_dataset_mnist("../libs")
+    mndata = MNIST('../libs/data_mnist', gz=True)
+
+    if training_phase:
+        images_train, labels_train = mndata.load_training()
+        images_train, labels_train = preprocess_data(images_train, labels_train, nn=True)
+
+        epochs = 5
+        batch_size = 64
+        learning_rate = 0.006
+
+        optimizer = Adam(alpha=learning_rate)
+        loss_func = CrossEntropy()
+
+        cnn = CNN(optimizer=optimizer, layers=arch, loss_func=loss_func)
+
+        trainer = Trainer(cnn, batch_size, epochs)
+        trainer.train(images_train, labels_train)
+        trainer.save_model(weight_path)
+    else:
+        import pickle
+        images_test, labels_test = mndata.load_testing()
+        images_test, labels_test = preprocess_data(images_test, labels_test, nn=True, test=True)
+        with open(weight_path, "rb") as f:
+            cnn = pickle.load(f)
+        pred = cnn.predict(images_test)
+
+        print("Accuracy:", len(pred[labels_test == pred]) / len(pred))
+        from sklearn.metrics import confusion_matrix
+
+        print("Confusion matrix: ")
+        print(confusion_matrix(labels_test, pred))
+
+
+def test():
+    import numpy as np
+    from nn_components.layers import ConvLayer, PoolingLayer
+    from optimizations_algorithms.optimizers import SGD
+    import tensorflow as tf
+    tf.enable_eager_execution()
+
+    filter_size = (3, 3)
+    filters = 16
+    padding = "SAME"
+    stride = 1
+
+    optimizer = SGD()
+
+    conv_layer = ConvLayer(filter_size=filter_size, filters=filters, padding=padding, stride=stride)
+
+    pool_filter_size = (2, 2)
+    pool_stride = 2
+    pool_mode = "max"
+    pool_layer = PoolingLayer(filter_size=pool_filter_size, stride=pool_stride, mode=pool_mode)
+
+    X = np.random.normal(size=(16, 12, 12, 3))
+
+    d_prev = np.random.normal(size=(16, 12, 12, 16))
+
+    my_conv_forward = conv_layer.forward(X)
+    my_dA, my_dW = conv_layer.backward(d_prev, X)
+    my_pool_forward = pool_layer.forward(X)
+
+    with tf.device("/cpu:0"):
+        tf_conv_forward = tf.nn.conv2d(X, conv_layer.W, strides=(stride, stride), padding=padding).numpy()
+        tf_dW = tf.nn.conv2d_backprop_filter(X, filter_sizes=filter_size + (X.shape[-1], filters), out_backprop=d_prev,
+                                             strides=(1, stride, stride, 1), padding=padding).numpy()
+        tf_dA = tf.nn.conv2d_backprop_input(input_sizes=X.shape, filter=conv_layer.W, out_backprop=d_prev,
+                                            strides=(1, stride, stride, 1), padding=padding).numpy()
+
+        tf_pool_forward = tf.nn.max_pool2d(X, ksize=pool_filter_size, strides=(pool_stride, pool_stride), padding="VALID")
+
+    blank = "----------------------"
+    print(blank + "TEST FORWARD CONVOLUTION" + blank)
+    forward_result = np.allclose(my_conv_forward, tf_conv_forward)
+    forward_out = "PASS" if forward_result else "FAIL"
+    print("====> " + forward_out)
+
+    print(blank + "TEST BACKWARD CONVOLUTION" + blank)
+    dW_result = np.allclose(my_dW, tf_dW)
+    dW_out = "PASS" if dW_result else "FAIL"
+    print("====> dW case: " + dW_out)
+    dA_result = np.allclose(my_dA, tf_dA)
+    dA_out = "PASS" if dA_result else "FAIL"
+    print("====> dA case: " + dA_out)
+
+    print(blank + "TEST FORWARD POOLING" + blank)
+    pool_result = np.allclose(my_pool_forward, tf_pool_forward)
+    pool_out = "PASS" if pool_result else "FAIL"
+    print("====> " + pool_out)
+
+
+if __name__ == "__main__":
+    import argparse
+
+    parser = argparse.ArgumentParser(description="A CNN program.")
+    parser.add_argument("--test", action="store_true", help="Run the test cases.")
+    args = parser.parse_args()
+    if args.test:
+        test()
+    else:
+        main()
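Note on the optimizer workflow this commit corrects: a single optimizer instance (Adam(alpha=learning_rate) above) is now passed to the CNN constructor, and the per-layer attachment previously done in the removed CNN._structure (via layer.initialize_optimizer) is presumably handled by the NeuralNetwork base class. For reference, the sketch below shows the standard Adam update rule (Kingma and Ba, 2015) that such an optimizer computes. This is hypothetical code: only the alpha keyword comes from the diff above, and the real optimizations_algorithms.optimizers.Adam may be organized differently.

import numpy as np

class AdamSketch:
    # Standard Adam with bias correction; a sketch, not the repository's implementation.
    def __init__(self, alpha=0.006, beta1=0.9, beta2=0.999, eps=1e-8):
        self.alpha, self.beta1, self.beta2, self.eps = alpha, beta1, beta2, eps
        self.m = None  # running mean of gradients (first moment)
        self.v = None  # running mean of squared gradients (second moment)
        self.t = 0     # update counter, used for bias correction

    def step(self, W, dW):
        if self.m is None:
            self.m, self.v = np.zeros_like(W), np.zeros_like(W)
        self.t += 1
        self.m = self.beta1 * self.m + (1 - self.beta1) * dW
        self.v = self.beta2 * self.v + (1 - self.beta2) * dW ** 2
        m_hat = self.m / (1 - self.beta1 ** self.t)  # bias-corrected first moment
        v_hat = self.v / (1 - self.beta2 ** self.t)  # bias-corrected second moment
        return W - self.alpha * m_hat / (np.sqrt(v_hat) + self.eps)

A trainable layer would apply something like W = opt.step(W, dW) once per minibatch. As the __main__ block shows, running the script with no arguments trains the MNIST model (or evaluates it if cnn_weights.pkl already exists), while the --test flag runs the TensorFlow comparison checks in test().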