Update spec and scripts

AntreasAntoniou 2017-11-06 17:27:08 +00:00
parent 90f7059240
commit 94fee2d2d4
4 changed files with 119 additions and 30 deletions

View File

@@ -0,0 +1,43 @@
import argparse

import numpy as np

from mlp.layers import BatchNormalizationLayer

parser = argparse.ArgumentParser(description='BatchNormalizationLayer test file generator')
parser.add_argument('--student_id', nargs="?", type=str,
                    help='Your student id in the format "sxxxxxxx"')
args = parser.parse_args()
student_id = args.student_id


def generate_inputs(student_id):
    # Build a (2, 3, 4, 4) test tensor whose entries depend on the digits of
    # the student id, so every student gets a unique test case.
    student_number = student_id
    # Use a float array so the student-number values below are not truncated to integers.
    tests = np.arange(96, dtype=float).reshape((2, 3, 4, 4))
    tests[:, 0, :, :] = float(student_number[1:3]) / 10 - 5
    tests[:, :, 1, :] = float(student_number[3:5]) / 10 - 5
    tests[:, 2, :, :] = float(student_number[5:7]) / 10 - 5
    tests[0, 1, :, :] = float(student_number[7]) / 10 - 5
    return tests


test_inputs = generate_inputs(student_id)
test_inputs = np.reshape(test_inputs, newshape=(2, -1))
test_grads_wrt_outputs = np.arange(-48, 48).reshape((2, -1))

# Produce BatchNormalizationLayer fprop, bprop and grads_wrt_params outputs.
activation_layer = BatchNormalizationLayer(input_dim=48)

beta = np.array(48 * [0.3])
gamma = np.array(48 * [0.8])

activation_layer.params = [gamma, beta]
BN_fprop = activation_layer.fprop(test_inputs)
BN_bprop = activation_layer.bprop(
    test_inputs, BN_fprop, test_grads_wrt_outputs)
BN_grads_wrt_params = activation_layer.grads_wrt_params(
    test_inputs, test_grads_wrt_outputs)

test_output = "BatchNormalization:\nFprop: {}\nBprop: {}\nGrads_wrt_params: {}\n"\
    .format(BN_fprop, BN_bprop, BN_grads_wrt_params)
with open("{}_batchnorm_test_file.txt".format(student_id), "w+") as out_file:
    out_file.write(test_output)
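For reference, below is a minimal sketch of the layer interface the script above exercises, filled in with the standard batch normalisation maths. It is not the mlp.layers skeleton, whose exact signatures may differ; treat it as an outline of the expected shapes and method names only.

# Sketch only (not the mlp.layers skeleton): the interface exercised above,
# with the usual per-feature batch normalisation over the batch dimension.
import numpy as np


class BatchNormalizationLayerSketch(object):

    def __init__(self, input_dim, epsilon=1e-5):
        self.input_dim = input_dim
        self.epsilon = epsilon
        # params ordering matches the assignment in the script: [gamma, beta]
        self.params = [np.ones(input_dim), np.zeros(input_dim)]

    def fprop(self, inputs):
        # y = gamma * (x - mean) / sqrt(var + eps) + beta, per feature over the batch
        gamma, beta = self.params
        mean = inputs.mean(axis=0)
        var = inputs.var(axis=0)
        x_hat = (inputs - mean) / np.sqrt(var + self.epsilon)
        return gamma * x_hat + beta

    def bprop(self, inputs, outputs, grads_wrt_outputs):
        # Gradient of the loss wrt the layer inputs (outputs argument unused here).
        gamma, beta = self.params
        mean = inputs.mean(axis=0)
        var = inputs.var(axis=0)
        x_hat = (inputs - mean) / np.sqrt(var + self.epsilon)
        dx_hat = grads_wrt_outputs * gamma
        return (dx_hat - dx_hat.mean(axis=0)
                - x_hat * (dx_hat * x_hat).mean(axis=0)) / np.sqrt(var + self.epsilon)

    def grads_wrt_params(self, inputs, grads_wrt_outputs):
        # [grads wrt gamma, grads wrt beta], matching the ordering of self.params
        mean = inputs.mean(axis=0)
        var = inputs.var(axis=0)
        x_hat = (inputs - mean) / np.sqrt(var + self.epsilon)
        return [(grads_wrt_outputs * x_hat).sum(axis=0),
                grads_wrt_outputs.sum(axis=0)]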

View File

@@ -0,0 +1,46 @@
import argparse

import numpy as np

from mlp.layers import ConvolutionalLayer

parser = argparse.ArgumentParser(description='ConvolutionalLayer test file generator')
parser.add_argument('--student_id', nargs="?", type=str,
                    help='Your student id in the format "sxxxxxxx"')
args = parser.parse_args()
student_id = args.student_id


def generate_inputs(student_id):
    # Build a (2, 3, 4, 4) test tensor whose entries depend on the digits of
    # the student id, so every student gets a unique test case.
    student_number = student_id
    # Use a float array so the student-number values below are not truncated to integers.
    tests = np.arange(96, dtype=float).reshape((2, 3, 4, 4))
    tests[:, 0, :, :] = float(student_number[1:3]) / 10 - 5
    tests[:, :, 1, :] = float(student_number[3:5]) / 10 - 5
    tests[:, 2, :, :] = float(student_number[5:7]) / 10 - 5
    tests[0, 1, :, :] = float(student_number[7]) / 10 - 5
    return tests


test_inputs = generate_inputs(student_id)
test_grads_wrt_outputs = np.arange(-20, 16).reshape((2, 2, 3, 3))
kernels = np.arange(-12, 12).reshape((2, 3, 2, 2))
biases = np.arange(2)

# Produce ConvolutionalLayer fprop, bprop and grads_wrt_params outputs.
activation_layer = ConvolutionalLayer(num_input_channels=3, num_output_channels=2,
                                      input_dim_1=4, input_dim_2=4,
                                      kernel_dim_1=2, kernel_dim_2=2)
activation_layer.params = [kernels, biases]
conv_fprop = activation_layer.fprop(test_inputs)
conv_bprop = activation_layer.bprop(
    test_inputs, conv_fprop, test_grads_wrt_outputs)
conv_grads_wrt_params = activation_layer.grads_wrt_params(test_inputs,
                                                          test_grads_wrt_outputs)

test_output = "ConvolutionalLayer:\nFprop: {}\nBprop: {}\n" \
              "Grads_wrt_params: {}\n".format(conv_fprop,
                                              conv_bprop,
                                              conv_grads_wrt_params)
with open("{}_conv_test_file.txt".format(student_id), "w+") as out_file:
    out_file.write(test_output)
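Similarly, below is a minimal sketch of the interface and shapes this script assumes of ConvolutionalLayer. The method bodies are left unimplemented because writing them is part of the coursework, and the actual mlp.layers skeleton may differ. Note that with 4x4 inputs, 2x2 kernels, unit stride and no padding, the output feature maps are 3x3, which is why test_grads_wrt_outputs has shape (2, 2, 3, 3).

# Sketch only (not the mlp.layers skeleton): the interface and shapes exercised above.
import numpy as np


class ConvolutionalLayerSketch(object):

    def __init__(self, num_input_channels, num_output_channels,
                 input_dim_1, input_dim_2, kernel_dim_1, kernel_dim_2):
        self.num_input_channels = num_input_channels
        self.num_output_channels = num_output_channels
        # With no padding and unit stride, output spatial dims shrink by kernel_dim - 1.
        self.output_dim_1 = input_dim_1 - kernel_dim_1 + 1  # 4 - 2 + 1 = 3 above
        self.output_dim_2 = input_dim_2 - kernel_dim_2 + 1
        # params = [kernels, biases]; the script assigns kernels of shape
        # (num_output_channels, num_input_channels, kernel_dim_1, kernel_dim_2)
        # and biases of shape (num_output_channels,).
        self.params = [np.zeros((num_output_channels, num_input_channels,
                                 kernel_dim_1, kernel_dim_2)),
                       np.zeros(num_output_channels)]

    def fprop(self, inputs):
        """(batch, in_channels, input_dim_1, input_dim_2) ->
        (batch, out_channels, output_dim_1, output_dim_2)."""
        raise NotImplementedError  # implementing this is part of the coursework

    def bprop(self, inputs, outputs, grads_wrt_outputs):
        """Returns grads wrt inputs, with the same shape as inputs."""
        raise NotImplementedError

    def grads_wrt_params(self, inputs, grads_wrt_outputs):
        """Returns [grads_wrt_kernels, grads_wrt_biases], matching self.params."""
        raise NotImplementedError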

Binary file not shown.

View File

@@ -138,32 +138,32 @@ code necessary for the coursework in it.
This branch includes the following additions to your setup:
\begin{itemize}
\itemsep1pt\parskip0pt\parsep0pt
\item
A notebook \verb+BatchNormalizationLayer_tests+ which includes
test functions to check the implementations of the BatchNorm layer
\texttt{fprop}, \texttt{bprop} and \texttt{grads\_wrt\_params}
methods. The BatchNormalizationLayer skeleton code can be found in mlp.layers.
The tests use the mlp.layers implementation so be sure to reload your notebook
when you update your mlp.layers code.
\item
A notebook \verb+Convolutional_layer_tests+ which includes
test functions to check the implementations of the Convolutional layer
\texttt{fprop}, \texttt{bprop} and \texttt{grads\_wrt\_params}
methods. The ConvolutionalLayer skeleton code can be found in mlp.layers.
The tests use the mlp.layers implementation so be sure to reload your notebook
when you update your mlp.layers code.
\item
A new \texttt{ReshapeLayer} class in the \verb+mlp.layers+ module.
When included in a multiple layer model, this allows the output of
the previous layer to be reshaped before being forward propagated to
the next layer (a short usage sketch follows this list).
\item
A new \texttt{EMNISTDataProvider} class in the \verb+mlp.data_providers+ module.
This class is a small change to the \texttt{MNISTDataProvider} class, linking to the Balanced EMNIST data, and setting the number of classes to 47.
\item
Training, validation, and test sets for the \texttt{EMNIST Balanced} dataset that
you will use in this coursework.
\end{itemize}
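For illustration, a \texttt{ReshapeLayer} might be combined with the \texttt{EMNISTDataProvider} and a convolutional layer roughly as follows. This is a minimal sketch only: the constructor signatures shown are assumptions, so check the skeleton code in \verb+mlp.layers+ and \verb+mlp.data_providers+ for the actual interfaces.
\begin{verbatim}
from mlp.data_providers import EMNISTDataProvider
from mlp.layers import ReshapeLayer, ConvolutionalLayer
from mlp.models import MultipleLayerModel

train_data = EMNISTDataProvider('train', batch_size=100)  # flat 28*28 = 784 inputs

model = MultipleLayerModel([
    # reshape (batch, 784) -> (batch, 1, 28, 28) before convolving
    ReshapeLayer(output_shape=(1, 28, 28)),
    ConvolutionalLayer(num_input_channels=1, num_output_channels=5,
                       input_dim_1=28, input_dim_2=28,
                       kernel_dim_1=5, kernel_dim_2=5),
])
\end{verbatim}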
@@ -186,9 +186,9 @@ In part A of the coursework you will focus on using deep neural networks on EMNI
\item Perform baseline experiments using DNNs trained on EMNIST. Obviously there are a lot of things that could be explored, including hidden unit activation functions, network architectures, training hyperparameters, and the use of regularisation and dropout. You cannot explore everything, and it is best to carefully investigate a few things in depth.
\item Implement the RMSProp \citep{tieleman2012rmsprop} and Adam \citep{kingma2015adam} learning rules, by defining new classes inheriting from \texttt{GradientDescentLearningRule} in the \texttt{mlp/learning\_rules.py} module. The \texttt{MomentumLearningRule} class is an example of how to define a learning rule which uses an additional state variable to calculate the updates to the parameters (a sketch of one possible structure follows this list).
\item Perform experiments to compare stochastic gradient descent, RMSProp, and Adam for deep neural network training on EMNIST, building on your earlier baseline experiments.
\item Implement batch normalisation \citep{ioffe2015batch} as a class \verb+BatchNormalizationLayer+. You need to implement \texttt{fprop}, \texttt{bprop} and \texttt{grads\_wrt\_params} methods for this class.
\item Verify the correctness of your implementation using the supplied unit tests in\\\verb+BatchNormalizationLayer_tests.ipynb+.
\item Automatically create a test file \verb+sXXXXXXX_batchnorm_test_file.txt+ by running the provided program \verb+generate_batchnorm_test.py+, which uses your \verb+BatchNormalizationLayer+ class methods on a unique test vector generated using your student ID number.
\item Perform experiments on EMNIST to investigate the impact of using batch normalisation in deep neural networks, building on your earlier experiments.
\end{enumerate}
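To get you started on the learning rules, the sketch below shows one way an RMSProp rule could be structured. It assumes the \texttt{initialise}/\texttt{reset}/\texttt{update\_params} interface used by \texttt{MomentumLearningRule} and the base-class constructor taking a learning rate; treat it as a rough outline rather than a reference implementation.
\begin{verbatim}
import numpy as np
from mlp.learning_rules import GradientDescentLearningRule

class RMSPropLearningRule(GradientDescentLearningRule):
    """Scale each update by a decaying root-mean-square of past gradients."""

    def __init__(self, learning_rate=1e-3, beta=0.9, epsilon=1e-8):
        super(RMSPropLearningRule, self).__init__(learning_rate)
        self.beta = beta
        self.epsilon = epsilon

    def initialise(self, params):
        super(RMSPropLearningRule, self).initialise(params)
        # one accumulator of squared gradients per parameter array
        self.sq_grads = [np.zeros_like(param) for param in self.params]

    def reset(self):
        for sq_grad in self.sq_grads:
            sq_grad *= 0.

    def update_params(self, grads_wrt_params):
        for param, grad, sq_grad in zip(
                self.params, grads_wrt_params, self.sq_grads):
            sq_grad *= self.beta
            sq_grad += (1. - self.beta) * grad ** 2
            param -= self.learning_rate * grad / (np.sqrt(sq_grad) + self.epsilon)
\end{verbatim}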
In the above experiments you should use the validation set to assess accuracy. Use the test set at the end to assess the accuracy of the deep neural network architecture and training setup that you judge to be the best.
@@ -199,7 +199,7 @@ In the above experiments you should use the validation set to assess accuracy.
In part B of the coursework you should implement convolutional and max-pooling layers, and carry out experiments using convolutional networks with one and two convolutional layers.
\begin{enumerate}
\item Implement a convolutional layer as a class \verb+ConvolutionalLayer+. You need to implement \texttt{fprop}, \texttt{bprop} and \texttt{grads\_wrt\_params} methods for this class.
\item Verify the correctness of your implementation using the supplied unit tests in\\\verb+ConvolutionalLayer_tests.ipynb+.
\item Automatically create a test file \verb+sXXXXXXX_conv_test_file.txt+ by running the provided program \verb+generate_conv_test.py+, which uses your \verb+ConvolutionalLayer+ class methods on a unique test vector generated using your student ID number.
\item Implement a max-pooling layer. Non-overlapping pooling (which was assumed in the lecture presentation) is required. You may also implement a more generic solution with striding.
\item Construct and train networks containing one and two convolutional layers, and max-pooling layers, using the Balanced EMNIST data, reporting your experimental results. As a default, use convolutional kernels of dimension 5x5 (stride 1) and pooling regions of 2x2 (stride 2, hence non-overlapping). For the default network with two convolutional layers, investigate two convolutional+maxpooling layers with 5 feature maps in the first convolutional layer and 10 feature maps in the second convolutional layer.