
Commit

vgg training
al-ponomar committed Dec 10, 2016
1 parent e17027a commit 3e65439
Showing 5 changed files with 284 additions and 60 deletions.
1 change: 1 addition & 0 deletions .gitignore
@@ -1 +1,2 @@
/logs/*
/pretrained_params/*
88 changes: 44 additions & 44 deletions convnet.py
@@ -2,7 +2,7 @@
from __future__ import division
from __future__ import print_function

import tensorflow as tf
import numpy as np
from tensorflow.contrib.layers import regularizers

@@ -23,7 +23,7 @@ def __init__(self, n_classes = 10):
This number is required in order to specify the
output dimensions of the ConvNet
"""
self.n_classes = n_classes

def inference(self, x):
"""
@@ -46,49 +46,49 @@ def inference(self, x):
x: 4D float Tensor of size [batch_size, input_height, input_width, input_channels]
Returns:
logits: 2D float Tensor of size [batch_size, self.n_classes]. Returns
the logits outputs (before softmax transformation) of the
network. These logits can then be used with loss and accuracy
to evaluate the model.
"""
x_inp = tf.reshape(x, [-1, 32, 32, 3])
with tf.variable_scope('ConvNet'):

def _forward_conv_layer(name, w_shape, b_shape, x_inp, max_pool_kernel, max_pool_stride, act_func):
with tf.variable_scope(name):
W = tf.get_variable('W', w_shape, initializer=tf.random_normal_initializer(mean = 0.0, stddev=1e-3, dtype=tf.float32))
b = tf.get_variable('b', b_shape, initializer=tf.constant_initializer(0))
conv_out = act_func(tf.nn.conv2d(x_inp, W, strides=[1, 1, 1, 1], padding='SAME') + b)
out = tf.nn.max_pool(conv_out, ksize=[1, max_pool_kernel, max_pool_kernel, 1], strides=[1, max_pool_stride, max_pool_stride, 1], padding='SAME')
tf.histogram_summary(name + '_weights', W)
tf.histogram_summary(name + '_b', b)
tf.histogram_summary(name + '_out', conv_out)
tf.histogram_summary(name + '_maxpool', out)
return out

def _forward_fc_layer(name, w_shape, b_shape, x_inp, regularizer_strength, act_func):
with tf.variable_scope(name):
W = tf.get_variable('W', w_shape, initializer=tf.random_normal_initializer(mean = 0.0, stddev=1e-3, dtype=tf.float32), regularizer = regularizers.l2_regularizer(regularizer_strength))
b = tf.get_variable('b', b_shape, initializer=tf.constant_initializer(0))
out = act_func(tf.matmul(x_inp, W) + b)
tf.histogram_summary(name + '_weights', W)
tf.histogram_summary(name + '_b', b)
tf.histogram_summary(name + '_out', out)
return out

conv1 = _forward_conv_layer(name='conv1', w_shape=[5, 5, 3, 64], b_shape=64,
x_inp=x_inp, max_pool_kernel=3, max_pool_stride=2, act_func=tf.nn.relu)
conv2 = _forward_conv_layer(name='conv2', w_shape=[5, 5, 64, 64], b_shape=64,
x_inp=conv1, max_pool_kernel=3, max_pool_stride=2, act_func=tf.nn.relu)

self.flatten = tf.reshape(conv2, [-1, 8 * 8 * 64])
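# note: two stride-2 max pools reduce the 32x32 input to 16x16 and then 8x8 with 64 channels, hence the 8 * 8 * 64 flatten size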

self.fc1 = _forward_fc_layer(name='fc1', w_shape=[8 * 8 * 64, 384], b_shape=384,
x_inp=self.flatten, regularizer_strength=0.001, act_func=tf.nn.relu)
self.fc2 = _forward_fc_layer(name='fc2', w_shape=[384, 192], b_shape=192,
x_inp=self.fc1, regularizer_strength=0.001, act_func=tf.nn.relu)
logits = _forward_fc_layer(name='logits', w_shape=[192, 10], b_shape=10,
x_inp=self.fc2, regularizer_strength=0.001, act_func=lambda x: x)


return logits
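For reference, a minimal usage sketch of the graph defined above — illustrative only, not part of this commit. It assumes CIFAR-10-shaped 32x32x3 inputs, that the class is importable from convnet.py, and the pre-1.0 TensorFlow API this file targets (tf.initialize_all_variables, tf.histogram_summary):

import numpy as np
import tensorflow as tf
from convnet import ConvNet  # assumed import path

model = ConvNet(n_classes=10)
x = tf.placeholder(tf.float32, shape=[None, 32, 32, 3], name='x')
logits = model.inference(x)    # [batch_size, 10] pre-softmax scores
probs = tf.nn.softmax(logits)  # class probabilities

with tf.Session() as sess:
    sess.run(tf.initialize_all_variables())
    batch = np.random.rand(4, 32, 32, 3).astype(np.float32)  # dummy batch
    print(sess.run(probs, feed_dict={x: batch}).shape)        # (4, 10)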
@@ -97,13 +97,13 @@ def accuracy(self, logits, labels):
"""
Calculate the prediction accuracy, i.e. the average correct predictions
of the network.
As in self.loss above, you can use tf.scalar_summary to save
scalar summaries of accuracy for later use with TensorBoard.
Args:
logits: 2D float Tensor of size [batch_size, self.n_classes].
The predictions returned through self.inference.
labels: 2D int Tensor of size [batch_size, self.n_classes]
with one-hot encoding. Ground truth labels for
each observation in batch.
@@ -114,9 +114,9 @@ def accuracy(self, logits, labels):
########################
# PUT YOUR CODE HERE #
########################
correct_prediction = tf.equal(tf.argmax(labels, 1), tf.argmax(logits, 1))
accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))
tf.scalar_summary('accuracy', accuracy)
# raise NotImplementedError
########################
# END OF YOUR CODE #
@@ -130,15 +130,15 @@ def loss(self, logits, labels):
the ground truth labels. The function will also add the regularization
loss from network weights to the total loss that is returned.
In order to implement this function you should have a look at
tf.nn.softmax_cross_entropy_with_logits.
You can use tf.scalar_summary to save scalar summaries of
cross-entropy loss, regularization loss, and full loss (both summed)
for use with TensorBoard. This will be useful for compiling your report.
Args:
logits: 2D float Tensor of size [batch_size, self.n_classes].
The predictions returned through self.inference.
labels: 2D int Tensor of size [batch_size, self.n_classes]
with one-hot encoding. Ground truth labels for each
observation in batch.
@@ -148,9 +148,9 @@ def loss(self, logits, labels):
########################
# PUT YOUR CODE HERE #
########################
cross_entropy = tf.nn.softmax_cross_entropy_with_logits(logits, labels, name='crossentropy')
loss = tf.reduce_mean(cross_entropy, name='loss')
tf.scalar_summary('cross-entropy loss', loss)
# loss = cross_entropy
# raise NotImplementedError
########################
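The docstring above says the regularization loss from the network weights should be added to the loss that is returned, but the code shown only averages the cross-entropy. A sketch of how this could be done at the end of loss(), assuming the l2_regularizer terms attached through tf.get_variable are collected in tf.GraphKeys.REGULARIZATION_LOSSES (this is not the author's code):

# Sketch: fold collected L2 regularization terms into the total loss.
reg_losses = tf.get_collection(tf.GraphKeys.REGULARIZATION_LOSSES)
reg_loss = tf.add_n(reg_losses) if reg_losses else tf.constant(0.0)
full_loss = loss + reg_loss  # cross-entropy + L2 regularization
tf.scalar_summary('regularization loss', reg_loss)
tf.scalar_summary('full loss', full_loss)
return full_loss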
143 changes: 143 additions & 0 deletions fc.py
@@ -0,0 +1,143 @@
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import tensorflow as tf
import numpy as np
from tensorflow.contrib.layers import regularizers


class FC(object):
"""
This class implements a fully-connected neural network in TensorFlow.
It incorporates a certain graph model to be trained and to be used
in inference.
"""

def __init__(self, n_classes = 10):
"""
Constructor for an FC object. Default values should be used as hints for
the usage of each parameter.
Args:
n_classes: int, number of classes of the classification problem.
This number is required in order to specify the
output dimensions of the network.
"""
self.n_classes = n_classes

def inference(self, x):
"""
Performs inference given an input tensor. This is the central portion
of the network where we describe the computation graph. Here an input
tensor undergoes a series of linear and nonlinear operations
as defined in this method. For the details of the model, please
see assignment file.
Here we recommend you to consider using variable and name scopes in order
to make your graph more intelligible for later references in TensorBoard
and so on. You can define a name scope for the whole model or for each
operator group (e.g. fc+relu) individually to group them by name.
Variable scopes are essential components in TensorFlow for parameter sharing.
Although the model(s) which are within the scope of this class do not require
parameter sharing it is a good practice to use variable scope to encapsulate
the model.
Args:
x: 4D float Tensor of size [batch_size, input_height, input_width, input_channels]
Returns:
logits: 2D float Tensor of size [batch_size, self.n_classes]. Returns
the logits outputs (before softmax transformation) of the
network. These logits can then be used with loss and accuracy
to evaluate the model.
"""
with tf.variable_scope('FCC'):

def _forward_fc_layer(name, w_shape, b_shape, x_inp, regularizer_strength, act_func):
with tf.variable_scope(name):
W = tf.get_variable('W', w_shape, initializer=tf.random_normal_initializer(mean = 0.0, stddev=1e-3, dtype=tf.float32),regularizer = regularizers.l2_regularizer(regularizer_strength))
b = tf.get_variable('b', b_shape, initializer=tf.constant_initializer(0))
out = act_func(tf.matmul(x_inp, W) + b)
tf.histogram_summary(name + '_weights', W)
tf.histogram_summary(name + '_b', b)
tf.histogram_summary(name + '_out', out)
return out


self.flatten = tf.reshape(x, [-1, 512])

self.fc1 = _forward_fc_layer(name='fc1', w_shape=[512, 384], b_shape=384,
x_inp=self.flatten, regularizer_strength=0.001, act_func=tf.nn.relu)
self.fc2 = _forward_fc_layer(name='fc2', w_shape=[384, 192], b_shape=192,
x_inp=self.fc1, regularizer_strength=0.001, act_func=tf.nn.relu)
logits = _forward_fc_layer(name='logits', w_shape=[192, 10], b_shape=10,
x_inp=self.fc2, regularizer_strength=0.001, act_func=lambda x: x)


return logits
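FC.inference flattens its input to 512 features per example, so the class appears meant to run on top of pre-extracted features rather than raw images — plausibly activations from the pretrained VGG weights hinted at by the commit title and the /pretrained_params/ ignore entry, though that is an assumption and not stated in the diff. A minimal, hypothetical sketch of building the graph on such features:

features = tf.placeholder(tf.float32, shape=[None, 512], name='features')  # assumed feature input
fc_model = FC(n_classes=10)
logits = fc_model.inference(features)  # [batch_size, 10]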

def accuracy(self, logits, labels):
"""
Calculate the prediction accuracy, i.e. the average correct predictions
of the network.
As in self.loss above, you can use tf.scalar_summary to save
scalar summaries of accuracy for later use with TensorBoard.
Args:
logits: 2D float Tensor of size [batch_size, self.n_classes].
The predictions returned through self.inference.
labels: 2D int Tensor of size [batch_size, self.n_classes]
with one-hot encoding. Ground truth labels for
each observation in batch.
Returns:
accuracy: scalar float Tensor, the accuracy of predictions,
i.e. the average correct predictions over the whole batch.
"""
########################
# PUT YOUR CODE HERE #
########################
correct_prediction = tf.equal(tf.argmax(labels, 1), tf.argmax(logits, 1))
accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))
tf.scalar_summary('accuracy', accuracy)
# raise NotImplementedError
########################
# END OF YOUR CODE #
########################

return accuracy

def loss(self, logits, labels):
"""
Calculates the multiclass cross-entropy loss from the logits predictions and
the ground truth labels. The function will also add the regularization
loss from network weights to the total loss that is returned.
In order to implement this function you should have a look at
tf.nn.softmax_cross_entropy_with_logits.
You can use tf.scalar_summary to save scalar summaries of
cross-entropy loss, regularization loss, and full loss (both summed)
for use with TensorBoard. This will be useful for compiling your report.
Args:
logits: 2D float Tensor of size [batch_size, self.n_classes].
The predictions returned through self.inference.
labels: 2D int Tensor of size [batch_size, self.n_classes]
with one-hot encoding. Ground truth labels for each
observation in batch.
Returns:
loss: scalar float Tensor, full loss = cross_entropy + reg_loss
"""
########################
# PUT YOUR CODE HERE #
########################
cross_entropy = tf.nn.softmax_cross_entropy_with_logits(logits, labels, name='crossentropy')
loss = tf.reduce_mean(cross_entropy, name='loss')
tf.scalar_summary('cross-entropy loss', loss)
# loss = cross_entropy
# raise NotImplementedError
########################
# END OF YOUR CODE #
########################

return loss
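No training code for these models is visible among the files shown here. A minimal, self-contained training-step sketch for the FC model — a hypothetical illustration, not the repository's training script — assuming 512-d input features, one-hot labels, an Adam optimizer, and the pre-1.0 TensorFlow summary API used in this file:

import numpy as np
import tensorflow as tf
from fc import FC  # assumed import path

model = FC(n_classes=10)
features = tf.placeholder(tf.float32, shape=[None, 512], name='features')
labels = tf.placeholder(tf.float32, shape=[None, 10], name='labels')
logits = model.inference(features)
loss = model.loss(logits, labels)
accuracy = model.accuracy(logits, labels)
train_op = tf.train.AdamOptimizer(1e-4).minimize(loss)
merged = tf.merge_all_summaries()  # pre-1.0 counterpart of tf.summary.merge_all

with tf.Session() as sess:
    writer = tf.train.SummaryWriter('logs/fc', sess.graph)  # pre-1.0 summary writer
    sess.run(tf.initialize_all_variables())
    for step in range(100):
        x_batch = np.random.rand(32, 512).astype(np.float32)                   # dummy features
        y_batch = np.eye(10)[np.random.randint(0, 10, 32)].astype(np.float32)  # dummy one-hot labels
        _, summ = sess.run([train_op, merged], feed_dict={features: x_batch, labels: y_batch})
        writer.add_summary(summ, step)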