Ocode
diff --git a/‎code/logistic_cg.py‎
Lines changed: 67 additions & 70 deletions b/‎code/logistic_cg.py‎
Lines changed: 67 additions & 70 deletions
@@ -37,7 +37,13 @@
 __docformat__ = 'restructedtext en'
 
 
-import numpy, time, cPickle, gzip, sys, os
+import cPickle
+import gzip
+import os
+import sys
+import time
+
+import numpy
 
 import theano
 import theano.tensor as T
@@ -52,9 +58,6 @@ class LogisticRegression(object):
     determine a class membership probability.
     """
 
-
-
-
     def __init__(self, input, n_in, n_out):
         """ Initialize the parameters of the logistic regression
 
@@ -75,24 +78,20 @@ def __init__(self, input, n_in, n_out):
         # initialize theta = (W,b) with 0s; W gets the shape (n_in, n_out),
         # while b is a vector of n_out elements, making theta a vector of
         # n_in*n_out + n_out elements
-        self.theta = theano.shared(value=numpy.zeros(n_in*n_out+n_out, dtype=theano.config.floatX),
+        self.theta = theano.shared(value=numpy.zeros(n_in * n_out + n_out,
+                                                   dtype=theano.config.floatX),
                                    name='theta')
         # W is represented by the first n_in*n_out elements of theta
-        self.W     = self.theta[0:n_in*n_out].reshape((n_in,n_out))
+        self.W = self.theta[0:n_in * n_out].reshape((n_in, n_out))
         # b is the rest (last n_out elements)
-        self.b     = self.theta[n_in*n_out:n_in*n_out+n_out]
-
+        self.b = self.theta[n_in * n_out:n_in * n_out + n_out]
 
         # compute vector of class-membership probabilities in symbolic form
-        self.p_y_given_x = T.nnet.softmax(T.dot(input, self.W)+self.b)
+        self.p_y_given_x = T.nnet.softmax(T.dot(input, self.W) + self.b)
 
         # compute prediction as class whose probability is maximal in
         # symbolic form
-        self.y_pred=T.argmax(self.p_y_given_x, axis=1)
-
-
-
-
+        self.y_pred = T.argmax(self.p_y_given_x, axis=1)
 
     def negative_log_likelihood(self, y):
         """Return the negative log-likelihood of the prediction of this model
@@ -108,11 +107,7 @@ def negative_log_likelihood(self, y):
         :param y: corresponds to a vector that gives for each example the
                   correct label
         """
-        return -T.mean(T.log(self.p_y_given_x)[T.arange(y.shape[0]),y])
-
-
-
-
+        return -T.mean(T.log(self.p_y_given_x)[T.arange(y.shape[0]), y])
 
     def errors(self, y):
         """Return a float representing the number of errors in the minibatch
@@ -136,12 +131,7 @@ def errors(self, y):
             raise NotImplementedError()
 
 
-
-
-
-
-
-def cg_optimization_mnist( n_epochs=50, mnist_pkl_gz='../data/mnist.pkl.gz' ):
+def cg_optimization_mnist(n_epochs=50, mnist_pkl_gz='../data/mnist.pkl.gz'):
     """Demonstrate conjugate gradient optimization of a log-linear model
 
     This is demonstrated on MNIST.
@@ -151,7 +141,7 @@ def cg_optimization_mnist( n_epochs=50, mnist_pkl_gz='../data/mnist.pkl.gz' ):
 
     :type mnist_pkl_gz: string
     :param mnist_pkl_gz: the path of the mnist training file from
-                         http://www.iro.umontreal.ca/~lisa/deep/data/mnist/mnist.pkl.gz
+                 http://www.iro.umontreal.ca/~lisa/deep/data/mnist/mnist.pkl.gz
 
     """
     #############
@@ -160,7 +150,7 @@ def cg_optimization_mnist( n_epochs=50, mnist_pkl_gz='../data/mnist.pkl.gz' ):
     print '... loading data'
 
     # Load the dataset
-    f = gzip.open(mnist_pkl_gz,'rb')
+    f = gzip.open(mnist_pkl_gz, 'rb')
     train_set, valid_set, test_set = cPickle.load(f)
     f.close()
 
@@ -174,8 +164,10 @@ def shared_dataset(data_xy):
         variable) would lead to a large decrease in performance.
         """
         data_x, data_y = data_xy
-        shared_x = theano.shared(numpy.asarray(data_x, dtype=theano.config.floatX))
-        shared_y = theano.shared(numpy.asarray(data_y, dtype=theano.config.floatX))
+        shared_x = theano.shared(numpy.asarray(data_x,
+                                               dtype=theano.config.floatX))
+        shared_y = theano.shared(numpy.asarray(data_y,
+                                               dtype=theano.config.floatX))
         # When storing data on the GPU it has to be stored as floats
         # therefore we will store the labels as ``floatX`` as well
         # (``shared_y`` does exactly that). But during our computations
@@ -185,37 +177,33 @@ def shared_dataset(data_xy):
         # lets us get around this issue
         return shared_x, T.cast(shared_y, 'int32')
 
-
-    test_set_x,  test_set_y  = shared_dataset(test_set)
+    test_set_x, test_set_y = shared_dataset(test_set)
     valid_set_x, valid_set_y = shared_dataset(valid_set)
     train_set_x, train_set_y = shared_dataset(train_set)
 
     batch_size = 600    # size of the minibatch
 
     n_train_batches = train_set_x.get_value(borrow=True).shape[0] / batch_size
     n_valid_batches = valid_set_x.get_value(borrow=True).shape[0] / batch_size
-    n_test_batches  = test_set_x.get_value(borrow=True).shape[0]  / batch_size
-
-
-    ishape     = (28,28) # this is the size of MNIST images
-    n_in       = 28*28   # number of input units
-    n_out      = 10      # number of output units
+    n_test_batches = test_set_x.get_value(borrow=True).shape[0] / batch_size
 
+    ishape = (28, 28)  # this is the size of MNIST images
+    n_in = 28 * 28  # number of input units
+    n_out = 10  # number of output units
 
     ######################
     # BUILD ACTUAL MODEL #
     ######################
     print '... building the model'
 
     # allocate symbolic variables for the data
-    minibatch_offset = T.lscalar() # offset to the start of a [mini]batch
+    minibatch_offset = T.lscalar()  # offset to the start of a [mini]batch
     x = T.matrix()   # the data is presented as rasterized images
     y = T.ivector()  # the labels are presented as 1D vector of
                      # [int] labels
 
-
     # construct the logistic regression class
-    classifier = LogisticRegression( input=x, n_in=28*28, n_out=10)
+    classifier = LogisticRegression(input=x, n_in=28 * 28, n_out=10)
 
     # the cost we minimize during training is the negative log likelihood of
     # the model in symbolic format
@@ -225,65 +213,72 @@ def shared_dataset(data_xy):
     # the model on a minibatch
     test_model = theano.function([minibatch_offset], classifier.errors(y),
             givens={
-                x:test_set_x[minibatch_offset:minibatch_offset+batch_size],
-                y:test_set_y[minibatch_offset:minibatch_offset+batch_size]},
+                x: test_set_x[minibatch_offset:minibatch_offset + batch_size],
+                y: test_set_y[minibatch_offset:minibatch_offset + batch_size]},
             name="test")
 
-    validate_model = theano.function([minibatch_offset],classifier.errors(y),
+    validate_model = theano.function([minibatch_offset], classifier.errors(y),
             givens={
-                x:valid_set_x[minibatch_offset:minibatch_offset+batch_size],
-                y:valid_set_y[minibatch_offset:minibatch_offset+batch_size]},
+                x: valid_set_x[minibatch_offset:
+                               minibatch_offset + batch_size],
+                y: valid_set_y[minibatch_offset:
+                               minibatch_offset + batch_size]},
             name="validate")
 
     # compile a theano function that returns the cost of a minibatch
     batch_cost = theano.function([minibatch_offset], cost,
-            givens= {
-                x : train_set_x[minibatch_offset:minibatch_offset+batch_size],
-                y : train_set_y[minibatch_offset:minibatch_offset+batch_size]},
+            givens={
+                x: train_set_x[minibatch_offset:
+                               minibatch_offset + batch_size],
+                y: train_set_y[minibatch_offset:
+                               minibatch_offset + batch_size]},
             name="batch_cost")
 
-
     # compile a theano function that returns the gradient of the minibatch
     # with respect to theta
-    batch_grad = theano.function([minibatch_offset], T.grad(cost,classifier.theta),
-            givens= {
-                x : train_set_x[minibatch_offset:minibatch_offset+batch_size],
-                y : train_set_y[minibatch_offset:minibatch_offset+batch_size]},
+    batch_grad = theano.function([minibatch_offset],
+                                 T.grad(cost, classifier.theta),
+                                 givens={
+                                     x: train_set_x[minibatch_offset:
+                                            minibatch_offset + batch_size],
+                                     y: train_set_y[minibatch_offset:
+                                            minibatch_offset + batch_size]},
             name="batch_grad")
 
-
     # creates a function that computes the average cost on the training set
     def train_fn(theta_value):
         classifier.theta.set_value(theta_value, borrow=True)
-        train_losses = [batch_cost(i*batch_size) for i in xrange(n_train_batches)]
+        train_losses = [batch_cost(i * batch_size)
+                        for i in xrange(n_train_batches)]
         return numpy.mean(train_losses)
 
     # creates a function that computes the average gradient of cost with
     # respect to theta
     def train_fn_grad(theta_value):
         classifier.theta.set_value(theta_value, borrow=True)
         grad = batch_grad(0)
-        for i in xrange(1,n_train_batches):
-            grad += batch_grad(i*batch_size)
-        return grad/n_train_batches
-
+        for i in xrange(1, n_train_batches):
+            grad += batch_grad(i * batch_size)
+        return grad / n_train_batches
 
     validation_scores = [numpy.inf, 0]
 
     # creates the validation function
     def callback(theta_value):
         classifier.theta.set_value(theta_value, borrow=True)
         #compute the validation loss
-        validation_losses = [validate_model(i*batch_size) for i in xrange(n_valid_batches)]
+        validation_losses = [validate_model(i * batch_size)
+                             for i in xrange(n_valid_batches)]
         this_validation_loss = numpy.mean(validation_losses)
-        print('validation error %f %%' % (this_validation_loss*100.,))
+        print('validation error %f %%' % (this_validation_loss * 100.,))
 
         # check if it is better than the best validation score so far
         if this_validation_loss < validation_scores[0]:
             # if so, replace the old one, and compute the score on the
             # testing dataset
             validation_scores[0] = this_validation_loss
-            test_losses = [test_model(i*batch_size) for i in xrange(n_test_batches)]
+            test_losses = [test_model(i * batch_size)
+                           for i in xrange(n_test_batches)]
             validation_scores[1] = numpy.mean(test_losses)
 
     ###############
@@ -295,18 +290,20 @@ def callback(theta_value):
     print ("Optimizing using scipy.optimize.fmin_cg...")
     start_time = time.clock()
     best_w_b = scipy.optimize.fmin_cg(
-               f        = train_fn,
-               x0       = numpy.zeros((n_in+1)*n_out, dtype=x.dtype),
-               fprime   = train_fn_grad,
-               callback = callback,
-               disp     = 0,
-               maxiter  = n_epochs)
+               f=train_fn,
+               x0=numpy.zeros((n_in + 1) * n_out, dtype=x.dtype),
+               fprime=train_fn_grad,
+               callback=callback,
+               disp=0,
+               maxiter=n_epochs)
     end_time = time.clock()
     print(('Optimization complete with best validation score of %f %%, with '
           'test performance %f %%') %
-               (validation_scores[0]*100., validation_scores[1]*100.))
+               (validation_scores[0] * 100., validation_scores[1] * 100.))
 
-    print >> sys.stderr, ('The code for file '+os.path.split(__file__)[1]+' ran for %.1fs' % ((end_time-start_time)))
+    print >> sys.stderr, ('The code for file ' +
+                          os.path.split(__file__)[1] +
+                          ' ran for %.1fs' % ((end_time - start_time)))
 
 
 if __name__ == '__main__':