
Commit 7d867f0

Used start-snippet-# and end-snippet-# markers for precise inclusion of code in the ReStructuredText files. Many cosmetic changes to reduce PEP 8 warnings.
1 parent e3f9cd2 commit 7d867f0
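
Note: the snippet markers added below are presumably consumed from the tutorial's ReStructuredText sources. A minimal sketch of how such a marked snippet could be pulled into an .rst page, assuming the docs use Sphinx's literalinclude directive (the relative path and snippet number here are illustrative, not taken from this commit):

    .. literalinclude:: ../code/DBN.py
       :language: python
       :start-after: start-snippet-1
       :end-before: end-snippet-1

With :start-after: and :end-before:, only the lines between the two marker comments are rendered, so the documentation stays in sync with the code without hard-coding line numbers.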

File tree

20 files changed: +564, -301 lines


code/DBN.py

Lines changed: 76 additions & 39 deletions
@@ -17,6 +17,7 @@
 from rbm import RBM


+# start-snippet-1
 class DBN(object):
     """Deep Belief Network

@@ -65,7 +66,7 @@ def __init__(self, numpy_rng, theano_rng=None, n_ins=784,
         self.x = T.matrix('x')  # the data is presented as rasterized images
         self.y = T.ivector('y')  # the labels are presented as 1D vector
                                  # of [int] labels
-
+        # end-snippet-1
         # The DBN is an MLP, for which all weights of intermediate
         # layers are shared with a different RBM. We will first
         # construct the DBN as a deep multilayer perceptron, and when
@@ -174,12 +175,14 @@ def pretraining_functions(self, train_set_x, batch_size, k):
                                                  persistent=None, k=k)

             # compile the theano function
-            fn = theano.function(inputs=[index,
-                            theano.Param(learning_rate, default=0.1)],
-                                 outputs=cost,
-                                 updates=updates,
-                                 givens={self.x:
-                                    train_set_x[batch_begin:batch_end]})
+            fn = theano.function(
+                inputs=[index, theano.Param(learning_rate, default=0.1)],
+                outputs=cost,
+                updates=updates,
+                givens={
+                    self.x: train_set_x[batch_begin:batch_end]
+                }
+            )
             # append `fn` to the list of functions
             pretrain_fns.append(fn)

@@ -224,25 +227,45 @@ def build_finetune_functions(self, datasets, batch_size, learning_rate):
         for param, gparam in zip(self.params, gparams):
             updates.append((param, param - gparam * learning_rate))

-        train_fn = theano.function(inputs=[index],
-              outputs=self.finetune_cost,
-              updates=updates,
-              givens={self.x: train_set_x[index * batch_size:
-                                          (index + 1) * batch_size],
-                      self.y: train_set_y[index * batch_size:
-                                          (index + 1) * batch_size]})
-
-        test_score_i = theano.function([index], self.errors,
-                 givens={self.x: test_set_x[index * batch_size:
-                                            (index + 1) * batch_size],
-                         self.y: test_set_y[index * batch_size:
-                                            (index + 1) * batch_size]})
-
-        valid_score_i = theano.function([index], self.errors,
-              givens={self.x: valid_set_x[index * batch_size:
-                                          (index + 1) * batch_size],
-                      self.y: valid_set_y[index * batch_size:
-                                          (index + 1) * batch_size]})
+        train_fn = theano.function(
+            inputs=[index],
+            outputs=self.finetune_cost,
+            updates=updates,
+            givens={
+                self.x: train_set_x[
+                    index * batch_size: (index + 1) * batch_size
+                ],
+                self.y: train_set_y[
+                    index * batch_size: (index + 1) * batch_size
+                ]
+            }
+        )
+
+        test_score_i = theano.function(
+            [index],
+            self.errors,
+            givens={
+                self.x: test_set_x[
+                    index * batch_size: (index + 1) * batch_size
+                ],
+                self.y: test_set_y[
+                    index * batch_size: (index + 1) * batch_size
+                ]
+            }
+        )
+
+        valid_score_i = theano.function(
+            [index],
+            self.errors,
+            givens={
+                self.x: valid_set_x[
+                    index * batch_size: (index + 1) * batch_size
+                ],
+                self.y: valid_set_y[
+                    index * batch_size: (index + 1) * batch_size
+                ]
+            }
+        )

         # Create a function that scans the entire validation set
         def valid_score():
@@ -296,6 +319,7 @@ def test_DBN(finetune_lr=0.1, pretraining_epochs=100,
               hidden_layers_sizes=[1000, 1000, 1000],
               n_outs=10)

+    # start-snippet-2
     #########################
     # PRETRAINING THE MODEL #
     #########################
@@ -319,21 +343,23 @@ def test_DBN(finetune_lr=0.1, pretraining_epochs=100,
             print numpy.mean(c)

     end_time = time.clock()
+    # end-snippet-2
     print >> sys.stderr, ('The pretraining code for file ' +
                           os.path.split(__file__)[1] +
                           ' ran for %.2fm' % ((end_time - start_time) / 60.))
-
     ########################
     # FINETUNING THE MODEL #
     ########################

     # get the training, validation and testing function for the model
     print '... getting the finetuning functions'
     train_fn, validate_model, test_model = dbn.build_finetune_functions(
-        datasets=datasets, batch_size=batch_size,
-        learning_rate=finetune_lr)
+        datasets=datasets,
+        batch_size=batch_size,
+        learning_rate=finetune_lr
+    )

-    print '... finetunning the model'
+    print '... finetuning the model'
     # early-stopping parameters
     patience = 4 * n_train_batches  # look as this many examples regardless
     patience_increase = 2.    # wait this much longer when a new best is
@@ -342,7 +368,7 @@ def test_DBN(finetune_lr=0.1, pretraining_epochs=100,
                                    # considered significant
     validation_frequency = min(n_train_batches, patience / 2)
                                   # go through this many
-                                  # minibatche before checking the network
+                                  # minibatches before checking the network
                                   # on the validation set; in this case we
                                   # check every epoch

@@ -365,16 +391,24 @@ def test_DBN(finetune_lr=0.1, pretraining_epochs=100,

                 validation_losses = validate_model()
                 this_validation_loss = numpy.mean(validation_losses)
-                print('epoch %i, minibatch %i/%i, validation error %f %%' % \
-                      (epoch, minibatch_index + 1, n_train_batches,
-                       this_validation_loss * 100.))
+                print(
+                    'epoch %i, minibatch %i/%i, validation error %f %%'
+                    % (
+                        epoch,
+                        minibatch_index + 1,
+                        n_train_batches,
+                        this_validation_loss * 100.
+                    )
+                )

                 # if we got the best validation score until now
                 if this_validation_loss < best_validation_loss:

                     #improve patience if loss improvement is good enough
-                    if (this_validation_loss < best_validation_loss *
-                        improvement_threshold):
+                    if (
+                        this_validation_loss < best_validation_loss *
+                        improvement_threshold
+                    ):
                         patience = max(patience, iter * patience_increase)

                         # save best validation score and iteration number
@@ -394,9 +428,12 @@ def test_DBN(finetune_lr=0.1, pretraining_epochs=100,
                     break

     end_time = time.clock()
-    print(('Optimization complete with best validation score of %f %%,'
-           'with test performance %f %%') %
-          (best_validation_loss * 100., test_score * 100.))
+    print(
+        (
+            'Optimization complete with best validation score of %f %%,'
+            'with test performance %f %%'
+        ) % (best_validation_loss * 100., test_score * 100.)
+    )
     print >> sys.stderr, ('The fine tuning code for file ' +
                           os.path.split(__file__)[1] +
                           ' ran for %.2fm' % ((end_time - start_time)

code/SdA.py

Lines changed: 44 additions & 25 deletions
@@ -46,6 +46,7 @@
 from dA import dA


+# start-snippet-1
 class SdA(object):
     """Stacked denoising auto-encoder class (SdA)

@@ -104,6 +105,7 @@ def __init__(
         self.x = T.matrix('x')  # the data is presented as rasterized images
         self.y = T.ivector('y')  # the labels are presented as 1D vector of
                                  # [int] labels
+        # end-snippet-1

         # The SdA is an MLP, for which all weights of intermediate layers
         # are shared with a different denoising autoencoders
@@ -115,6 +117,7 @@ def __init__(
         # During finetunining we will finish training the SdA by doing
         # stochastich gradient descent on the MLP

+        # start-snippet-2
         for i in xrange(self.n_layers):
             # construct the sigmoidal layer

@@ -157,11 +160,13 @@ def __init__(
                           W=sigmoid_layer.W,
                           bhid=sigmoid_layer.b)
             self.dA_layers.append(dA_layer)
-
+        # end-snippet-2
         # We now need to add a logistic layer on top of the MLP
         self.logLayer = LogisticRegression(
-            input=self.sigmoid_layers[-1].output,
-            n_in=hidden_layers_sizes[-1], n_out=n_outs)
+            input=self.sigmoid_layers[-1].output,
+            n_in=hidden_layers_sizes[-1],
+            n_out=n_outs
+        )

         self.params.extend(self.logLayer.params)
         # construct a function that implements one step of finetunining
@@ -210,13 +215,18 @@ def pretraining_functions(self, train_set_x, batch_size):
             cost, updates = dA.get_cost_updates(corruption_level,
                                                 learning_rate)
             # compile the theano function
-            fn = theano.function(inputs=[index,
-                              theano.Param(corruption_level, default=0.2),
-                              theano.Param(learning_rate, default=0.1)],
-                                 outputs=cost,
-                                 updates=updates,
-                                 givens={self.x: train_set_x[batch_begin:
-                                                             batch_end]})
+            fn = theano.function(
+                inputs=[
+                    index,
+                    theano.Param(corruption_level, default=0.2),
+                    theano.Param(learning_rate, default=0.1)
+                ],
+                outputs=cost,
+                updates=updates,
+                givens={
+                    self.x: train_set_x[batch_begin: batch_end]
+                }
+            )
             # append `fn` to the list of functions
             pretrain_fns.append(fn)

@@ -282,12 +292,12 @@ def build_finetune_functions(self, datasets, batch_size, learning_rate):
             [index],
             self.errors,
             givens={
-                  self.x: test_set_x[
-                      index * batch_size: (index + 1) * batch_size
-                  ],
-                  self.y: test_set_y[
-                      index * batch_size: (index + 1) * batch_size
-                  ]
+                self.x: test_set_x[
+                    index * batch_size: (index + 1) * batch_size
+                ],
+                self.y: test_set_y[
+                    index * batch_size: (index + 1) * batch_size
+                ]
             },
             name='test'
         )
@@ -354,6 +364,7 @@ def test_SdA(finetune_lr=0.1, pretraining_epochs=15,
     n_train_batches /= batch_size

     # numpy random generator
+    # start-snippet-3
     numpy_rng = numpy.random.RandomState(89677)
     print '... building the model'
     # construct the stacked denoising autoencoder class
@@ -363,7 +374,7 @@ def test_SdA(finetune_lr=0.1, pretraining_epochs=15,
         hidden_layers_sizes=[1000, 1000, 1000],
         n_outs=10
     )
-
+    # end-snippet-3 start-snippet-4
     #########################
     # PRETRAINING THE MODEL #
     #########################
@@ -392,16 +403,18 @@ def test_SdA(finetune_lr=0.1, pretraining_epochs=15,
     print >> sys.stderr, ('The pretraining code for file ' +
                           os.path.split(__file__)[1] +
                           ' ran for %.2fm' % ((end_time - start_time) / 60.))
-
+    # end-snippet-4
     ########################
     # FINETUNING THE MODEL #
     ########################

     # get the training, validation and testing function for the model
     print '... getting the finetuning functions'
     train_fn, validate_model, test_model = sda.build_finetune_functions(
-        datasets=datasets, batch_size=batch_size,
-        learning_rate=finetune_lr)
+        datasets=datasets,
+        batch_size=batch_size,
+        learning_rate=finetune_lr
+    )

     print '... finetunning the model'
     # early-stopping parameters
@@ -441,8 +454,10 @@ def test_SdA(finetune_lr=0.1, pretraining_epochs=15,
                 if this_validation_loss < best_validation_loss:

                     #improve patience if loss improvement is good enough
-                    if (this_validation_loss < best_validation_loss *
-                        improvement_threshold):
+                    if (
+                        this_validation_loss < best_validation_loss *
+                        improvement_threshold
+                    ):
                         patience = max(patience, iter * patience_increase)

                         # save best validation score and iteration number
@@ -462,9 +477,13 @@ def test_SdA(finetune_lr=0.1, pretraining_epochs=15,
                     break

     end_time = time.clock()
-    print(('Optimization complete with best validation score of %f %%,'
-           'with test performance %f %%') %
-          (best_validation_loss * 100., test_score * 100.))
+    print(
+        (
+            'Optimization complete with best validation score of %f %%,'
+            'with test performance %f %%'
+        )
+        % (best_validation_loss * 100., test_score * 100.)
+    )
     print >> sys.stderr, ('The training code for file ' +
                           os.path.split(__file__)[1] +
                           ' ran for %.2fm' % ((end_time - start_time) / 60.))

code/cA.py

Lines changed: 17 additions & 10 deletions
@@ -131,11 +131,14 @@ def __init__(self, numpy_rng, input=None, n_visible=784, n_hidden=100,
             # 4*sqrt(6./(n_hidden+n_visible))the output of uniform if
             # converted using asarray to dtype
             # theano.config.floatX so that the code is runable on GPU
-            initial_W = numpy.asarray(numpy_rng.uniform(
-                      low=-4 * numpy.sqrt(6. / (n_hidden + n_visible)),
-                      high=4 * numpy.sqrt(6. / (n_hidden + n_visible)),
-                      size=(n_visible, n_hidden)),
-                      dtype=theano.config.floatX)
+            initial_W = numpy.asarray(
+                numpy_rng.uniform(
+                    low=-4 * numpy.sqrt(6. / (n_hidden + n_visible)),
+                    high=4 * numpy.sqrt(6. / (n_hidden + n_visible)),
+                    size=(n_visible, n_hidden)
+                ),
+                dtype=theano.config.floatX
+            )
             W = theano.shared(value=initial_W, name='W', borrow=True)

         if not bvis:
@@ -186,7 +189,7 @@ def get_reconstructed_input(self, hidden):
         hidden layer

         """
-        return  T.nnet.sigmoid(T.dot(hidden, self.W_prime) + self.b_prime)
+        return T.nnet.sigmoid(T.dot(hidden, self.W_prime) + self.b_prime)

     def get_cost_updates(self, contraction_level, learning_rate):
         """ This function computes the cost and the updates for one trainng
@@ -265,10 +268,14 @@ def test_cA(learning_rate=0.01, training_epochs=20,
     cost, updates = ca.get_cost_updates(contraction_level=contraction_level,
                                         learning_rate=learning_rate)

-    train_ca = theano.function([index], [T.mean(ca.L_rec), ca.L_jacob],
-                               updates=updates,
-                               givens={x: train_set_x[index * batch_size:
-                                                      (index + 1) * batch_size]})
+    train_ca = theano.function(
+        [index],
+        [T.mean(ca.L_rec), ca.L_jacob],
+        updates=updates,
+        givens={
+            x: train_set_x[index * batch_size: (index + 1) * batch_size]
+        }
+    )

     start_time = time.clock()