@@ -121,11 +121,9 @@ def negative_log_likelihood(self, y):
121121 # LP[n-1,y[n-1]]] and T.mean(LP[T.arange(y.shape[0]),y]) is
122122 # the mean (across minibatch examples) of the elements in v,
123123 # i.e., the mean log-likelihood across the minibatch.
124- return - T .mean (T .log (self .p_y_given_x )[T .arange (y .shape [0 ]), y ])
125124
126- def predict (self ):
127- return T .mul (self .y_pred ,1 )
128-
125+ return - T .mean (T .log (self .p_y_given_x )[T .arange (y .shape [0 ]), y ]) + 0.0001 * T .sum (self .W ** 2 )
126+
129127 def errors (self , y ):
130128 """Return a float representing the number of errors in the minibatch
131129 over the total number of examples of the minibatch ; zero one
@@ -194,7 +192,7 @@ def load_data(dataset):
194192 test_set_size = 1000 ;
195193 predict_set_size = 28000 ;
196194
197- debug = "false " ;
195+ debug = "true " ;
198196 if debug == "true" :
199197 train_set_size = 3600 ;
200198 valid_set_size = 500 ;
@@ -285,7 +283,7 @@ def shared_dataset(data_xy, borrow=True):
285283
286284def sgd_optimization_mnist (learning_rate = 0.13 , n_epochs = 1000 ,
287285 dataset = '../data/mnist.pkl.gz' ,
288- batch_size = 600 ):
286+ batch_size = 500 ):
289287 """
290288 Demonstrate stochastic gradient descent optimization of a log-linear
291289 model
@@ -344,11 +342,6 @@ def sgd_optimization_mnist(learning_rate=0.13, n_epochs=1000,
344342 x : test_set_x [index * batch_size : (index + 1 ) * batch_size ],
345343 y : test_set_y [index * batch_size : (index + 1 ) * batch_size ]})
346344
347- release_output = theano .function (inputs = [index ],
348- outputs = classifier .release_output (),
349- givens = {
350- x : predict_set_x [index :]})
351-
352345 validate_model = theano .function (inputs = [index ],
353346 outputs = classifier .errors (y ),
354347 givens = {
@@ -428,9 +421,11 @@ def sgd_optimization_mnist(learning_rate=0.13, n_epochs=1000,
428421 test_losses = [test_model (i )
429422 for i in xrange (n_test_batches )]
430423 test_score = numpy .mean (test_losses )
424+
425+ y_pred_show = classifier .y_pred .eval ({input :predict_set_x })
431426
432- y_pred_show = [release_output ( i )
433- for i in xrange (n_predict_batches )]
427+ y_pred_show = [classifier . y_pred . eval ({ input : predict_set_x [ index * batch_size : ( index + 1 ) * batch_size ]} )
428+ for index in xrange (n_predict_batches )]
434429
435430 print y_pred_show ;
436431 f = open ("predict_res" ,"w+" );