
Commit 6b64eb8

committed: various changes
1 parent 0eb5575

File tree: 5 files changed (+3237, -584 lines)


code/best_model.pkl

Lines changed: 1990 additions & 325 deletions
Large diffs are not rendered by default.

code/convolutional_mlp_test.py renamed to code/convolutional_mlp_v2.py

Lines changed: 174 additions & 25 deletions
@@ -26,6 +26,7 @@
 import timeit
 
 import numpy
+import cPickle
 
 import theano
 import theano.tensor as T
@@ -34,6 +35,7 @@
 
 from logistic_sgd_test import LogisticRegression, load_data
 from mlp import HiddenLayer
+from fetex_image import FetexImage
 
 
 class LeNetConvPoolLayer(object):
@@ -117,9 +119,9 @@ def __init__(self, rng, input, filter_shape, image_shape, poolsize=(2, 2)):
 # def evaluate_lenet5(learning_rate=0.1, n_epochs=100,
 #                     dataset='mnist.pkl.gz',
 #                     nkerns=[(96) , (256)], batch_size=300):
-def evaluate_lenet5(learning_rate=0.1, n_epochs=100,
+def evaluate_lenet5(learning_rate=0.1, n_epochs=2,
                     dataset='mnist.pkl.gz',
-                    nkerns=[(25 / 1) , (25 / 1)], batch_size=4):
+                    nkerns=[(25 / 1) , (25 / 1)], batch_size=400):
 
     """ Demonstrates lenet on MNIST dataset
 
@@ -224,14 +226,14 @@ def evaluate_lenet5(learning_rate=0.1, n_epochs=100,
         rng,
         input=layer2_input,
         n_in=nkerns[1] * 13 * 13,
-        n_out=2,
+        n_out=400,
         activation=T.tanh
     )
 
     # classify the values of the fully-connected sigmoidal layer
     #layer3 = LogisticRegression(input=layer2.output, n_in=500, n_out=10)
     #layer3 = LogisticRegression(input=layer2.output, n_in=500, n_out=2)
-    layer4 = LogisticRegression(input=layer3.output, n_in=2, n_out=2)
+    layer4 = LogisticRegression(input=layer3.output, n_in=400, n_out=21)
 
     # the cost we minimize during training is the NLL of the model
     #cost = layer3.negative_log_likelihood(y)
@@ -352,9 +354,33 @@ def evaluate_lenet5(learning_rate=0.1, n_epochs=100,
                       (epoch, minibatch_index + 1, n_train_batches,
                        test_score * 100.))
 
+                    output = open('../data/layer0.pkl', 'wb')
+                    cPickle.dump(layer0, output,protocol=-1)
+                    output.close()
+
+                    output = open('../data/layer1.pkl', 'wb')
+                    cPickle.dump(layer1, output,protocol=-1)
+                    output.close()
+
+                    # output = open('../data/layer2.pkl', 'wb')
+                    # cPickle.dump(layer2, output,protocol=-1)
+                    # output.close()
+
+                    output = open('../data/layer3.pkl', 'wb')
+                    cPickle.dump(layer3, output,protocol=-1)
+                    output.close()
+
+                    output = open('../data/layer4.pkl', 'wb')
+                    cPickle.dump(layer4, output,protocol=-1)
+                    output.close()
+
             # save the best model
             # with open('best_model.pkl', 'w') as f:
-            #     cPickle.dump(classifier, f)
+            #     cPickle.dump(layer0, f)
+            #     cPickle.dump(layer1, f)
+            #     cPickle.dump(layer2, f)
+            #     cPickle.dump(layer3, f)
+            #     cPickle.dump(layer4, f)
 
             if patience <= iter:
                 done_looping = True
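
Note on the hunk above: each trained layer is written to its own pickle via cPickle.dump(..., protocol=-1), i.e. the highest binary pickle protocol. Below is a minimal, self-contained sketch of that save/load round trip. It assumes Python 2 with cPickle, as used in this file; DummyLayer and the /tmp path are illustrative stand-ins for the real Theano layer objects and data paths, not part of the commit.

import cPickle

class DummyLayer(object):
    # stand-in for a trained Theano layer; only needs to be picklable
    def __init__(self, W, b):
        self.W = W
        self.b = b

layer = DummyLayer(W=[[0.1, 0.2]], b=[0.0])

# protocol=-1 selects the highest available (binary) pickle protocol,
# matching the protocol=-1 argument passed to cPickle.dump in the diff
output = open('/tmp/layer0_demo.pkl', 'wb')
cPickle.dump(layer, output, protocol=-1)
output.close()

restored = cPickle.load(open('/tmp/layer0_demo.pkl', 'rb'))
print restored.W, restored.b
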
@@ -369,32 +395,155 @@ def evaluate_lenet5(learning_rate=0.1, n_epochs=100,
           os.path.split(__file__)[1] +
           ' ran for %.2fm' % ((end_time - start_time) / 60.))
 
-def predict():
-    """
-    An example of how to load a trained model and use it
-    to predict labels.
-    """
+# def predict(self, data):
+#     """
+#     the CNN expects inputs with Nsamples = self.batch_size.
+#     In order to run 'predict' on an arbitrary number of samples we
+#     pad as necessary.
+#     """
+#     if isinstance(data, list):
+#         data = np.array(data)
+#     if data.ndim == 1:
+#         data = np.array([data])
+
+#     nsamples = data.shape[0]
+#     n_batches = nsamples//self.batch_size
+#     n_rem = nsamples%self.batch_size
+#     if n_batches > 0:
+#         preds = [list(self.predict_wrap(data[i*self.batch_size:(i+1)*self.batch_size]))\
+#                  for i in range(n_batches)]
+#     else:
+#         preds = []
+#     if n_rem > 0:
+#         z = np.zeros((self.batch_size, self.n_in * self.n_in))
+#         z[0:n_rem] = data[n_batches*self.batch_size:n_batches*self.batch_size+n_rem]
+#         preds.append(self.predict_wrap(z)[0:n_rem])
+
+#     return np.hstack(preds).flatten()
+
+def cosine_distance(a, b):
+    import numpy as np
+    from numpy import linalg as LA
+    dot_product = np.dot(a,b.T)
+    cosine_distance = dot_product / (LA.norm(a) * LA.norm(b))
+    return cosine_distance
+
+def predict():
+
+    from sktheano_cnn import MetaCNN as CNN
+    cnn = CNN()
+
+    pkl_file = open( '../data/train_set.pkl', 'rb')
+    train_set = cPickle.load(pkl_file)
+
+    pkl_file = open( '../data/valid_set.pkl', 'rb')
+    valid_set = cPickle.load(pkl_file)
+
+    pkl_file = open( '../data/test_set.pkl', 'rb')
+    test_set = cPickle.load(pkl_file)
+
+    """An example of how to load a trained model and use it
+    to predict labels.
+    """
+
+    fe = FetexImage(verbose=True)
+    # load the saved model
+    classifier = cPickle.load(open('best_model.pkl'))
+
+    layer0 = cPickle.load(open('../data/layer0.pkl'))
+    layer1 = cPickle.load(open('../data/layer1.pkl'))
+    # layer2 = cPickle.load(open('../data/layer2.pkl'))
+    layer3 = cPickle.load(open('../data/layer3.pkl'))
+    layer4 = cPickle.load(open('../data/layer4.pkl'))
+
+    #layer0_input = x.reshape((batch_size, 3, 64, 64))
+
+    # predict = theano.function(
+    #     outputs=layer4.y_pred,
+    #     givens = {x : train_set_x[0] }
+    # )
+
+    # compile a predictor function
+    predict_model = theano.function(
+        inputs=[classifier.input],
+        outputs=classifier.y_pred)
+
+    # We can test it on some examples from test test
+    dataset='mnist.pkl.gz'
+    datasets = load_data(dataset)
 
-    # load the saved model
-    classifier = cPickle.load(open('best_model.pkl'))
+    test_set_x, test_set_y = datasets[2]
+    test_set_x = test_set_x.get_value()
 
-    # compile a predictor function
-    predict_model = theano.function(
-        inputs=[classifier.input],
-        outputs=classifier.y_pred)
+    train_set_x, train_set_y = datasets[0]
+    train_set_x = train_set_x.get_value()
+
+    pkl_file = open( '../data/X_original.pkl', 'rb')
+    X_original = cPickle.load(pkl_file)
+
+    a = X_original[0]
+    #fe.reconstructImage(a).show()
+
+    #predicted_values = predict_model([a])
+
+    get_input = theano.function(
+        inputs=[classifier.input],
+        outputs=classifier.input
+    )
 
-    # We can test it on some examples from test test
-    dataset='mnist.pkl.gz'
-    datasets = load_data(dataset)
-    test_set_x, test_set_y = datasets[2]
-    test_set_x = test_set_x.get_value()
+    a = get_input(train_set_x[0:1])
+    #print a.shape
 
-    predicted_values = predict_model(test_set_x[:10])
-    print ("Predicted values for the first 10 examples in test set:")
-    print predicted_values
+    x = T.matrix('x')   # the data is presented as rasterized images
+    predict = theano.function(
+        inputs = [x],
+        outputs=layer3.output
+    )
+    # givens = { x : train_set_x[0] }
+    #train_set_x = train_set_x[0:400]
+    #x = train_set_x.reshape((400, 3, 64, 64))
+    x = train_set_x.reshape(np.zeros((400,3,64,64)))
+    print predict(x)
+    #predicted_values = predict_model([train_set_x[0]])
+    #print predicted_values
+    return "fffff"
+
+
+    max_similarity = 0
+    max_similarity_pos = -1
+    #for i in xrange(1,len(train_set_x)):
+    for i in xrange(1,1000):
+        b = get_input([train_set_x[i]])
+        d = cosine_distance(a, b)
+        if d > max_similarity:
+            max_similarity = d
+            max_similarity_pos = i
+
+    fe.reconstructImage(X_original[max_similarity_pos]).show()
+
+    #a = a.flatten(order='F')
+    # a = a * 256
+    # a = numpy.array(a,dtype=numpy.uint8)
+
+    #b = b.flatten(order='F')
+    # b = b * 256
+    # b = numpy.array(b,dtype=numpy.uint8)
+
+    # a = get_input([a])
+    # b = get_input([b])
+
+    print a.shape
+    print b.shape
+    print cosine_distance(a, b)
+
+    # #print get_input(test_set_x[0:1]).sum()
+
+    # print ("Predicted values for the first 10 examples in test set:")
+    # print predicted_values
 
 if __name__ == '__main__':
-    evaluate_lenet5()
+    #evaluate_lenet5()
+    predict()
 
 
 def experiment(state, channel):
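
The new predict() path loads the pickled layers, maps inputs through layer3 to get feature vectors, and then scans the training set for the most cosine-similar image. Below is a minimal, numpy-only sketch of that lookup in the same Python 2 style; the function and variable names are illustrative, the random 400-dimensional features merely stand in for the real layer3 outputs, and larger values mean more similar (the diff's cosine_distance is a similarity despite its name).

import numpy as np

def cosine_similarity(a, b):
    # same formula as cosine_distance() in the diff: dot(a, b) / (|a| * |b|)
    return np.dot(a, b) / (np.linalg.norm(a) * np.linalg.norm(b))

def most_similar(query, features):
    # linear scan, like the `for i in xrange(1,1000)` loop in predict()
    best_pos, best_sim = -1, -2.0
    for i, feat in enumerate(features):
        sim = cosine_similarity(query, feat)
        if sim > best_sim:
            best_sim, best_pos = sim, i
    return best_pos, best_sim

features = np.random.rand(1000, 400)  # stand-in for layer3 feature vectors
query = features[0]
print most_similar(query, features[1:])
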

0 commit comments
