@@ -61,17 +61,17 @@ def contrastive_divergence(self, lr=0.1, k=1, input=None):
         self.input = input
 
         ''' CD-k '''
-        pre_sigmoid_ph, ph_mean, ph_sample = self.sample_h_given_v(self.input)
+        ph_mean, ph_sample = self.sample_h_given_v(self.input)
 
         chain_start = ph_sample
 
         for step in xrange(k):
             if step == 0:
-                pre_sigmoid_nvs, nv_means, nv_samples,\
-                pre_sigmoid_nhs, nh_means, nh_samples = self.gibbs_hvh(chain_start)
+                nv_means, nv_samples,\
+                nh_means, nh_samples = self.gibbs_hvh(chain_start)
             else:
-                pre_sigmoid_nvs, nv_means, nv_samples,\
-                pre_sigmoid_nhs, nh_means, nh_samples = self.gibbs_hvh(nh_samples)
+                nv_means, nv_samples,\
+                nh_means, nh_samples = self.gibbs_hvh(nh_samples)
 
         # chain_end = nv_samples
 
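[Note: only the return signatures change in this hunk; the k-step Gibbs chain
is untouched. The weight update applied after the chain is elided from this
diff; as a minimal sketch of the standard CD-k form (names mirror the hunk
above, not the commit's exact lines):

    import numpy

    def cd_k_weight_update(W, v0, ph_mean, nv_samples, nh_means, lr=0.1):
        # positive (data) statistics minus negative (chain-end) statistics,
        # averaged over the minibatch
        grad = (numpy.dot(v0.T, ph_mean)
                - numpy.dot(nv_samples.T, nh_means)) / v0.shape[0]
        return W + lr * grad
]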
@@ -86,37 +86,37 @@ def contrastive_divergence(self, lr=0.1, k=1, input=None):
 
 
     def sample_h_given_v(self, v0_sample):
-        pre_sigmoid_h1, h1_mean = self.propup(v0_sample)
+        h1_mean = self.propup(v0_sample)
         h1_sample = self.numpy_rng.binomial(size=h1_mean.shape,   # discrete: binomial
                                             n=1,
                                             p=h1_mean)
 
-        return [pre_sigmoid_h1, h1_mean, h1_sample]
+        return [h1_mean, h1_sample]
 
 
     def sample_v_given_h(self, h0_sample):
-        pre_sigmoid_v1, v1_mean = self.propdown(h0_sample)
+        v1_mean = self.propdown(h0_sample)
         v1_sample = self.numpy_rng.binomial(size=v1_mean.shape,   # discrete: binomial
                                             n=1,
                                             p=v1_mean)
 
-        return [pre_sigmoid_v1, v1_mean, v1_sample]
+        return [v1_mean, v1_sample]
 
     def propup(self, v):
         pre_sigmoid_activation = numpy.dot(v, self.W) + self.hbias
-        return [pre_sigmoid_activation, sigmoid(pre_sigmoid_activation)]
+        return sigmoid(pre_sigmoid_activation)
 
     def propdown(self, h):
         pre_sigmoid_activation = numpy.dot(h, self.W.T) + self.vbias
-        return [pre_sigmoid_activation, sigmoid(pre_sigmoid_activation)]
+        return sigmoid(pre_sigmoid_activation)
 
 
     def gibbs_hvh(self, h0_sample):
-        pre_sigmoid_v1, v1_mean, v1_sample = self.sample_v_given_h(h0_sample)
-        pre_sigmoid_h1, h1_mean, h1_sample = self.sample_h_given_v(v1_sample)
+        v1_mean, v1_sample = self.sample_v_given_h(h0_sample)
+        h1_mean, h1_sample = self.sample_h_given_v(v1_sample)
 
-        return [pre_sigmoid_v1, v1_mean, v1_sample,
-                pre_sigmoid_h1, h1_mean, h1_sample]
+        return [v1_mean, v1_sample,
+                h1_mean, h1_sample]
 
 
     def get_reconstruction_cross_entropy(self):
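[Note: binomial(n=1, p=mean) draws each unit as an independent Bernoulli
variable, so sampling a layer is equivalent to thresholding uniforms against
the sigmoid means. A self-contained sketch, assuming only numpy:

    import numpy

    rng = numpy.random.RandomState(123)
    h1_mean = numpy.array([[0.2, 0.9],
                           [0.5, 0.5]])

    # the module's form: one binomial trial per unit
    h1_sample = rng.binomial(size=h1_mean.shape, n=1, p=h1_mean)

    # the same distribution, via uniform thresholding
    h1_alt = (rng.uniform(size=h1_mean.shape) < h1_mean).astype(int)
]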
@@ -139,6 +139,35 @@ def reconstruct(self, v):
         return reconstructed_v
 
 
+'''
+RBM w/ continuous-valued inputs (Linear Energy)
+'''
+class CRBM(RBM):
+    def propdown(self, h):
+        pre_activation = numpy.dot(h, self.W.T) + self.vbias   # linear, not sigmoid
+        return pre_activation
+
+
+
+    def sample_v_given_h(self, h0_sample):
+        a_h = self.propdown(h0_sample)
+        en = numpy.exp(-a_h)
+        ep = numpy.exp(a_h)
+
+        v1_mean = 1 / (1 - en) - 1 / a_h   # mean of the truncated exponential on (0, 1)
+        U = numpy.array(self.numpy_rng.uniform(
+            low=0,
+            high=1,
+            size=v1_mean.shape))
+
+        v1_sample = numpy.log((1 - U * (1 - ep))) / a_h   # exact inverse-CDF sample
+
+
+        return [v1_mean, v1_sample]
+
+
+
+
 def test_rbm(learning_rate=0.1, k=1, training_epochs=1000):
     data = numpy.array([[1,1,1,0,0,0],
                         [1,0,1,0,0,0],
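[Note: CRBM.sample_v_given_h above draws exactly from the conditional of a
continuous (0, 1) unit with linear energy, the truncated exponential
p(v|h) = a * exp(a*v) / (exp(a) - 1) with a = numpy.dot(h, W.T) + vbias.
Its mean is 1/(1 - exp(-a)) - 1/a (the v1_mean line), and inverting the CDF
gives v = log(1 + U*(exp(a) - 1)) / a (the v1_sample line, written there as
log(1 - U*(1 - ep)) / a). A self-contained numerical check, assuming only
numpy; both expressions are 0/0 at a == 0 (the limit is 0.5), an edge case
the class inherits:

    import numpy

    rng = numpy.random.RandomState(123)
    a = numpy.array([2.0, -1.5, 0.7])   # example pre-activations (nonzero)

    # closed-form mean of the truncated exponential on (0, 1)
    mean = 1 / (1 - numpy.exp(-a)) - 1 / a

    # inverse-CDF samples; their average should approach the closed-form mean
    U = rng.uniform(size=(100000, a.shape[0]))
    samples = numpy.log(1 + U * (numpy.exp(a) - 1)) / a

    print(samples.mean(axis=0))
    print(mean)
]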
@@ -148,7 +177,6 @@ def test_rbm(learning_rate=0.1, k=1, training_epochs=1000):
                         [0,0,1,1,1,0]])
 
 
-
     rng = numpy.random.RandomState(123)
 
     # construct RBM
@@ -168,5 +196,35 @@ def test_rbm(learning_rate=0.1, k=1, training_epochs=1000):
     print rbm.reconstruct(v)
 
 
+
+def test_crbm(learning_rate=0.1, k=1, training_epochs=1000):
+    data = numpy.array([[0.4, 0.5, 0.5, 0.,  0.,  0.],
+                        [0.5, 0.3, 0.5, 0.,  0.,  0.],
+                        [0.4, 0.5, 0.5, 0.,  0.,  0.],
+                        [0.,  0.,  0.5, 0.3, 0.5, 0.],
+                        [0.,  0.,  0.5, 0.4, 0.5, 0.],
+                        [0.,  0.,  0.5, 0.5, 0.5, 0.]])
+
+
+    rng = numpy.random.RandomState(123)
+
+    # construct CRBM
+    rbm = CRBM(input=data, n_visible=6, n_hidden=5, numpy_rng=rng)
+
+    # train
+    for epoch in xrange(training_epochs):
+        rbm.contrastive_divergence(lr=learning_rate, k=k)
+        cost = rbm.get_reconstruction_cross_entropy()
+        print >> sys.stderr, 'Training epoch %d, cost is ' % epoch, cost
+
+
+    # test
+    v = numpy.array([[0.5, 0.5, 0.,  0.,  0.,  0.],
+                     [0.,  0.,  0.,  0.5, 0.5, 0.]])
+
+    print rbm.reconstruct(v)
+
+
 if __name__ == "__main__":
-    test_rbm()
+    # test_rbm()
+    test_crbm()