#!/usr/bin/env python
# -*- coding: utf-8 -*-
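"""Denoising autoencoder (dA) with tied weights, implemented with NumPy only.

The input is corrupted with masking noise, encoded by a sigmoid layer,
decoded through the transposed encoder weights, and trained by manual
gradient ascent on the reconstruction log-likelihood (cross-entropy).
"""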

import sys
import numpy


def sigmoid(x):
    # Elementwise logistic activation, used by both the encoder and the
    # decoder (defined locally so the file has no external dependencies).
    return 1. / (1. + numpy.exp(-x))


class dA(object):
    def __init__(self, input=None, n_visible=2, n_hidden=3,
                 W=None, hbias=None, vbias=None, numpy_rng=None):

        self.n_visible = n_visible  # num of units in visible (input) layer
        self.n_hidden = n_hidden    # num of units in hidden layer

        if numpy_rng is None:
            numpy_rng = numpy.random.RandomState(1234)

        if W is None:
            a = 1. / n_visible
            W = numpy_rng.uniform(low=-a,  # initialize W uniformly in [-a, a]
                                  high=a,
                                  size=(n_visible, n_hidden))

        if hbias is None:
            hbias = numpy.zeros(n_hidden)   # initialize hidden bias to 0

        if vbias is None:
            vbias = numpy.zeros(n_visible)  # initialize visible bias to 0

        self.numpy_rng = numpy_rng
        self.x = input
        self.W = W
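        # Tied weights: W_prime is a transposed *view* of W, so in-place
        # updates to W (via +=) keep encoder and decoder weights in sync.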
        self.W_prime = self.W.T
        self.hbias = hbias
        self.vbias = vbias

        # self.params = [self.W, self.hbias, self.vbias]

    def get_corrupted_input(self, input, corruption_level):
        assert 0. <= corruption_level < 1.

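        # Masking noise: each element of the input is zeroed out
        # independently with probability corruption_level.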
        return self.numpy_rng.binomial(size=input.shape,
                                       n=1,
                                       p=1 - corruption_level) * input

    # Encode
    def get_hidden_values(self, input):
        return sigmoid(numpy.dot(input, self.W) + self.hbias)

    # Decode
    def get_reconstructed_input(self, hidden):
        return sigmoid(numpy.dot(hidden, self.W_prime) + self.vbias)

    def train(self, lr=0.1, corruption_level=0.3, input=None):
        if input is not None:
            self.x = input

        x = self.x
        tilde_x = self.get_corrupted_input(x, corruption_level)
        y = self.get_hidden_values(tilde_x)
        z = self.get_reconstructed_input(y)

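        # Backpropagation by hand. With sigmoid outputs and a cross-entropy
        # loss, the error term at the visible layer reduces to (x - z);
        # pushing it back through the tied weights gives the hidden delta.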
        L_h2 = x - z
        L_h1 = numpy.dot(L_h2, self.W) * y * (1 - y)

        L_vbias = L_h2
        L_hbias = L_h1
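        # W receives two gradient terms because it is used twice: to encode
        # (tilde_x -> y) and, transposed, to decode (y -> z).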
        L_W = numpy.dot(tilde_x.T, L_h1) + numpy.dot(L_h2.T, y)

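        # Gradient ascent on the log-likelihood; the W gradient is summed
        # over the batch while the bias gradients are averaged.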
        self.W += lr * L_W
        self.hbias += lr * numpy.mean(L_hbias, axis=0)
        self.vbias += lr * numpy.mean(L_vbias, axis=0)

    def negative_log_likelihood(self, corruption_level=0.3):
        tilde_x = self.get_corrupted_input(self.x, corruption_level)
        y = self.get_hidden_values(tilde_x)
        z = self.get_reconstructed_input(y)

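        # Mean cross-entropy between the clean input x and its
        # reconstruction z, summed over the visible units.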
        cross_entropy = -numpy.mean(
            numpy.sum(self.x * numpy.log(z) +
                      (1 - self.x) * numpy.log(1 - z),
                      axis=1))

        return cross_entropy

    def reconstruct(self, x):
        y = self.get_hidden_values(x)
        z = self.get_reconstructed_input(y)
        return z


def test_dA(learning_rate=0.1, corruption_level=0.3, training_epochs=50):
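    # Toy data: two block patterns, one active in the first ten units and
    # one in the last ten, each followed by a few noisy variants.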
    data = numpy.array([[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0],
                        [1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0],
                        [1, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0],
                        [1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0],
                        [0, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0],
                        [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1],
                        [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1],
                        [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 1, 1, 0, 1],
                        [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1],
                        [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 0]])

    rng = numpy.random.RandomState(123)

    # construct dA
    da = dA(input=data, n_visible=20, n_hidden=5, numpy_rng=rng)

    # train
    for epoch in range(training_epochs):
        da.train(lr=learning_rate, corruption_level=corruption_level)
        # cost = da.negative_log_likelihood(corruption_level=corruption_level)
        # print('Training epoch %d, cost is %f' % (epoch, cost), file=sys.stderr)
        # learning_rate *= 0.95

    # test: reconstruct two corrupted inputs the model has not seen
    x = numpy.array([[1, 0, 1, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1],
                     [0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0]])

    print(da.reconstruct(x))


if __name__ == "__main__":
    test_dA()