@@ -193,40 +193,48 @@ def forward_backward(self, y):
 
         # set up
         N = tf.shape(y)[0]
-        nT = self.length or y.shape[1]
-        # nT = tf.shape(y)[1]
 
-        forward = []
+        # y (batch, recurrent, features) -> (recurrent, batch, features)
+        y = tf.transpose(y, (1, 0, 2))
 
         # forward pass
-        forward.append(tf.ones((N, self.K)) * (1.0 / self.K))
-        for t in range(nT):
-            tmp = tf.multiply(tf.matmul(forward[t], self.P), y[:, t])
-
-            forward.append(tmp / tf.expand_dims(tf.reduce_sum(tmp, axis=1), axis=1))
+        def forward_function(last_forward, yi):
+            tmp = tf.multiply(tf.matmul(last_forward, self.P), yi)
+            return tmp / tf.reduce_sum(tmp, axis=1, keep_dims=True)
+
+        forward = tf.scan(
+            forward_function,
+            y,
+            initializer=tf.ones((N, self.K)) * (1.0 / self.K),
+        )
 
         # backward pass
-        backward = [None] * (nT + 1)
-        backward[-1] = tf.ones((N, self.K)) * (1.0 / self.K)
-        for t in range(nT, 0, -1):
+        def backward_function(last_backward, yi):
             # combine transition matrix with observations
             combined = tf.multiply(
-                tf.expand_dims(self.P, 0), tf.expand_dims(y[:, t - 1], 1)
+                tf.expand_dims(self.P, 0), tf.expand_dims(yi, 1)
             )
             tmp = tf.reduce_sum(
-                tf.multiply(combined, tf.expand_dims(backward[t], 1)), axis=2
+                tf.multiply(combined, tf.expand_dims(last_backward, 1)), axis=2
             )
-            backward[t - 1] = tmp / tf.expand_dims(tf.reduce_sum(tmp, axis=1), axis=1)
+            return tmp / tf.reduce_sum(tmp, axis=1, keep_dims=True)
 
-        # remove initial/final probabilities
-        forward = forward[1:]
-        backward = backward[:-1]
+        backward = tf.scan(
+            backward_function,
+            tf.reverse(y, [0]),
+            initializer=tf.ones((N, self.K)) * (1.0 / self.K),
+        )
+        backward = tf.reverse(backward, [0])
 
+        # combine forward and backward into posterior probabilities
+        # (recurrent, batch, features)
+        posterior = forward * backward
+        posterior = posterior / tf.reduce_sum(posterior, axis=2, keep_dims=True)
 
-        # combine and normalize
-        posterior = [f * b for f, b in zip(forward, backward)]
-        posterior = [p / tf.expand_dims(tf.reduce_sum(p, axis=1), axis=1) for p in posterior]
-        posterior = tf.stack(posterior, axis=1)
+        # (recurrent, batch, features) -> (batch, recurrent, features)
+        posterior = tf.transpose(posterior, (1, 0, 2))
+        forward = tf.transpose(forward, (1, 0, 2))
+        backward = tf.transpose(backward, (1, 0, 2))
 
         return posterior, forward, backward
 
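As a sanity check on the change, here is a minimal standalone sketch (not part of the diff) of the forward recursion written both ways, confirming that tf.scan over time-major observations reproduces the Python loop it replaces. It assumes TF 2.x eager execution, where the reduce_sum keyword is spelled keepdims rather than the keep_dims used above, and the names P, y, N, T and K are stand-ins for the model's transition matrix, per-step observation likelihoods, batch size, sequence length and number of states.

import numpy as np
import tensorflow as tf

N, T, K = 4, 6, 3  # batch size, sequence length, number of hidden states
rng = np.random.default_rng(0)

# stand-ins for self.P and the observation likelihoods y (assumed names)
P = tf.constant(rng.dirichlet(np.ones(K), size=K), dtype=tf.float32)      # (K, K) transition matrix
y = tf.constant(rng.uniform(0.1, 1.0, size=(N, T, K)), dtype=tf.float32)  # (batch, time, states)

# scan version: time axis first, exactly as in the diff
y_t = tf.transpose(y, (1, 0, 2))  # (T, N, K)

def forward_function(last_forward, yi):
    tmp = tf.multiply(tf.matmul(last_forward, P), yi)
    return tmp / tf.reduce_sum(tmp, axis=1, keepdims=True)

forward_scan = tf.scan(forward_function, y_t,
                       initializer=tf.ones((N, K)) / K)  # (T, N, K)

# loop version: the code removed by the diff
forward_loop = [tf.ones((N, K)) / K]
for t in range(T):
    tmp = tf.multiply(tf.matmul(forward_loop[t], P), y[:, t])
    forward_loop.append(tmp / tf.reduce_sum(tmp, axis=1, keepdims=True))
forward_loop = tf.stack(forward_loop[1:], axis=0)  # drop the uniform prior -> (T, N, K)

np.testing.assert_allclose(forward_scan.numpy(), forward_loop.numpy(), rtol=1e-5)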
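Continuing the same sketch, the backward pass is the same kind of scan run over the time-reversed observations and flipped back afterwards, mirroring the tf.reverse(y, [0]) / tf.reverse(backward, [0]) pair in the diff; the final assertion only checks that each posterior slice normalizes over the K states, not that it matches a reference implementation.

def backward_function(last_backward, yi):
    # combined[n, i, j] = P[i, j] * yi[n, j]: transition i -> j weighted by the observation at j
    combined = tf.multiply(tf.expand_dims(P, 0), tf.expand_dims(yi, 1))
    tmp = tf.reduce_sum(tf.multiply(combined, tf.expand_dims(last_backward, 1)), axis=2)
    return tmp / tf.reduce_sum(tmp, axis=1, keepdims=True)

backward = tf.scan(backward_function, tf.reverse(y_t, [0]),
                   initializer=tf.ones((N, K)) / K)
backward = tf.reverse(backward, [0])  # back to forward time order

posterior = forward_scan * backward
posterior = posterior / tf.reduce_sum(posterior, axis=2, keepdims=True)

# every (time, batch) slice is a distribution over the K states
np.testing.assert_allclose(tf.reduce_sum(posterior, axis=2).numpy(),
                           np.ones((T, N)), rtol=1e-5)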