Reuse testcases in both CPU and GPU tests of CTC

上级 b4f54eae
...@@ -9,6 +9,7 @@ from theano.tests import unittest_tools as utt ...@@ -9,6 +9,7 @@ from theano.tests import unittest_tools as utt
import theano.gpuarray import theano.gpuarray
from theano.gpuarray.ctc import (gpu_ctc, GpuConnectionistTemporalClassification) from theano.gpuarray.ctc import (gpu_ctc, GpuConnectionistTemporalClassification)
from theano.tensor.nnet.ctc import (ctc, ctc_available, ConnectionistTemporalClassification) from theano.tensor.nnet.ctc import (ctc, ctc_available, ConnectionistTemporalClassification)
from theano.tensor.nnet.tests.test_ctc import (setup_torch_case, setup_ctc_case, setup_grad_case)
from .config import (mode_with_gpu, mode_without_gpu) from .config import (mode_with_gpu, mode_without_gpu)
...@@ -118,53 +119,12 @@ class TestCTC(unittest.TestCase): ...@@ -118,53 +119,12 @@ class TestCTC(unittest.TestCase):
# Test obtained from Torch tutorial at: # Test obtained from Torch tutorial at:
# https://github.com/baidu-research/warp-ctc/blob/master/torch_binding/TUTORIAL.md # https://github.com/baidu-research/warp-ctc/blob/master/torch_binding/TUTORIAL.md
def test_torch_case(self): def test_torch_case(self):
# Layout, from slowest to fastest changing dimension, is (time, batchSize, inputLayerSize) activations, labels, activation_times, expected_costs, expected_grads = setup_torch_case()
activations = np.asarray([[[0, 0, 0, 0, 0], [1, 2, 3, 4, 5], [-5, -4, -3, -2, -1]], self.check_ctc(activations, labels, activation_times, expected_costs, expected_grads)
[[0, 0, 0, 0, 0], [6, 7, 8, 9, 10], [-10, -9, -8, -7, -6]],
[[0, 0, 0, 0, 0], [11, 12, 13, 14, 15], [-15, -14, -13, -12, -11]]],
dtype=np.float32)
# Duration of each sequence
activation_times = np.asarray([1, 3, 3], dtype=np.int32)
# Labels for each sequence
labels = np.asarray([[1, -1],
[3, 3],
[2, 3]], dtype=np.int32)
expected_costs = np.asarray([1.609437943, 7.355742931, 4.938849926],
dtype=np.float32)
grads = [[[0.2, -0.8, 0.2, 0.2, 0.2],
[0.01165623125, 0.03168492019, 0.08612854034, -0.7658783197, 0.636408627],
[-0.02115798369, 0.03168492019, -0.8810571432, 0.2341216654, 0.636408627]],
[[0, 0, 0, 0, 0],
[-0.9883437753, 0.03168492019, 0.08612854034, 0.2341216654, 0.636408627],
[-0.02115798369, 0.03168492019, -0.1891518533, -0.4577836394, 0.636408627]],
[[0, 0, 0, 0, 0],
[0.01165623125, 0.03168492019, 0.08612854034, -0.7658783197, 0.636408627],
[-0.02115798369, 0.03168492019, 0.08612854034, -0.7330639958, 0.636408627]]]
expected_gradients = np.asarray(grads, dtype=np.float32)
self.check_ctc(activations, labels, activation_times, expected_costs, expected_gradients)
def test_ctc(self): def test_ctc(self):
activations = np.asarray([[[0.1, 0.6, 0.1, 0.1, 0.1], [0.1, 0.1, 0.6, 0.1, 0.1]], activations, labels, input_length, expected_costs, expected_grads = setup_ctc_case()
[[0.6, 0.1, 0.1, 0.1, 0.1], [0.1, 0.1, 0.5, 0.2, 0.1]]], self.check_ctc(activations, labels, input_length, expected_costs, expected_grads)
dtype=np.float32)
activation_times = np.asarray([2, 2], dtype=np.int32)
labels = np.asarray([[1, 2], [1, 2]], dtype=np.int32)
expected_costs = np.asarray([2.962858438, 3.053659201], dtype=np.float32)
grads = [[[0.177031219, -0.7081246376, 0.177031219, 0.177031219, 0.177031219],
[0.177031219, -0.8229685426, 0.291875124, 0.177031219, 0.177031219]],
[[0.291875124, 0.177031219, -0.8229685426, 0.177031219, 0.177031219],
[0.1786672771, 0.1786672771, -0.7334594727, 0.1974578798, 0.1786672771]]]
expected_gradients = np.asarray(grads, dtype=np.float32)
self.check_ctc(activations, labels, activation_times, expected_costs, expected_gradients)
def test_verify_grad(self): def test_verify_grad(self):
def ctc_op_functor(labels, in_lengths): def ctc_op_functor(labels, in_lengths):
...@@ -175,13 +135,7 @@ class TestCTC(unittest.TestCase): ...@@ -175,13 +135,7 @@ class TestCTC(unittest.TestCase):
return gpu_ctc(acts, t_labels, t_activation_times) return gpu_ctc(acts, t_labels, t_activation_times)
return wrapper return wrapper
activations = np.asarray([[[0.1, 0.6, 0.1, 0.1, 0.1], [0.1, 0.1, 0.6, 0.1, 0.1]], activations, activation_times, labels = setup_grad_case()
[[0.6, 0.1, 0.1, 0.1, 0.1], [0.1, 0.1, 0.5, 0.2, 0.1]]],
dtype=np.float32)
activation_times = np.asarray([2, 2], dtype=np.int32)
labels = np.asarray([[1, 2], [1, 2]], dtype=np.int32)
ctc_op = ctc_op_functor(labels, activation_times) ctc_op = ctc_op_functor(labels, activation_times)
......
...@@ -9,50 +9,10 @@ from theano.tests import unittest_tools as utt ...@@ -9,50 +9,10 @@ from theano.tests import unittest_tools as utt
from theano.tensor.nnet.ctc import (ctc_available, ctc, ConnectionistTemporalClassification) from theano.tensor.nnet.ctc import (ctc_available, ctc, ConnectionistTemporalClassification)
class TestCTC(unittest.TestCase): def setup_torch_case():
"""
Test Baidu CTC wrapper implementation.
Expected values for costs and gradients are obtained through an external
C implementation, that uses the library directly.
"""
def setUp(self):
    # Skip every test in this case when the optional warp-ctc library
    # (required by the CTC op) is not available on this machine.
    if not ctc_available():
        self.skipTest('Optional library warp-ctc not available')
def run_ctc(self, activations, labels, input_length, expected_costs, expected_grads):
    """
    Build, compile and run a CTC graph on the given inputs, then compare
    the computed costs and gradients against the expected reference values.
    Also checks that the gradient-disabling optimization applies.
    """
    # Create symbolic variables
    t_activations = theano.shared(activations, name="activations")
    # Duration (number of time steps) of each sequence in the batch
    t_activation_times = theano.shared(input_length, name="activation_times")
    t_labels = theano.shared(labels, name="labels")
    t_cost = ctc(t_activations, t_labels, t_activation_times)
    # Symbolic gradient of CTC cost
    t_grad = T.grad(T.mean(t_cost), t_activations)
    # Compile symbolic functions
    train = theano.function([], [t_cost, t_grad])
    cost, grad = train()
    # T.mean divides by the batch size (cost.shape[0]), so the reference
    # gradients are rescaled by the same factor before comparison.
    utt.assert_allclose(expected_grads / cost.shape[0], grad)
    utt.assert_allclose(expected_costs, cost)
    self.check_grads_disabled(t_activations, t_labels, t_activation_times)
def check_grads_disabled(self, activations, labels, input_length):
    """
    Check if optimization to disable gradients is working.

    Compiles a graph that uses only the CTC cost (no gradient), and
    asserts that every CTC node in the optimized graph has gradient
    computation turned off.
    """
    ctc_cost = ctc(activations, labels, input_length)
    ctc_function = theano.function([], [ctc_cost])
    for node in ctc_function.maker.fgraph.apply_nodes:
        if isinstance(node.op, ConnectionistTemporalClassification):
            # No gradient was requested, so the op must not compute one.
            assert (node.op.compute_grad is False)
# Test obtained from Torch tutorial at: # Test obtained from Torch tutorial at:
# https://github.com/baidu-research/warp-ctc/blob/master/torch_binding/TUTORIAL.md # https://github.com/baidu-research/warp-ctc/blob/master/torch_binding/TUTORIAL.md
def test_torch_case(self):
# Layout, from slowest to fastest changing dimension, is (time, batchSize, inputLayerSize) # Layout, from slowest to fastest changing dimension, is (time, batchSize, inputLayerSize)
activations = np.asarray([[[0, 0, 0, 0, 0], [1, 2, 3, 4, 5], [-5, -4, -3, -2, -1]], activations = np.asarray([[[0, 0, 0, 0, 0], [1, 2, 3, 4, 5], [-5, -4, -3, -2, -1]],
[[0, 0, 0, 0, 0], [6, 7, 8, 9, 10], [-10, -9, -8, -7, -6]], [[0, 0, 0, 0, 0], [6, 7, 8, 9, 10], [-10, -9, -8, -7, -6]],
...@@ -79,9 +39,10 @@ class TestCTC(unittest.TestCase): ...@@ -79,9 +39,10 @@ class TestCTC(unittest.TestCase):
[-0.02115798369, 0.03168492019, 0.08612854034, -0.7330639958, 0.636408627]]] [-0.02115798369, 0.03168492019, 0.08612854034, -0.7330639958, 0.636408627]]]
expected_gradients = np.asarray(grads, dtype=np.float32) expected_gradients = np.asarray(grads, dtype=np.float32)
self.run_ctc(activations, labels, activation_times, expected_costs, expected_gradients) return [activations, labels, activation_times, expected_costs, expected_gradients]
def test_ctc(self):
def setup_ctc_case():
activations = np.asarray([[[0.1, 0.6, 0.1, 0.1, 0.1], [0.1, 0.1, 0.6, 0.1, 0.1]], activations = np.asarray([[[0.1, 0.6, 0.1, 0.1, 0.1], [0.1, 0.1, 0.6, 0.1, 0.1]],
[[0.6, 0.1, 0.1, 0.1, 0.1], [0.1, 0.1, 0.5, 0.2, 0.1]]], [[0.6, 0.1, 0.1, 0.1, 0.1], [0.1, 0.1, 0.5, 0.2, 0.1]]],
dtype=np.float32) dtype=np.float32)
...@@ -99,7 +60,69 @@ class TestCTC(unittest.TestCase): ...@@ -99,7 +60,69 @@ class TestCTC(unittest.TestCase):
expected_gradients = np.asarray(grads, dtype=np.float32) expected_gradients = np.asarray(grads, dtype=np.float32)
self.run_ctc(activations, labels, activation_times, expected_costs, expected_gradients) return [activations, labels, activation_times, expected_costs, expected_gradients]
def setup_grad_case():
    """
    Build a small fixture shared by the CPU and GPU gradient-verification
    tests.

    Returns a list ``[activations, activation_times, labels]``:
      * activations: float32 array, layout (time=2, batch=2, classes=5)
      * activation_times: int32 array with the duration of each sequence
      * labels: int32 label matrix, one row per batch entry

    NOTE: both visible call sites unpack this as
    ``activations, activation_times, labels = setup_grad_case()``; the
    previous version returned labels before activation_times, silently
    swapping the two arrays at every caller. The order below matches the
    callers.
    """
    activations = np.asarray([[[0.1, 0.6, 0.1, 0.1, 0.1], [0.1, 0.1, 0.6, 0.1, 0.1]],
                              [[0.6, 0.1, 0.1, 0.1, 0.1], [0.1, 0.1, 0.5, 0.2, 0.1]]],
                             dtype=np.float32)
    # Duration of each sequence in the batch
    activation_times = np.asarray([2, 2], dtype=np.int32)
    # Label sequence for each batch entry
    labels = np.asarray([[1, 2], [1, 2]], dtype=np.int32)
    return [activations, activation_times, labels]
class TestCTC(unittest.TestCase):
"""
Test Baidu CTC wrapper implementation.
Expected values for costs and gradients are obtained through an external
C implementation, that uses the library directly.
"""
def setUp(self):
    # The CTC op is only usable when the optional warp-ctc library is
    # installed; otherwise skip the whole test case.
    if ctc_available():
        return
    self.skipTest('Optional library warp-ctc not available')
def run_ctc(self, activations, labels, input_length, expected_costs, expected_grads):
    """
    Compile and run a CTC graph on the given inputs, comparing the
    resulting costs and gradients with the expected reference values,
    then verify the gradient-disabling optimization.
    """
    # Wrap the numeric inputs in shared variables.
    acts = theano.shared(activations, name="activations")
    times = theano.shared(input_length, name="activation_times")
    lbls = theano.shared(labels, name="labels")
    cost = ctc(acts, lbls, times)
    # Gradient of the mean CTC cost with respect to the activations.
    grad = T.grad(T.mean(cost), acts)
    # Compile and evaluate both outputs in a single function call.
    cost_val, grad_val = theano.function([], [cost, grad])()
    # T.mean scales the gradient by 1/batch, so rescale the reference
    # gradients by the batch size before comparing.
    utt.assert_allclose(expected_grads / cost_val.shape[0], grad_val)
    utt.assert_allclose(expected_costs, cost_val)
    self.check_grads_disabled(acts, lbls, times)
def check_grads_disabled(self, activations, labels, input_length):
    """
    Check if optimization to disable gradients is working.

    Compiles a cost-only graph and asserts that each CTC node in the
    optimized graph has gradient computation switched off.
    """
    fn = theano.function([], [ctc(activations, labels, input_length)])
    ctc_nodes = [node for node in fn.maker.fgraph.apply_nodes
                 if isinstance(node.op, ConnectionistTemporalClassification)]
    for node in ctc_nodes:
        assert node.op.compute_grad is False
def test_torch_case(self):
    # Reference values come from the warp-ctc Torch tutorial; the fixture
    # returns (activations, labels, input_length, costs, grads) in the
    # exact order run_ctc expects.
    self.run_ctc(*setup_torch_case())
def test_ctc(self):
    # The shared fixture returns arguments in run_ctc's parameter order,
    # so they can be forwarded directly.
    self.run_ctc(*setup_ctc_case())
def test_verify_grad(self): def test_verify_grad(self):
def ctc_op_functor(labels, in_lengths): def ctc_op_functor(labels, in_lengths):
...@@ -110,13 +133,7 @@ class TestCTC(unittest.TestCase): ...@@ -110,13 +133,7 @@ class TestCTC(unittest.TestCase):
return ctc(acts, t_labels, t_activation_times) return ctc(acts, t_labels, t_activation_times)
return wrapper return wrapper
activations = np.asarray([[[0.1, 0.6, 0.1, 0.1, 0.1], [0.1, 0.1, 0.6, 0.1, 0.1]], activations, activation_times, labels = setup_grad_case()
[[0.6, 0.1, 0.1, 0.1, 0.1], [0.1, 0.1, 0.5, 0.2, 0.1]]],
dtype=np.float32)
activation_times = np.asarray([2, 2], dtype=np.int32)
labels = np.asarray([[1, 2], [1, 2]], dtype=np.int32)
ctc_op = ctc_op_functor(labels, activation_times) ctc_op = ctc_op_functor(labels, activation_times)
......
Markdown 格式
0%
您添加了 0 到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 后发表评论