Unverified commit 99bb8083, authored by Brandon T. Willard, committed by GitHub

Merge pull request #154 from brandonwillard/misc-fixes

Misc. Dot test and interface fixes
...@@ -71,6 +71,7 @@ from tests.tensor.utils import ( ...@@ -71,6 +71,7 @@ from tests.tensor.utils import (
from theano import change_flags, compile, config, function, gof, shared from theano import change_flags, compile, config, function, gof, shared
from theano.compile import DeepCopyOp from theano.compile import DeepCopyOp
from theano.compile.mode import get_default_mode from theano.compile.mode import get_default_mode
from theano.gof.graph import Variable
from theano.scalar import autocast_float, autocast_float_as from theano.scalar import autocast_float, autocast_float_as
from theano.tensor import ( from theano.tensor import (
Alloc, Alloc,
...@@ -704,8 +705,8 @@ TestConjBroadcast = makeBroadcastTester( ...@@ -704,8 +705,8 @@ TestConjBroadcast = makeBroadcastTester(
) )
TestDot = makeTester( TestDenseDot = makeTester(
name="DotTester", name="DenseDotTester",
op=dense_dot, op=dense_dot,
expected=lambda x, y: np.dot(x, y), expected=lambda x, y: np.dot(x, y),
checks={}, checks={},
...@@ -3646,24 +3647,20 @@ class TestMatinv: ...@@ -3646,24 +3647,20 @@ class TestMatinv:
assert_almost_equal(ssd, myssd) assert_almost_equal(ssd, myssd)
def test_dot_numpy_inputs():
    """Check that `theano.tensor.dot` accepts raw NumPy arrays.

    The interface function should wrap NumPy inputs as symbolic variables
    and return a `Variable` produced by a `Dot` `Op`.
    """
    x_val = np.ones(2)
    y_val = np.ones(2)
    result = tt.dot(x_val, y_val)
    assert isinstance(result, Variable)
    assert isinstance(result.owner.op, Dot)
class TestDot: class TestDot:
def setup_method(self): def setup_method(self):
utt.seed_rng() utt.seed_rng()
def cmp_dot(self, x, y):
    """Check `dense_dot` against `np.dot` on concrete inputs.

    `x` and `y` are NumPy arrays or Python scalars.  The NumPy result is
    the reference; the Theano graph result must match its dtype, shape,
    and values (to a loose tolerance).
    """
    # NOTE: the original version defined an inner helper `spec(x)` that
    # was never called; it has been removed as dead code.
    nz = np.dot(x, y)
    tz = eval_outputs([dense_dot(as_tensor_variable(x), as_tensor_variable(y))])
    assert tz.dtype == nz.dtype, (tz.dtype, tz.dtype.num, nz.dtype, nz.dtype.num)
    assert tz.shape == nz.shape, (tz.shape, nz.shape)
    utt.assert_allclose(nz, tz, rtol=1e-4, atol=1e-4)
def test_Op_dims(self): def test_Op_dims(self):
# _dot is a Dot op instance
_dot = tt.basic._dot _dot = tt.basic._dot
d0 = scalar() d0 = scalar()
d1 = vector() d1 = vector()
...@@ -3699,145 +3696,26 @@ class TestDot: ...@@ -3699,145 +3696,26 @@ class TestDot:
with pytest.raises(TypeError): with pytest.raises(TypeError):
_dot(d3, d3) _dot(d3, d3)
def test_dot_0d_0d(self):
    # 0-d · 0-d (scalar times scalar)
    self.cmp_dot(rand(), rand())
def test_dot_0d_1d(self):
    # 0-d · 1-d: scalar times vector of length 5
    self.cmp_dot(rand(), rand(5))
def test_dot_0d_2d(self):
    # 0-d · 2-d: scalar times (6, 7) matrix
    self.cmp_dot(rand(), rand(6, 7))
def test_dot_0d_3d(self):
    # 0-d · 3-d: scalar times (8, 6, 7) tensor
    self.cmp_dot(rand(), rand(8, 6, 7))
def test_dot_1d_0d(self):
    # 1-d · 0-d: vector of length 5 times scalar
    self.cmp_dot(rand(5), rand())
def test_dot_1d_1d(self):
    # 1-d · 1-d: inner product of two length-5 vectors
    self.cmp_dot(rand(5), rand(5))
def test_dot_1d0_1d0(self):
    # 1-d · 1-d with both vectors empty: shapes (0,) · (0,)
    self.cmp_dot(rand(0), rand(0))
# numpy return matrix not aligned...
def test_dot_1d_1d0(self):
    # Mismatched vector lengths (5,) · (0,): NumPy raises "not aligned"
    with pytest.raises(ValueError):
        self.cmp_dot(rand(5), rand(0))
# numpy return matrix not aligned...
def test_dot_1d0_1d(self):
    # Mismatched vector lengths (0,) · (5,): NumPy raises "not aligned"
    with pytest.raises(ValueError):
        self.cmp_dot(rand(0), rand(5))
def test_dot_1d_2d(self):
    # 1-d · 2-d: (6,) · (6, 7)
    self.cmp_dot(rand(6), rand(6, 7))
def test_dot_1d0_2d(self):
    # Empty contracted dimension: (0,) · (0, 7)
    self.cmp_dot(rand(0), rand(0, 7))
def test_dot_1d_2d0(self):
    # Empty output dimension: (6,) · (6, 0)
    self.cmp_dot(rand(6), rand(6, 0))
def test_dot_1d0_2d0(self):
    # Both dimensions empty: (0,) · (0, 0)
    self.cmp_dot(rand(0), rand(0, 0))
def test_dot_1d_3d(self):
    # 1-d · 3-d: (6,) · (8, 6, 7)
    self.cmp_dot(rand(6), rand(8, 6, 7))
def test_dot_2d_0d(self):
    # 2-d · 0-d: (5, 6) matrix times scalar
    self.cmp_dot(rand(5, 6), rand())
def test_dot_2d_1d(self):
    # 2-d · 1-d: (5, 6) · (6,)
    self.cmp_dot(rand(5, 6), rand(6))
def test_dot_2d0_1d(self):
    # Empty leading dimension: (0, 6) · (6,)
    self.cmp_dot(rand(0, 6), rand(6))
def test_dot_2d_1d0(self):
    # Empty contracted dimension: (5, 0) · (0,)
    self.cmp_dot(rand(5, 0), rand(0))
def test_dot_2d0_1d0(self):
    # All dimensions empty: (0, 0) · (0,)
    self.cmp_dot(rand(0, 0), rand(0))
def test_dot_2d_2d(self):
    # 2-d · 2-d: standard matrix product (5, 6) · (6, 7)
    self.cmp_dot(rand(5, 6), rand(6, 7))
def test_dot_2d0_2d(self):
    # Empty leading dimension: (0, 6) · (6, 7)
    self.cmp_dot(rand(0, 6), rand(6, 7))
def test_dot_2d_2d0(self):
    # Empty trailing dimension: (5, 6) · (6, 0)
    self.cmp_dot(rand(5, 6), rand(6, 0))
def test_dot_2d0_2d0(self):
    # Empty leading and trailing dimensions: (0, 6) · (6, 0)
    self.cmp_dot(rand(0, 6), rand(6, 0))
def test_dot_2d_0_2d(self):
    # Empty contracted dimension: (5, 0) · (0, 7)
    self.cmp_dot(rand(5, 0), rand(0, 7))
def test_dot_2d0_0_2d0(self):
    # NOTE(review): these arguments are identical to `test_dot_2d0_2d0`
    # above; the name suggests an empty contracted dimension (e.g.
    # (0, 0) · (0, 0)) may have been intended — confirm.
    self.cmp_dot(rand(0, 6), rand(6, 0))
def test_dot_2d_3d(self):
    # 2-d · 3-d: (5, 6) · (8, 6, 7)
    self.cmp_dot(rand(5, 6), rand(8, 6, 7))
def test_dot_3d_0d(self):
    # 3-d · 0-d: (4, 5, 6) tensor times scalar
    self.cmp_dot(rand(4, 5, 6), rand())
def test_dot_3d_1d(self):
    # 3-d · 1-d: (4, 5, 6) · (6,)
    self.cmp_dot(rand(4, 5, 6), rand(6))
def test_dot_3d_2d(self):
    # 3-d · 2-d: (4, 5, 6) · (6, 7)
    self.cmp_dot(rand(4, 5, 6), rand(6, 7))
def test_dot_3d_3d(self):
    # 3-d · 3-d: (4, 5, 6) · (8, 6, 7)
    self.cmp_dot(rand(4, 5, 6), rand(8, 6, 7))
def not_aligned(self, x, y):
    """Build `dense_dot(x, y)` and assert evaluating it raises `ValueError`."""
    # Test values are disabled so that graph construction succeeds even
    # though the shapes are incompatible; the error must surface only
    # when the graph is actually evaluated.
    with change_flags(compute_test_value="off"):
        bad_product = dense_dot(x, y)
    with pytest.raises(ValueError):
        eval_outputs([bad_product])
def test_not_aligned(self):
    """Mismatched inner dimensions must raise `ValueError` for every rank pair."""
    shape_pairs = [
        ((5,), (6,)),
        ((5,), (6, 4)),
        ((5,), (6, 4, 7)),
        ((5, 4), (6,)),
        ((5, 4), (6, 7)),
        ((5, 4), (6, 7, 8)),
        ((5, 4, 3), (6,)),
        ((5, 4, 3), (6, 7)),
        ((5, 4, 3), (6, 7, 8)),
    ]
    for x_shape, y_shape in shape_pairs:
        self.not_aligned(rand(*x_shape), rand(*y_shape))
def test_grad(self): def test_grad(self):
utt.verify_grad(dense_dot, [rand(2, 3), rand(3, 2)]) utt.verify_grad(dense_dot, [rand(2, 3), rand(3, 2)])
utt.verify_grad(dense_dot, [rand(2), rand(2, 3)]) utt.verify_grad(dense_dot, [rand(2), rand(2, 3)])
utt.verify_grad(dense_dot, [rand(3, 2), rand(2)]) utt.verify_grad(dense_dot, [rand(3, 2), rand(2)])
utt.verify_grad(dense_dot, [rand(2), rand(2)]) utt.verify_grad(dense_dot, [rand(2), rand(2)])
utt.verify_grad(dense_dot, [rand(), rand(2)]) utt.verify_grad(dense_dot, [rand(), rand()])
utt.verify_grad(dense_dot, [rand(), rand(2, 5)]) # TODO: What about the broadcastable conditions in `Dot.grad`?
utt.verify_grad(dense_dot, [rand(2), rand()])
utt.verify_grad(dense_dot, [rand(2, 5), rand()])
utt.verify_grad(dense_dot, [rand(2, 3, 4), rand(4)])
utt.verify_grad(dense_dot, [rand(3), rand(2, 3, 4)])
utt.verify_grad(dense_dot, [rand(4, 3), rand(2, 3, 4)])
utt.verify_grad(dense_dot, [rand(2, 3, 4), rand(4, 5)])
utt.verify_grad(dense_dot, [rand(2, 3, 4), rand(3, 4, 5)])
@pytest.mark.slow
def test_broadcastable_patterns(self): def test_broadcastable_patterns(self):
# #
# These examples should all work because we broadcastable or # These examples should all work. All dimensions of all results have
# no, all dimensions of all results have size 1. # size 1.
# #
def val_for(r): def val_for(r):
if r.dtype.startswith("complex"): if r.dtype.startswith("complex"):
# We want to test complex at the same time, so we give a value # We want to test complex at the same time, so we give a value
# To the imaginary component. # to the imaginary component.
# This strange way of doing things is the only way that worked # This strange way of doing things is the only way that worked
# on numpy 1.4.1 # on NumPy 1.4.1.
if r.ndim == 0: if r.ndim == 0:
return np.asarray(np.complex(1.1, 2.1), dtype=r.dtype) return np.asarray(np.complex(1.1, 2.1), dtype=r.dtype)
if r.ndim == 1: if r.ndim == 1:
...@@ -3857,7 +3735,7 @@ class TestDot: ...@@ -3857,7 +3735,7 @@ class TestDot:
return np.asarray([1.2], dtype=r.dtype) return np.asarray([1.2], dtype=r.dtype)
elif r.ndim == 2: elif r.ndim == 2:
return np.asarray([[1.3]], dtype=r.dtype) return np.asarray([[1.3]], dtype=r.dtype)
raise ValueError() raise AssertionError()
for dtype0 in ("float32", "float64", "complex64"): for dtype0 in ("float32", "float64", "complex64"):
for dtype1 in ("float32", "complex64", "complex128"): for dtype1 in ("float32", "complex64", "complex128"):
...@@ -3881,15 +3759,7 @@ class TestDot: ...@@ -3881,15 +3759,7 @@ class TestDot:
y = TensorType(dtype=dtype1, broadcastable=bc1)() y = TensorType(dtype=dtype1, broadcastable=bc1)()
z = dense_dot(x, y) z = dense_dot(x, y)
t = TensorType(dtype=dtype0, broadcastable=z.broadcastable)()
rval = z * 3 + 2 * t
f = function([x, y, t], rval)
xval = val_for(x)
yval = val_for(y)
tval = val_for(t)
f(xval, yval, tval) # debugmode checks result
if dtype0.startswith("float") and dtype1.startswith("float"): if dtype0.startswith("float") and dtype1.startswith("float"):
g = grad(z.sum(), x) g = grad(z.sum(), x)
assert g.broadcastable == x.broadcastable assert g.broadcastable == x.broadcastable
......
...@@ -6311,6 +6311,13 @@ def dot(l, r): ...@@ -6311,6 +6311,13 @@ def dot(l, r):
This is designed to work with both sparse and dense tensors types. This is designed to work with both sparse and dense tensors types.
""" """
if not isinstance(l, Variable):
l = as_tensor_variable(l)
if not isinstance(r, Variable):
r = as_tensor_variable(r)
try: try:
res = l.__dot__(r) res = l.__dot__(r)
if res is NotImplemented: if res is NotImplemented:
......
Markdown is supported
0%
You are about to add 0 people to this discussion. Proceed with caution.
Please finish editing this comment first!
Register or sign in to post a comment