BatchedDot: test and fix grad

ed4e0679 · Tim Cooijmans · e68999e8 · ed4e0679 · ed4e0679
--- a/theano/tensor/basic.py
+++ b/theano/tensor/basic.py
@@ -3449,12 +3449,12 @@ class BatchedDot(Op):
            ygrad = x.dimshuffle(0, 1, 'x') * gz.dimshuffle(0, 'x', 1)
        # x is matrix, y is vector, grad is vector
-        elif xdim == 2 and ydim == 1:
+        elif xdim == 3 and ydim == 2:
            xgrad = gz.dimshuffle(0, 1, 'x') * y.dimshuffle(0, 'x', 1)
            ygrad = batched_dot(x.dimshuffle(0, 2, 1), gz)
        # x is matrix, y is matrix, grad is matrix
-        elif xdim == ydim == 2:
+        elif xdim == ydim == 3:
            xgrad = batched_dot(gz, y.dimshuffle(0, 2, 1))
            ygrad = batched_dot(x.dimshuffle(0, 2, 1), gz)

--- a/theano/tensor/tests/test_basic.py
+++ b/theano/tensor/tests/test_basic.py
@@ -1931,13 +1931,22 @@ DotTester = makeTester(name='DotTester',
                        bad_build=dict(),
                        bad_runtime=dict(bad1=(rand(5, 7), rand(5, 7)),
                                         bad2=(rand(5, 7), rand(8, 3))))
 BatchedDotTester = makeTester(
    name='BatchedDotTester',
    op=batched_dot,
    expected=lambda xs, ys: numpy.asarray(list(
        numpy.dot(x, y) for x, y in zip(xs, ys))),
    checks={},
+    grad=dict(correct1=(rand(3, 5, 7), rand(3, 7, 5)),
+              correct2=(rand(3, 5, 7), rand(3, 7, 9)),
+              correct3=(rand(3, 5, 7), rand(3, 7)),
+              correct4=(rand(3, 5), rand(3, 5, 7)),
+              correct5=(rand(3), rand(3, 5, 7)),
+              correct6=(rand(3, 5), rand(3)),
+              mixed1=(rand(3, 5).astype('float32'),
+                      rand(3, 5, 7)),
+              mixed2=(rand(3, 5).astype('float64'),
+                      rand(3, 5, 7))),
    good=dict(correct1=(rand(3, 5, 7), rand(3, 7, 5)),
              correct2=(rand(3, 5, 7), rand(3, 7, 9)),
              correct3=(rand(3, 5, 7), rand(3, 7)),