Merge pull request #1993 from nouiz/crash_inc_sub_grad

Crash fix in IncSubtensor.grad

Merge pull request #1993 from nouiz/crash_inc_sub_grad
53532957 · abergeron · d19e66d9 · 852114f3 · 53532957 · 53532957
--- a/theano/tensor/subtensor.py
+++ b/theano/tensor/subtensor.py
@@ -594,8 +594,7 @@ class Subtensor(Op):
    @staticmethod
    def helper_c_code(node, name, inputs, outputs, sub, idx_list, view_ndim,
                      c_prefix=None,
-                      strides_mul=None,
+                      strides_mul=None):
-    ):
        """
        The parameters c_prefix are there to allow reusing this
        function on PyArray and CudaNdarray object.
@@ -682,7 +681,8 @@ class Subtensor(Op):
            subensor_spec = "npy_intp * subtensor_spec = NULL;"
        if is_slice:
-            is_slice_init = "int is_slice[] = {" + ",".join([str(s) for s in is_slice]) + "};"
+            is_slice_init = "int is_slice[] = {" + ",".join([str(s) for s in
+                                                             is_slice]) + "};"
        else:
            is_slice_init = "int* is_slice = NULL;"
        subtensor_init = "\n".join(init_cmds)
@@ -897,7 +897,8 @@ class Subtensor(Op):
        %(z)s = xview;
        """ % locals()
-        return decl + checkNDim + "{" + get_xview + build_view + finish_view + "}"
+        return (decl + checkNDim +
+                "{" + get_xview + build_view + finish_view + "}")
    def c_code_cache_version(self):
        hv = self.helper_c_code_cache_version()
@@ -1022,9 +1023,9 @@ def inc_subtensor(x, y, inplace=False, set_instead_of_inc=False,
            destroyhandler_tolerate_aliased = [[0, 1]]
        else:
            destroyhandler_tolerate_aliased = []
-        the_op = IncSubtensor(x.owner.op.idx_list, inplace, set_instead_of_inc,
+        the_op = IncSubtensor(
-                destroyhandler_tolerate_aliased=destroyhandler_tolerate_aliased
+            x.owner.op.idx_list, inplace, set_instead_of_inc,
-                )
+            destroyhandler_tolerate_aliased=destroyhandler_tolerate_aliased)
        real_x = x.owner.inputs[0]
        real_idxargs = x.owner.inputs[1:]
        return the_op(real_x, y, *real_idxargs)
@@ -1105,10 +1106,10 @@ class IncSubtensor(Op):
        self.set_instead_of_inc = set_instead_of_inc
    def __eq__(self, other):
-        return type(self) == type(other) \
+        return (type(self) == type(other) and
-                and self.idx_list == other.idx_list \
+                self.idx_list == other.idx_list and
-                and self.inplace == other.inplace \
+                self.inplace == other.inplace and
-                and self.set_instead_of_inc == other.set_instead_of_inc
+                self.set_instead_of_inc == other.set_instead_of_inc)
    def __hash__(self):
        msg = []
@@ -1120,12 +1121,12 @@ class IncSubtensor(Op):
        idx_list = tuple(msg)
        # backport
-        #idx_list = tuple((entry.start, entry.stop, entry.step)
+        # idx_list = tuple((entry.start, entry.stop, entry.step)
        #                 if isinstance(entry, slice)
        #                 else entry
        #                 for entry in self.idx_list)
-        return hashtype(self) ^ hash(idx_list) ^ hash(self.inplace) \
+        return (hashtype(self) ^ hash(idx_list) ^ hash(self.inplace) ^
-               ^ hash(self.set_instead_of_inc)
+                hash(self.set_instead_of_inc))
    def __str__(self):
        indices = []
@@ -1225,7 +1226,7 @@ class IncSubtensor(Op):
            if not self.set_instead_of_inc:
                sub_x += y
            else:
-                #sub_x += -sub_x + y
+                # sub_x += -sub_x + y
                x.__setitem__(cdata, y)
        else:
            # scalar case
@@ -1295,7 +1296,7 @@ class IncSubtensor(Op):
            ** helper_args
        )
-        #Make a view on the output, as we will write into it.
+        # Make a view on the output, as we will write into it.
        alloc_zview = self.make_view_array(z, view_ndim)
        build_view = """
@@ -1460,7 +1461,8 @@ class IncSubtensor(Op):
            gx = g_output
        gy = Subtensor(idx_list=self.idx_list)(g_output, *idx_list)
        if gy.broadcastable != y.broadcastable:
-            y_broad = (True,) * (gy.ndim - y.ndim) + y.broadcastable
+            y_dim_added = gy.ndim - y.ndim
+            y_broad = (True,) * y_dim_added + y.broadcastable
            assert sum(gy.broadcastable) < sum(y_broad)
            axis_to_sum = []
            for i in range(gy.ndim):
@@ -1468,7 +1470,7 @@ class IncSubtensor(Op):
                    axis_to_sum.append(i)
                elif (gy.broadcastable[i] is True and
                      y_broad[i] is False):
-                    # This mean that THeano where able to infer that
+                    # This mean that Theano where able to infer that
                    # gy.shape[i] is 1, so y.shape[i] is 1, but we
                    # didn't know it. It is fine.
                    pass
@@ -1476,7 +1478,10 @@ class IncSubtensor(Op):
                    assert gy.broadcastable[i] == y_broad[i]
            gy = gy.sum(axis=axis_to_sum, keepdims=True)
            if gy.ndim != y.ndim:
-                gy = gy.dimshuffle(*range(y.ndim, gy.ndim))
+                assert gy.ndim > y.ndim
+                for i in range(y_dim_added):
+                    assert gy.broadcastable[i]
+                gy = gy.dimshuffle(*range(y_dim_added, gy.ndim))
            assert gy.broadcastable == y.broadcastable
        return [gx, gy] + [DisconnectedType()()] * len(idx_list)
@@ -1540,7 +1545,8 @@ class AdvancedSubtensor1(Op):
            if not numpy.can_cast(i.dtype, numpy.intp):
                # Check if there was actually an incorrect conversion
                if numpy.any(i != i_):
-                    raise IndexError('index contains values that are bigger '
+                    raise IndexError(
+                        'index contains values that are bigger '
                        'than the maximum array size on this system.', i)
            i = i_
@@ -1732,7 +1738,8 @@ class AdvancedIncSubtensor1(Op):
                opname = 'set'
            else:
                opname = 'increment'
-            raise TypeError('cannot %s x subtensor with ndim=%s'
+            raise TypeError(
+                'cannot %s x subtensor with ndim=%s'
                ' by y with ndim=%s to x subtensor with ndim=%s ' % (
                    opname, x_.type.ndim, y_.type.ndim))
@@ -1837,7 +1844,7 @@ def adv_index_broadcastable_pattern(a, idx):
    newidx = tuple(map(replace_slice, idx))
-    #2 - True = 1; 2 - False = 2
+    # 2 - True = 1; 2 - False = 2
    fakeshape = [2 - bc for bc in a.broadcastable]
    retshape = numpy.empty(fakeshape)[newidx].shape
    return tuple([dim == 1 for dim in retshape])
@@ -1902,8 +1909,6 @@ class AdvancedSubtensor(Op):
                'are too big (>= 2^32 elements). It is possible that '
                'out[0] (%s), with shape %s, is not correctly filled.'
                % (out[0], out[0].shape))
-        # return
-        #raise NotImplementedError()
    def connection_pattern(self, node):
@@ -1956,7 +1961,8 @@ class AdvancedIncSubtensor(Op):
    def __str__(self):
        return "%s{%s, %s}" % (self.__class__.__name__,
                               "inplace=" + str(self.inplace),
-                " set_instead_of_inc=" + str(self. set_instead_of_inc))
+                               " set_instead_of_inc=" +
+                               str(self. set_instead_of_inc))
    def make_node(self, x, y, *inputs):
        x = theano.tensor.as_tensor_variable(x)
@@ -1999,7 +2005,8 @@ class AdvancedIncSubtensor(Op):
        return gof.Apply(op,
                         (x, y) + inputs,
-                        [theano.tensor.tensor(dtype=x.type.dtype,
+                         [theano.tensor.tensor(
+                             dtype=x.type.dtype,
                             broadcastable=x.type.broadcastable)])
    def perform(self, node, inputs, out_):

--- a/theano/tensor/tests/test_inc_subtensor.py
+++ b/theano/tensor/tests/test_inc_subtensor.py
@@ -100,30 +100,42 @@ class Test_inc_subtensor(unittest.TestCase):
        sl2 = slice(sl2_end)
        sl3 = 2
-        for do_set in [True, False]:
-            print "Set", do_set
-            if do_set:
-                resut = tt.set_subtensor(a[sl1, sl3, sl2], increment)
-            else:
-                resut = tt.inc_subtensor(a[sl1, sl3, sl2], increment)
-            f = theano.function([a, increment, sl2_end], resut)
        val_a = numpy.ones((5, 3, 4))
        val_inc = 2.3
        val_sl2_end = 2
+        for method in [tt.set_subtensor, tt.inc_subtensor]:
+            print "MethodSet", method
+            resut = method(a[sl1, sl3, sl2], increment)
+            f = theano.function([a, increment, sl2_end], resut)
            expected_result = numpy.copy(val_a)
            result = f(val_a, val_inc, val_sl2_end)
-            if do_set:
+            if method is tt.set_subtensor:
                expected_result[:, sl3, :val_sl2_end] = val_inc
            else:
                expected_result[:, sl3, :val_sl2_end] += val_inc
            utt.assert_allclose(result, expected_result)
+            # Test when we broadcast the result
+            resut = method(a[sl1, sl2], increment)
+            f = theano.function([a, increment, sl2_end], resut)
+            expected_result = numpy.copy(val_a)
+            result = f(val_a, val_inc, val_sl2_end)
+            if method is tt.set_subtensor:
+                expected_result[:, :val_sl2_end] = val_inc
+            else:
+                expected_result[:, :val_sl2_end] += val_inc
+            utt.assert_allclose(result, expected_result)
    def test_grad_inc_set(self):
        def inc_slice(*s):
            def just_numeric_args(a, b):
@@ -148,9 +160,14 @@ class Test_inc_subtensor(unittest.TestCase):
                (numpy.asarray([[0, 1], [2, 3], [4, 5.]]),
                 numpy.asarray([[9, 9.]]), ))
-            #single element
+            # single element
            utt.verify_grad(
                f_slice(2, 1),
                (numpy.asarray([[0, 1], [2, 3], [4, 5.]]),
                 numpy.asarray(9.),))
+            # broadcast
+            utt.verify_grad(
+                f_slice(2),
+                (numpy.asarray([[0, 1], [2, 3], [4, 5.]]),
+                 numpy.asarray(9.),))