提交 b602f833 authored 作者: Frédéric Bastien's avatar Frédéric Bastien 提交者: GitHub

Merge pull request #6413 from ReyhaneAskari/gpu_stack_follow_up

Gpu stack follow up
......@@ -962,18 +962,19 @@ def local_gpu_pdbbreakpoint_op(node):
return False
# Apply the op on the new inputs
new_op_outputs = node.op(*new_inputs, return_list=True)
# Propagate the transfer to the gpu through the outputs that require
# it
new_outputs = []
for i in range(len(new_op_outputs)):
if input_transfered[i]:
new_outputs.append(new_op_outputs[i].transfer('cpu'))
else:
new_outputs.append(new_op_outputs[i])
with inherit_stack_trace(node.outputs):
new_op_outputs = node.op(*new_inputs, return_list=True)
# Propagate the transfer to the gpu through the outputs that require
# it
new_outputs = []
for i in range(len(new_op_outputs)):
if input_transfered[i]:
new_outputs.append(new_op_outputs[i].transfer('cpu'))
else:
new_outputs.append(new_op_outputs[i])
return new_outputs
return new_outputs
return False
......@@ -2407,8 +2408,8 @@ def local_gpu_elemwise_careduce(node):
inp = node.inputs[0].owner.inputs[0]
props = node.op._props_dict()
props["pre_scalar_op"] = scalar.basic.sqr
out = GpuCAReduceCuda(**props)(inp)
with inherit_stack_trace(node.outputs):
out = GpuCAReduceCuda(**props)(inp)
return [out]
......
......@@ -40,11 +40,9 @@ def _check_stack_trace(thing):
theano.tensor.elemwise.Elemwise,
theano.ifelse.IfElse,
GpuFromHost, HostFromGpu,
GpuCAReduceCuda,
basic_ops.GpuContiguous,
GpuElemwise,
theano.printing.Print,
PdbBreakpoint,
))
return check_stack_trace(thing, ops_to_check=_ops_to_check,
bug_print="ignore")
......
Markdown 格式
0%
您在此讨论中提及了 0 人。请谨慎行事。
请先完成此评论的编辑!
请先注册或者登录后发表评论