Regroup optimizations and add an error for ConvOp.

830e5c51 · Arnaud Bergeron · Pascal Lamblin · 25bce5d7 · 830e5c51 · 830e5c51
--- a/theano/sandbox/gpuarray/opt.py
+++ b/theano/sandbox/gpuarray/opt.py
@@ -780,36 +780,37 @@ def local_assert(node, context_name):
                                      *node.inputs[1:]))]
-# These two deal with any abstract convs that have a transfer somewhere
+@register_opt('fast_compile')
-@register_opt()
+@op_lifter([ConvOp])
-@op_lifter([AbstractConv2d])
+def local_error_convop(node, context_name):  # raise (not assert): survives -O
-def local_lift_abstractconv2d(node, context_name):
+    raise AssertionError("""
-    return [node.op(as_gpuarray_variable(node.inputs[0],
+ConvOp does not work with the gpuarray backend.
-                                         context_name=context_name),
-                    as_gpuarray_variable(node.inputs[0],
-                                         context_name=context_name))]
+Use the new convolution interface to have GPU convolution working:
+theano.tensor.nnet.abstract_conv2d.conv2d()
+""")
-@register_opt()
+# This deals with any abstract convs that have a transfer somewhere
-@op_lifter([AbstractConv2d_gradWeights,
+@register_opt('fast_compile')
+@op_lifter([AbstractConv2d,
+            AbstractConv2d_gradWeights,
            AbstractConv2d_gradInputs])
-def local_lift_abstractconv2dgrad(node, context_name):
+def local_lift_abstractconv2d(node, context_name):
-    return [node.op(as_gpuarray_variable(node.inputs[0],
+    inps = list(node.inputs)
-                                         context_name=context_name),
+    inps[0] = as_gpuarray_variable(node.inputs[0],
-                    as_gpuarray_variable(node.inputs[0],
+                                   context_name=context_name)
-                                         context_name=context_name),
+    inps[1] = as_gpuarray_variable(node.inputs[1],
-                    node.inputs[2])]
+                                   context_name=context_name)
+    return [node.op(*inps)]
-# Register this here so that it goes after the abstract lifting
-register_opt()(conv_groupopt)
 # This will deal with ops that don't have an explicit transfer but
 # have one of their inputs on the GPU already and the other not on the
 # GPU (to avoid endlessly replacing things).
-@register_opt()
+@register_opt('fast_compile')
-@local_optimizer([AbstractConv2d])
+@local_optimizer([AbstractConv2d,
+                  AbstractConv2d_gradWeights,
+                  AbstractConv2d_gradInputs])
 def local_gpu_abstractconv2d(node):
    if isinstance(node.op, BaseAbstractConv2d):
        if ((isinstance(node.inputs[0].type, GpuArrayType) or
@@ -822,6 +823,9 @@ def local_gpu_abstractconv2d(node):
            inps[1] = as_gpuarray_variable(inps[1], context_name=ctx_name)
            return as_tensor_variable(node.op(*inps))
+# Register this here so that it goes after the abstract lifting
+register_opt()(conv_groupopt)
 @register_opt("low_memory")
 @local_optimizer([GpuCAReduceCuda])

--- a/theano/sandbox/gpuarray/tests/test_opt.py
+++ b/theano/sandbox/gpuarray/tests/test_opt.py
@@ -31,7 +31,7 @@ def test_local_remove_all_assert():
    a = theano.tensor.opt.assert_op(x, theano.tensor.eq(x, 0).any())
    # By default `unsafe` should not be there
-    f = theano.function([x], a, mode=mode_with_gpu)
+    f = theano.function([x], a, mode=mode_with_gpu.excluding('unsafe'))
    topo = f.maker.fgraph.toposort()
    a_op = [n for n in topo if isinstance(n.op, theano.tensor.opt.Assert)]
    assert len(a_op) == 1