Merge pull request #19 from nouiz/abergeron-cudnn_r2_alg

Fix cudnn crash with v1

Merge pull request #19 from nouiz/abergeron-cudnn_r2_alg
009733e0 · abergeron · 1d074416 · 105aff7c · 009733e0 · 009733e0
--- a/theano/sandbox/cuda/cudnn_helper.h
+++ b/theano/sandbox/cuda/cudnn_helper.h
@@ -73,6 +73,20 @@ cudnnGetConvolutionForwardAlgorithm(
  return CUDNN_STATUS_SUCCESS;
 }

+static inline cudnnStatus_t
+cudnnGetConvolutionForwardWorkspaceSize(  /* stub: always reports a zero-byte workspace */
+ cudnnHandle_t handle,
+ const cudnnTensorDescriptor_t srcDesc,
+ const cudnnFilterDescriptor_t filterDesc,
+ const cudnnConvolutionDescriptor_t convDesc,
+ const cudnnTensor4dDescriptor_t destDesc,  /* NOTE(review): srcDesc is declared as cudnnTensorDescriptor_t; confirm both type names are defined in this header */
+ cudnnConvolutionFwdAlgo_t algo,
+ size_t *sizeInBytes) {  /* out parameter: written unconditionally, so it must be non-NULL */
+  *sizeInBytes = 0;  /* handle, descriptors and algo are accepted but never consulted */
+  return CUDNN_STATUS_SUCCESS;  /* there is no failure path in this stub */
+}
+
+
 static inline cudnnStatus_t
 cudnnConvolutionForward_v2(
  cudnnHandle_t handle,

--- a/theano/sandbox/cuda/dnn.py
+++ b/theano/sandbox/cuda/dnn.py
@@ -362,6 +362,8 @@ class GpuDnnConv(DnnBase, COp):
            self.workmem = 'small'

    def get_op_params(self):
+        if version() == -1:
+            return [('CONV_ALGO', "0")]
        if self.workmem == 'none':
            alg = 'CUDNN_CONVOLUTION_FWD_ALGO_IMPLICIT_GEMM'
        elif self.workmem == 'small':