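Standardize the return value of `c_set_math_type_for_conv()`: return 0 instead of 1 on the success path, keeping -1 for the error path that callers check.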

6384da8a · notoraptor · c5944c7d · 6384da8a · 6384da8a · 6384da8a
--- a/theano/gpuarray/c_code/dnn_conv_base.c
+++ b/theano/gpuarray/c_code/dnn_conv_base.c
@@ -37,7 +37,7 @@ static int c_set_math_type_for_conv(cudnnConvolutionDescriptor_t desc, cudnnMath
    return -1;
  }
 #endif
-  return 1;
+  return 0;
 }
 #section init_code_struct

--- a/theano/gpuarray/c_code/dnn_fwd.c
+++ b/theano/gpuarray/c_code/dnn_fwd.c
@@ -191,7 +191,7 @@ APPLY_SPECIFIC(conv_fwd)(PyGpuArrayObject *input, PyGpuArrayObject *kerns,
  size_t maxfree = c_get_largest_free_block_size(c);
  if (PyErr_Occurred()) return 1;
  if (params->choose_algo) {
    if (!reuse_algo) {
@@ -286,7 +286,7 @@ APPLY_SPECIFIC(conv_fwd)(PyGpuArrayObject *input, PyGpuArrayObject *kerns,
      }
    }
  }
  if (c_set_math_type_for_conv(desc, mathtype) == -1 ||
      dnn_conv_fwd_fallback(&algo, input, kerns, desc) != 0) {
    cuda_exit(c->ctx);

--- a/theano/gpuarray/c_code/dnn_gi.c
+++ b/theano/gpuarray/c_code/dnn_gi.c
@@ -192,7 +192,7 @@ APPLY_SPECIFIC(conv_gi)(PyGpuArrayObject *kerns, PyGpuArrayObject *output,
        // set the 'tensor math ok' flag
        c_set_math_type_for_conv(desc, CUDNN_TENSOR_OP_MATH);
        tmpmem = gpudata_alloc(c->ctx, maxfree, NULL, 0, NULL);
        if (tmpmem == NULL) {
          PyErr_SetString(PyExc_MemoryError, "Could not allocate working GPU memory");
@@ -251,7 +251,7 @@ APPLY_SPECIFIC(conv_gi)(PyGpuArrayObject *kerns, PyGpuArrayObject *output,
      }
    }
  }
  if (c_set_math_type_for_conv(desc, mathtype) == -1 ||
      dnn_conv_gi_fallback(&algo, *input, kerns, desc) != 0) {
    cuda_exit(c->ctx);
@@ -320,7 +320,7 @@ APPLY_SPECIFIC(conv_gi)(PyGpuArrayObject *kerns, PyGpuArrayObject *output,
  if (params->choose_once) {
    reuse_algo = 1;
  }
  gpudata *workspace = 0;
  if (worksize != 0) {
    workspace = gpudata_alloc(c->ctx, worksize, NULL, 0, NULL);

--- a/theano/gpuarray/c_code/dnn_gw.c
+++ b/theano/gpuarray/c_code/dnn_gw.c
@@ -176,7 +176,7 @@ APPLY_SPECIFIC(conv_gw)(PyGpuArrayObject *input, PyGpuArrayObject *output,
        int count;
        cudnnConvolutionBwdFilterAlgoPerf_t choice;
        gpudata *tmpmem;
        // set the 'tensor math ok' flag
        c_set_math_type_for_conv(desc, CUDNN_TENSOR_OP_MATH);
@@ -241,7 +241,7 @@ APPLY_SPECIFIC(conv_gw)(PyGpuArrayObject *input, PyGpuArrayObject *output,
      }
    }
  } /* choose_algo */
  if (c_set_math_type_for_conv(desc, mathtype) == -1 ||
      dnn_conv_gw_fallback(&algo, input, *kerns, desc) != 0) {
    cuda_exit(c->ctx);
@@ -310,9 +310,9 @@ APPLY_SPECIFIC(conv_gw)(PyGpuArrayObject *input, PyGpuArrayObject *output,
  if (params->choose_once) {
    reuse_algo = 1;
  }
  gpudata *workspace = 0;
  if (worksize != 0) {
    workspace = gpudata_alloc(c->ctx, worksize, NULL, 0, NULL);
    if (workspace == NULL) {