Use theano_prep_output to allocate output in spatialtf_grid C implementation

Signed-off-by: João Victor Tozatti Risso <joaovictor.risso@gmail.com>

Use theano_prep_output to allocate output in spatialtf_grid C implementation
3e3b384b · João Victor Tozatti Risso · dedc5aef · 3e3b384b
--- a/theano/gpuarray/c_code/spatialtf_grid.c
+++ b/theano/gpuarray/c_code/spatialtf_grid.c
 #section support_code
-int spatialtf_grid(cudnnSpatialTransformerDescriptor_t desc,
+int
-                   PyGpuArrayObject * theta,
+spatialtf_grid(cudnnSpatialTransformerDescriptor_t desc,
-                   PyArrayObject * dimensions,
+               PyGpuArrayObject * theta,
-                   PyGpuArrayObject ** grid,
+               PyArrayObject * grid_dimensions,
-                   cudnnHandle_t _handle)
+               PyGpuArrayObject ** grid,
+               cudnnHandle_t _handle)
 {
    PyGpuContextObject * gpu_ctx = theta->context;
-    cudnnDataType_t dt;
    cudnnStatus_t err;
-    // Obtain GPU datatype from theta
+    if ( theta->ga.typecode != GA_FLOAT &&
-    switch( theta->ga.typecode )
+         theta->ga.typecode != GA_DOUBLE &&
+         theta->ga.typecode != GA_HALF )
    {
-    case GA_FLOAT:
-        dt = CUDNN_DATA_FLOAT;
-        break;
-    case GA_DOUBLE:
-        dt = CUDNN_DATA_DOUBLE;
-        break;
-    case GA_HALF:
-        dt = CUDNN_DATA_HALF;
-        break;
-    default:
        PyErr_SetString( PyExc_TypeError, "Unsupported data type for theta" );
        return -1;
    }
-    if ( NULL == *grid )
+    if ( PyArray_NDIM( grid_dimensions ) < 4 )
    {
-        // Obtain grid dimensions
+        PyErr_Format( PyExc_RuntimeError,
-        npy_int * dimensions_data = (npy_int *)PyArray_DATA( dimensions );
+                      "Grid dimensions array must have at least 4 dimensions!" );
-        const size_t width = dimensions_data[0];
+        return -1;
-        const size_t height = dimensions_data[1];
+    }
-        const size_t num_images = dimensions_data[3];
-        // Grid of coordinates is of size num_images * height * width * 2 for a 2D transformation
+    // Obtain grid dimensions
-        const size_t grid_dims[4] = { width, height, 2, num_images };
+    npy_int * dimensions_data = (npy_int *)PyArray_DATA( grid_dimensions );
-        *grid = pygpu_empty( 4, &(grid_dims[0]), theta->ga.typecode, GA_C_ORDER,
+    const size_t width = dimensions_data[0];
-            gpu_ctx, Py_None );
+    const size_t height = dimensions_data[1];
+    const size_t num_images = dimensions_data[3];
+    // Grid of coordinates is of size num_images * height * width * 2 for a 2D transformation
+    const size_t grid_dims[4] = { width, height, 2, num_images };
-        if ( NULL == *grid )
+    if ( theano_prep_output( grid, 4, &(grid_dims[0]), theta->ga.typecode,
-        {
+                             GA_C_ORDER, gpu_ctx ) != 0 )
-            PyErr_Format( PyExc_MemoryError,
+    {
-                          "Could not allocate memory for grid coordinates" );
+        PyErr_SetString( PyExc_MemoryError,
-            return 1;
+                         "Could not allocate memory for the grid of coordinates" );
-        }
+        return -1;
    }
    const void * theta_data = PyGpuArray_DEV_DATA( theta );
@@ -58,7 +52,7 @@ int spatialtf_grid(cudnnSpatialTransformerDescriptor_t desc,
        PyErr_Format( PyExc_RuntimeError,
                      "Failed to create grid of coordinates: %s",
                      cudnnGetErrorString( err ) );
-        return 1;
+        return -1;
    }
    return 0;