提交 74447679 作者: Vivek Kulkarni

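Fixing minor issue on device_malloc: the index buffer is no longer a static pointer allocated only on the first call; it is now allocated on every call and released with device_free before returning.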

上级 dbba32f1
...@@ -1809,11 +1809,8 @@ void CudaNdarray_vector_add_fast(CudaNdarray* py_self, CudaNdarray* py_other, Py ...@@ -1809,11 +1809,8 @@ void CudaNdarray_vector_add_fast(CudaNdarray* py_self, CudaNdarray* py_other, Py
unsigned int num_blocks = size; unsigned int num_blocks = size;
dim3 n_blocks(num_blocks); dim3 n_blocks(num_blocks);
dim3 n_threads(num_threads_per_block); dim3 n_threads(num_threads_per_block);
static long *d_indices_arr = NULL; long *d_indices_arr = NULL;
if (!d_indices_arr)
{
d_indices_arr = (long *)device_malloc(sizeof(long) * PyArray_SIZE(indices_arr)); d_indices_arr = (long *)device_malloc(sizeof(long) * PyArray_SIZE(indices_arr));
}
assert(d_indices_arr); assert(d_indices_arr);
cudaError_t err = cudaMemcpy(d_indices_arr, cudaError_t err = cudaMemcpy(d_indices_arr,
...@@ -1834,6 +1831,7 @@ void CudaNdarray_vector_add_fast(CudaNdarray* py_self, CudaNdarray* py_other, Py ...@@ -1834,6 +1831,7 @@ void CudaNdarray_vector_add_fast(CudaNdarray* py_self, CudaNdarray* py_other, Py
d_indices_arr, d_indices_arr,
PyArray_SIZE(indices_arr) PyArray_SIZE(indices_arr)
); );
device_free(d_indices_arr);
return; return;
} }
......
Markdown 格式
0%
您添加了 0 人到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 登录 后发表评论