提交 2b5e9242 作者: James Bergstra

GpuSum - cast template args to int to satisfy compiler

上级 46a0de64
...@@ -901,11 +901,11 @@ class GpuSum(Op): ...@@ -901,11 +901,11 @@ class GpuSum(Op):
int verbose = 0; int verbose = 0;
dim3 n_threads( dim3 n_threads(
std::min(CudaNdarray_HOST_DIMS(%(x)s)[1], std::min(CudaNdarray_HOST_DIMS(%(x)s)[1],
NUM_VECTOR_OP_THREADS_PER_BLOCK)); (int)NUM_VECTOR_OP_THREADS_PER_BLOCK));
dim3 n_blocks(std::min(CudaNdarray_HOST_DIMS(%(x)s)[0], NUM_VECTOR_OP_BLOCKS)); dim3 n_blocks(std::min(CudaNdarray_HOST_DIMS(%(x)s)[0], (int)NUM_VECTOR_OP_BLOCKS));
n_blocks.y = std::min( n_blocks.y = std::min(
CudaNdarray_HOST_DIMS(%(x)s)[2], CudaNdarray_HOST_DIMS(%(x)s)[2],
NUM_VECTOR_OP_BLOCKS / n_blocks.x (int)(NUM_VECTOR_OP_BLOCKS / n_blocks.x)
); );
if (verbose) printf("running kernel_reduce_sum_10_%(name)s\\n"); if (verbose) printf("running kernel_reduce_sum_10_%(name)s\\n");
int n_shared = sizeof(float) * n_threads.x; int n_shared = sizeof(float) * n_threads.x;
......
Markdown 格式
0%
您添加了 0 人到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 登录 后发表评论