提交 2b5e9242 作者: James Bergstra

GpuSum - cast template args to int to satisfy compiler

上级 46a0de64
......@@ -901,11 +901,11 @@ class GpuSum(Op):
 int verbose = 0;
 dim3 n_threads(
 std::min(CudaNdarray_HOST_DIMS(%(x)s)[1],
-NUM_VECTOR_OP_THREADS_PER_BLOCK));
-dim3 n_blocks(std::min(CudaNdarray_HOST_DIMS(%(x)s)[0], NUM_VECTOR_OP_BLOCKS));
+(int)NUM_VECTOR_OP_THREADS_PER_BLOCK));
+dim3 n_blocks(std::min(CudaNdarray_HOST_DIMS(%(x)s)[0], (int)NUM_VECTOR_OP_BLOCKS));
 n_blocks.y = std::min(
 CudaNdarray_HOST_DIMS(%(x)s)[2],
-NUM_VECTOR_OP_BLOCKS / n_blocks.x
+(int)(NUM_VECTOR_OP_BLOCKS / n_blocks.x)
 );
 if (verbose) printf("running kernel_reduce_sum_10_%(name)s\\n");
 int n_shared = sizeof(float) * n_threads.x;
......
Markdown 格式
0%
您添加了 0 人到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 登录 后发表评论