提交 4d641a3e 作者: Frederic Bastien

Fix crashes probably due to nvcc not handling unsigned int as we expect

上级 d878af4f
...@@ -1831,7 +1831,7 @@ class GpuCAReduce(GpuOp): ...@@ -1831,7 +1831,7 @@ class GpuCAReduce(GpuOp):
""" % locals(), file=sio) """ % locals(), file=sio)
def c_code_cache_version_apply(self, node): def c_code_cache_version_apply(self, node):
version = [14] # the version corresponding to the c code in this Op version = [15] # the version corresponding to the c code in this Op
# now we insert versions for the ops on which we depend... # now we insert versions for the ops on which we depend...
scalar_node = Apply(self.scalar_op, scalar_node = Apply(self.scalar_op,
...@@ -2163,7 +2163,7 @@ class GpuCAReduce(GpuOp): ...@@ -2163,7 +2163,7 @@ class GpuCAReduce(GpuOp):
# memory (a segment of a column). # memory (a segment of a column).
reducebuf = self._k_reduce_buf('Z[blockIdx.x * sZ0]', node, nodename, sub={}) reducebuf = self._k_reduce_buf('Z[blockIdx.x * sZ0]', node, nodename, sub={})
reduce_fct = self._assign_reduce(node, nodename, "myresult", reduce_fct = self._assign_reduce(node, nodename, "myresult",
"A[i0 * sA0 + i1 * sA1 + blockIdx.x * sA2]", "A[i0 * sA0 + i1 * sA1 + ((int)blockIdx.x) * sA2]",
{}, True) {}, True)
reduce_init = self._assign_init("A[blockIdx.x * sA2]") reduce_init = self._assign_init("A[blockIdx.x * sA2]")
print(""" print("""
......
Markdown 格式
0%
您添加了 0 人到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 登录 后发表评论