提交 217b616b 作者: Arnaud Bergeron

Fix small nits introduced by the merge.

上级 b3f66f86
...@@ -143,7 +143,8 @@ def local_inplace_gpuagemm(node): ...@@ -143,7 +143,8 @@ def local_inplace_gpuagemm(node):
return [gpugemm_inplace(*node.inputs)] return [gpugemm_inplace(*node.inputs)]
gpuablas_opt_inplace = in2out(LocalOptGroup( gpuablas_opt_inplace = in2out(LocalOptGroup(
local_inplace_gpuagemv, local_inplace_gpuagemm)) local_inplace_gpuagemv, local_inplace_gpuagemm),
name='gpuablas_opt_inplace')
optdb.register('InplaceGpuaBlasOpt', optdb.register('InplaceGpuaBlasOpt',
gpuablas_opt_inplace, gpuablas_opt_inplace,
70.0, 'fast_run', 'inplace', 'gpuarray') 70.0, 'fast_run', 'inplace', 'gpuarray')
...@@ -234,7 +234,7 @@ class GpuDimShuffle(HideC, DimShuffle): ...@@ -234,7 +234,7 @@ class GpuDimShuffle(HideC, DimShuffle):
tmp = pygpu_transpose(a, %(name)s_ax); tmp = pygpu_transpose(a, %(name)s_ax);
if (!tmp) return NULL; if (!tmp) return NULL;
%(copy_shape)s %(copy_shape)s
res = pygpu_reshape(tmp, %(nd_out)s, sh, GA_ANY_ORDER, 1); res = pygpu_reshape(tmp, %(nd_out)s, sh, GA_ANY_ORDER, 1, -1);
Py_DECREF(tmp); Py_DECREF(tmp);
return res; return res;
} }
......
...@@ -221,6 +221,11 @@ def local_gpua_careduce(node): ...@@ -221,6 +221,11 @@ def local_gpua_careduce(node):
def local_gpua_gemv(node): def local_gpua_gemv(node):
return GpuGemv(inplace=node.op.inplace) return GpuGemv(inplace=node.op.inplace)
@register_opt()
@op_lifter(tensor.blas_c.CGemv)
def local_gpua_gemv2(node):
return GpuGemv(inplace=node.op.inplace)
@register_opt() @register_opt()
@op_lifter(tensor.blas.Gemm) @op_lifter(tensor.blas.Gemm)
def local_gpua_gemm(node): def local_gpua_gemm(node):
......
Markdown 格式
0%
您即将添加 0 人到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 登录 后发表评论