提交 3d49e41a authored 作者: James Bergstra's avatar James Bergstra 提交者: Frederic

cuda opts: only replace non-inplace blas ops

上级 645fff27
...@@ -385,9 +385,10 @@ def local_gpu_gemv(node): ...@@ -385,9 +385,10 @@ def local_gpu_gemv(node):
gemv(host_from_gpu) -> host_from_gpu(gpu_gemv) gemv(host_from_gpu) -> host_from_gpu(gpu_gemv)
""" """
gemvs = {tensor.blas.gemv_inplace: gpu_gemv_inplace, gemvs = {
#tensor.blas.gemv_inplace: gpu_gemv_inplace,
tensor.blas.gemv_no_inplace: gpu_gemv_no_inplace, tensor.blas.gemv_no_inplace: gpu_gemv_no_inplace,
tensor.blas_c.CGemv(inplace=True): gpu_gemv_inplace, #tensor.blas_c.CGemv(inplace=True): gpu_gemv_inplace,
tensor.blas_c.CGemv(inplace=False): gpu_gemv_no_inplace, tensor.blas_c.CGemv(inplace=False): gpu_gemv_no_inplace,
} }
if node.op == gpu_from_host: if node.op == gpu_from_host:
...@@ -426,7 +427,7 @@ def local_gpu_ger(node): ...@@ -426,7 +427,7 @@ def local_gpu_ger(node):
""" """
gers = { gers = {
tensor.blas_c.CGer(destructive=True): gpu_ger_inplace, #tensor.blas_c.CGer(destructive=True): gpu_ger_inplace,
tensor.blas_c.CGer(destructive=False): gpu_ger_no_inplace, tensor.blas_c.CGer(destructive=False): gpu_ger_no_inplace,
} }
if node.op == gpu_from_host: if node.op == gpu_from_host:
...@@ -463,7 +464,8 @@ def local_gpu_gemm(node): ...@@ -463,7 +464,8 @@ def local_gpu_gemm(node):
gemm(host_from_gpu) -> host_from_gpu(gpu_gemm) gemm(host_from_gpu) -> host_from_gpu(gpu_gemm)
""" """
gemms = {tensor.blas.gemm_inplace: gpu_gemm_inplace, gemms = {
#tensor.blas.gemm_inplace: gpu_gemm_inplace,
tensor.blas.gemm_no_inplace: gpu_gemm_no_inplace} tensor.blas.gemm_no_inplace: gpu_gemm_no_inplace}
if node.op == gpu_from_host: if node.op == gpu_from_host:
host_input = node.inputs[0] host_input = node.inputs[0]
......
Markdown 格式
0%
您添加了 0 到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 后发表评论