提交 d3b6bec3 authored 作者: Frederic's avatar Frederic

Added some check_blas.py GPU timing.

上级 3307db09
...@@ -67,10 +67,9 @@ def execute(execute=True, verbose=True, M=2000, N=2000, K=2000, ...@@ -67,10 +67,9 @@ def execute(execute=True, verbose=True, M=2000, N=2000, K=2000,
order=order)) order=order))
c = theano.shared(numpy.ones((M, K), dtype=theano.config.floatX, c = theano.shared(numpy.ones((M, K), dtype=theano.config.floatX,
order=order)) order=order))
f = theano.function([], updates={c: 0.4 * c + .8 * T.dot(a, b)}, f = theano.function([], updates=[(c, 0.4 * c + .8 * T.dot(a, b))],
mode=theano.compile.ProfileMode()) mode=theano.compile.ProfileMode())
if any([x.op.__class__.__name__ == 'Gemm' for x in if any([x.op.__class__.__name__ == 'Gemm' for x in
f.maker.fgraph.toposort()]): f.maker.fgraph.toposort()]):
c_impl = f.profile.apply_cimpl.values() c_impl = f.profile.apply_cimpl.values()
...@@ -206,6 +205,8 @@ if __name__ == "__main__": ...@@ -206,6 +205,8 @@ if __name__ == "__main__":
GTX470/4.2 0.238s GTX470/4.2 0.238s
C2075/4.2 0.25s C2075/4.2 0.25s
GTX285/4.2 0.452s #cuda 3.0 seam faster? driver version? GTX285/4.2 0.452s #cuda 3.0 seam faster? driver version?
GT520/4.2 2.68s
GTX560/4.2 0.30s
GTX460/4.0 0.45s GTX460/4.0 0.45s
......
Markdown 格式
0%
您将添加 0 人到此讨论。请谨慎行事。
请先完成此评论的编辑!
请 注册 或者 登录 后发表评论