testgroup / pytensor · Commits

Commit 186b90a0
Authored Mar 15, 2016 by Chiheb Trabelsi
test_blas.py has been modified in order to respect the flake8 style.
Parent: 155c4e01

Showing 1 changed file with 129 additions and 119 deletions:
theano/sandbox/cuda/tests/test_blas.py (+129 −119)
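The changes below are mechanical style cleanups, not behavioural ones. To make the pattern easy to follow before reading the diff, here is a minimal self-contained sketch (illustrative shapes and a stand-in flag, not copied verbatim from the file) of the recurring flake8 fixes this commit applies: whitespace after commas in subscripts and around operators (E231/E226), identity comparison with False instead of `==` (E712), and long call expressions wrapped across lines (E501):

import numpy

a = numpy.random.randn(5, 4, 3).astype(numpy.float32)
b = numpy.random.randn(5, 3, 2).astype(numpy.float32)

# Before: z_test = numpy.sum(a[:,:,:,None]*b[:,None,:,:], axis=-2)
# flake8 flags the missing whitespace (E231/E226); the fixed form is:
z_test = numpy.sum(a[:, :, :, None] * b[:, None, :, :], axis=-2)

# Before: if cuda_available == False:
# flake8 flags comparison to False (E712); the fixed form is:
cuda_available = False  # stand-in flag, purely for illustration
if cuda_available is False:
    print('Optional package cuda disabled')

The full diff follows.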
@@ -8,31 +8,31 @@ from theano import tensor
 from theano.tests import unittest_tools
 import numpy
-# Skip test if cuda_ndarray is not available.
-from nose.plugins.skip import SkipTest
-import theano.sandbox.cuda as cuda_ndarray
-if cuda_ndarray.cuda_available == False:
-    raise SkipTest('Optional package cuda disabled')
 import theano.sandbox.cuda as tcn
-from theano.tensor.signal.pool import (Pool, PoolGrad,
-                                       DownsampleFactorMaxGradGrad)
 import theano.compile.mode
 from theano.tensor.tests.test_blas import BaseGemv, TestBlasStrides, TestGer
 from theano.sandbox.cuda.blas import gpu_gemv_no_inplace, gpu_gemv_inplace
 from theano.sandbox.cuda.blas import gpu_ger_inplace, gpu_ger_no_inplace
 from theano.sandbox.cuda.blas import batched_dot, GpuBatchedDot
+from theano.tensor.signal.pool import (Pool, PoolGrad,
+                                       DownsampleFactorMaxGradGrad)
+
+# Skip test if cuda_ndarray is not available.
+from nose.plugins.skip import SkipTest
+import theano.sandbox.cuda as cuda_ndarray
+if cuda_ndarray.cuda_available is False:
+    raise SkipTest('Optional package cuda disabled')
 
 if theano.config.mode == 'FAST_COMPILE':
     mode_with_gpu = theano.compile.mode.get_mode('FAST_RUN').including('gpu')
     mode_without_gpu = theano.compile.mode.get_mode(
         'FAST_RUN').excluding('gpu')
 else:
-    mode_with_gpu = theano.compile.mode.get_default_mode().including('gpu')
-    mode_without_gpu = theano.compile.mode.get_default_mode().excluding('gpu')
+    mode_with_gpu = theano.compile.mode.get_default_mode(
+        ).including('gpu')
+    mode_without_gpu = theano.compile.mode.get_default_mode(
+        ).excluding('gpu')
 
 # The CPU tests already compare C/Py, so we only check C/GPU
 mode_with_gpu = copy.copy(mode_with_gpu)
@@ -55,73 +55,81 @@ class TestBatchedDot(unittest_tools.InferShapeTester):
         def cmp(a_shp, b_shp):
             a = numpy.random.randn(*a_shp).astype(numpy.float32)
             b = numpy.random.randn(*b_shp).astype(numpy.float32)
             x = tensor.ftensor3()
             y = tensor.ftensor3()
             f = theano.function([x, y], batched_dot(x, y),
                                 mode=mode_with_gpu)
             z0 = numpy.asarray(f(a, b))
 
             ga = cuda_ndarray.CudaNdarray(a)
             gb = cuda_ndarray.CudaNdarray(b)
 
             z1 = numpy.asarray(f(ga, gb))
 
-            z_test = numpy.sum(a[:,:,:,None]*b[:,None,:,:], axis=-2)
+            z_test = numpy.sum(a[:, :, :, None] * b[:, None, :, :],
+                               axis=-2)
 
             unittest_tools.assert_allclose(z0, z_test)
             unittest_tools.assert_allclose(z1, z_test)
 
         cmp((5, 4, 3), (5, 3, 2))
         cmp((5, 3, 3), (5, 3, 3))
         cmp((5, 2, 6), (5, 6, 3))
 
         # Test dimensions of 0
         cmp((0, 2, 6), (0, 6, 3))
         cmp((5, 0, 3), (5, 3, 2))
         cmp((5, 4, 0), (5, 0, 2))
         cmp((5, 4, 3), (5, 3, 0))
         cmp((0, 0, 0), (0, 0, 0))
 
         # Test dimensions of 1
         cmp((1, 2, 6), (1, 6, 3))
         cmp((5, 1, 3), (5, 3, 2))
         cmp((5, 4, 1), (5, 1, 2))
         cmp((5, 4, 3), (5, 3, 1))
 
     def test_batched_dot_errors(self):
 
         def fail(a_shp, b_shp):
             a = numpy.random.randn(*a_shp).astype(numpy.float32)
             b = numpy.random.randn(*b_shp).astype(numpy.float32)
             x = tensor.ftensor3()
             y = tensor.ftensor3()
             f = theano.function([x, y], batched_dot(x, y),
                                 mode=mode_with_gpu)
-            z = f(a, b)
+            f(a, b)
 
         # Different batch size
         self.assertRaises(RuntimeError, fail, (5, 4, 3), (6, 3, 2))
         # Shape mismatch
         self.assertRaises(RuntimeError, fail, (5, 4, 3), (5, 2, 2))
 
     def test_batched_dot_gradient(self):
-        unittest_tools.verify_grad(
-            batched_dot,
-            [numpy.random.randn(5, 7, 2).astype(numpy.float32),
-             numpy.random.randn(5, 2, 6).astype(numpy.float32)],
-            mode=mode_with_gpu)
+        for threshold in [0, 100]:
+            unittest_tools.verify_grad(
+                GpuBatchedDot(stream_threshold=threshold),
+                [numpy.random.randn(5, 7, 2).astype(numpy.float32),
+                 numpy.random.randn(5, 2, 6).astype(numpy.float32)],
+                mode=mode_with_gpu)
 
     def test_infer_shape(self):
         # only matrix / matrix is supported
         admat = tensor.ftensor3()
         bdmat = tensor.ftensor3()
         admat_val = my_rand(7, 4, 5)
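A side note on the oracle used in `cmp` above: the `z_test` line computes the batched product with NumPy broadcasting rather than a Python loop over `numpy.dot`. A short self-contained sketch (illustrative shapes, assuming only NumPy) of why the two agree:

import numpy

a = numpy.random.randn(5, 4, 3).astype(numpy.float32)  # (batch, i, k)
b = numpy.random.randn(5, 3, 2).astype(numpy.float32)  # (batch, k, j)

# a[:, :, :, None] broadcasts to (5, 4, 3, 1) and b[:, None, :, :] to
# (5, 1, 3, 2); their product has shape (5, 4, 3, 2), and summing out
# the shared k axis (axis=-2) leaves the batched-dot result (5, 4, 2).
z_broadcast = numpy.sum(a[:, :, :, None] * b[:, None, :, :], axis=-2)
z_loop = numpy.array([numpy.dot(a[n], b[n]) for n in range(len(a))])
assert numpy.allclose(z_broadcast, z_loop, atol=1e-5)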
@@ -134,24 +142,23 @@ class TestBatchedDot(unittest_tools.InferShapeTester):
 
 def test_dot22():
     def cmp(a_shp, b_shp):
         a0 = my_rand(*a_shp)
         a = tcn.shared_constructor(a0, 'a')
         b = tensor.fmatrix()
         f = pfunc([b], [], updates=[(a, tensor.dot(a, b))],
                   mode=mode_with_gpu)
 
         bval = my_rand(*b_shp)
         f(bval)
         assert numpy.allclose(numpy.dot(a0, bval), a.get_value())
 
         # Try with a matrix equal to a0, but with strides in both dims
         a.set_value(a0)
         a.set_value(
             a.get_value(borrow=True,
                         return_internal_type=True)[::-1, ::-1],
             borrow=True)
         f(bval)
 
     cmp((3, 4), (4, 5))
@@ -171,12 +178,12 @@ def test_dot22scalar():
         bv = my_rand(*b_shp)
         f = theano.function(
             [a, b],
             tensor.dot(a, b) * numpy.asarray(4, 'float32'),
             mode=mode_with_gpu)
         f2 = theano.function(
             [a, b],
             tensor.dot(a, b) * numpy.asarray(4, 'float32'))
         t = f.maker.fgraph.toposort()
         assert any([isinstance(n.op, tcn.blas.GpuDot22Scalar)
                     for n in t])
         # assert any([isinstance(n.op, tcn.basic_ops.GpuAllocEmpty)
@@ -220,23 +227,22 @@ def test_gemm():
         c = tensor.fmatrix('c')
         f = pfunc([b, c], [], updates=[(a, tensor.dot(a, b) + tensor.exp(c))],
                   mode=mode_with_gpu)
         assert any([node.op == tcn.blas.gpu_gemm_inplace
                     for node in f.maker.fgraph.toposort()])
         bval = my_rand(*b_shp)
         cval = my_rand(a_shp[0], b_shp[1])
         f(bval, cval)
 
         assert numpy.allclose(numpy.dot(a0, bval) + numpy.exp(cval),
                               a.get_value())
 
         # Try with a matrix equal to a0, but with strides in both dims
         a.set_value(a0)
         a.set_value(
             a.get_value(borrow=True,
                         return_internal_type=True)[::-1, ::-1],
             borrow=True)
         f(bval, cval)
 
     cmp((3, 4), (4, 5))
@@ -250,7 +256,7 @@ def test_gemm():
 
 def test_gemm_no_inplace():
     def cmp(a_shp, b_shp):
         a0 = my_rand(*a_shp)
         a = tcn.shared_constructor(a0, 'a')
         cval = my_rand(a_shp[0], b_shp[1])
         c = tcn.shared_constructor(cval.copy(), 'c')
@@ -258,14 +264,13 @@ def test_gemm_no_inplace():
         b = tcn.fmatrix('b')
         b2 = tcn.fmatrix('b2')
 
-        f = pfunc(
-            [b, b2],
-            [tensor.dot(a, b2) + c],
-            updates=[(a, tensor.dot(a, b) + c)],
-            mode=mode_with_gpu)
+        f = pfunc([b, b2],
+                  [tensor.dot(a, b2) + c],
+                  updates=[(a, tensor.dot(a, b) + c)],
+                  mode=mode_with_gpu)
 
         assert any([node.op == tcn.blas.gpu_gemm_no_inplace
                     for node in f.maker.fgraph.toposort()])
         bval = my_rand(*b_shp)
         bval2 = my_rand(*b_shp)
         rval = f(bval, bval2)
@@ -276,9 +281,10 @@ def test_gemm_no_inplace():
         # Try with a matrix equal to a0, but with strides in both dims
         a.set_value(a0)
-        a.set_value(
-            a.get_value(borrow=True,
-                        return_internal_type=True)[::-1, ::-1],
-            borrow=True)
+        a.set_value(
+            a.get_value(
+                borrow=True,
+                return_internal_type=True)[::-1, ::-1],
+            borrow=True)
         f(bval, bval2)
 
     cmp((3, 4), (4, 5))
@@ -303,8 +309,8 @@ if 0:
     def test_maxpool():
        """TODO: test the gpu version!!! """
        for d0, d1, r_true, r_false in [(4, 4, [[[[5, 7], [13, 15]]]],
                                         [[[[5, 7], [13, 15]]]]),
                                        (5, 5, [[[[6, 8], [16, 18], [21, 23]]]],
                                         [[[[6, 8, 9], [16, 18, 19], [21, 23, 24]]]])]:
            for border, ret in [(True, r_true), (False, r_false)]:
                ret = numpy.array(ret)
                a = tcn.blas.Pool((2, 2), border)
@@ -312,7 +318,7 @@ if 0:
                b = dmatrix4()
                f = pfunc([b], [a(b)], mode=mode_with_gpu)
                bval = numpy.arange(0, d0 * d1).reshape(1, 1, d0, d1)
                r = f(bval)[0]
                # print bval, bval.shape, border
                # print r, r.shape
@@ -347,8 +353,7 @@ def test_downsample():
            (1, 1, 1025, 10),
            (1, 1, 1023, 10),
            (65536, 1, 10, 10),
            (1, 65536, 10, 10),
            ]
 
     numpy.random.RandomState(unittest_tools.fetch_seed()).shuffle(shps)
@@ -368,14 +373,14 @@ def test_downsample():
         a = tcn.shared_constructor(my_rand(*shp), 'a')
         f = pfunc([], ds_op(tensor.as_tensor_variable(a)),
                   mode=mode_with_gpu.excluding('cudnn'))
         f2 = pfunc([], ds_op(tensor.as_tensor_variable(a)),
                    mode=mode_without_gpu)
         assert any([isinstance(node.op,
                                tcn.blas.GpuDownsampleFactorMax)
                     for node in f.maker.fgraph.toposort()])
         assert any([isinstance(node.op, Pool)
                     for node in f2.maker.fgraph.toposort()])
         assert numpy.allclose(f(), f2())
 
         # The grad is too slow on GT220 GPU
@@ -387,15 +392,15 @@ def test_downsample():
                 continue
             g = pfunc(
                 [],
                 tensor.grad(ds_op(tensor.as_tensor_variable(a)).sum(),
                             a),
                 mode=mode_with_gpu.excluding('cudnn'))
             g2 = pfunc(
                 [],
                 tensor.grad(ds_op(tensor.as_tensor_variable(a)).sum(),
                             a),
                 mode=mode_without_gpu)
             assert any([isinstance(node.op,
                                    tcn.blas.GpuDownsampleFactorMaxGrad)
                         for node in g.maker.fgraph.toposort()])
@@ -413,11 +418,12 @@ def test_downsample():
             gg = pfunc([], ggf, mode=gpu_mode)
             gg2 = pfunc([], ggf, mode=ref_mode)
-            assert any([isinstance(node.op,
-                        tcn.blas.GpuDownsampleFactorMaxGradGrad)
-                        for node in gg.maker.fgraph.toposort()])
-            assert any([isinstance(node.op, DownsampleFactorMaxGradGrad)
-                        for node in gg2.maker.fgraph.toposort()])
+            assert any([isinstance(
+                node.op,
+                tcn.blas.GpuDownsampleFactorMaxGradGrad)
+                for node in gg.maker.fgraph.toposort()])
+            assert any([isinstance(
+                node.op, DownsampleFactorMaxGradGrad)
+                for node in gg2.maker.fgraph.toposort()])
             assert numpy.allclose(gg(), gg2()), shp
             # We already check that the gpu version return
@@ -434,6 +440,7 @@ class TestGpuGemv(TestCase, BaseGemv,
     gemv = gpu_gemv_no_inplace
     gemv_inplace = gpu_gemv_inplace
 
     # Mimic shared constructors registry
     @staticmethod
     def shared(val):
         # If we don't put shared on the GPU, we won't be able to test
@@ -445,7 +452,7 @@ class TestGpuGemv(TestCase, BaseGemv,
 
 class TestGpuGemvNoTransfer(TestCase, BaseGemv,
                             unittest_tools.TestOptimizationMixin):
     mode = mode_with_gpu
     dtype = 'float32'
@@ -471,13 +478,13 @@ class TestVectorMatrixDot(TestCase):
         ''' Test vector dot matrix '''
         v = theano.shared(numpy.array(numpy.random.rand(2), dtype='float32'))
         m = theano.shared(numpy.array(numpy.random.rand(2, 5),
                                       dtype='float32'))
         no_gpu_f = theano.function([], theano.dot(v, m), mode=mode_without_gpu)
         gpu_f = theano.function([], theano.dot(v, m), mode=mode_with_gpu)
         # gpu_f2 is needed to test the case when the input is not on the gpu
         # but the output is moved to the gpu.
         gpu_f2 = theano.function([], tcn.gpu_from_host(theano.dot(v, m)),
                                  mode=mode_with_gpu)
 
         # Assert they produce the same output
         assert numpy.allclose(no_gpu_f(), gpu_f(), atol=self.atol)
@@ -490,9 +497,9 @@ class TestVectorMatrixDot(TestCase):
         # Check double-strided m
         m.set_value(
             m.get_value(borrow=True,
                         return_internal_type=True)[::-1, ::-1],
             borrow=True)
         assert numpy.allclose(no_gpu_f(), gpu_f(), atol=self.atol)
         assert numpy.allclose(no_gpu_f(), gpu_f2(), atol=self.atol)
@@ -500,13 +507,13 @@ class TestVectorMatrixDot(TestCase):
         ''' Test matrix dot vector '''
         v = theano.shared(numpy.array(numpy.random.rand(2), dtype='float32'))
         m = theano.shared(numpy.array(numpy.random.rand(5, 2),
                                       dtype='float32'))
         no_gpu_f = theano.function([], theano.dot(m, v), mode=mode_without_gpu)
         gpu_f = theano.function([], theano.dot(m, v), mode=mode_with_gpu)
         # gpu_f2 is needed to test the case when the input is not on the gpu
         # but the output is moved to the gpu.
         gpu_f2 = theano.function([], tcn.gpu_from_host(theano.dot(m, v)),
                                  mode=mode_with_gpu)
 
         # Assert they produce the same output
         assert numpy.allclose(no_gpu_f(), gpu_f(), atol=self.atol)
@@ -520,19 +527,21 @@ class TestVectorMatrixDot(TestCase):
     def test_gemv1(self):
         ''' test vector1+dot(matrix,vector2) '''
         v1 = theano.tensor._shared(numpy.array(numpy.random.rand(2),
                                                dtype='float32'))
         v2 = theano.tensor._shared(numpy.array(numpy.random.rand(5),
                                                dtype='float32'))
         m = theano.tensor._shared(numpy.array(numpy.random.rand(5, 2),
                                               dtype='float32'))
 
         no_gpu_f = theano.function([], v2 + theano.dot(m, v1),
                                    mode=mode_without_gpu)
         gpu_f = theano.function([], v2 + theano.dot(m, v1), mode=mode_with_gpu)
         # gpu_f2 is needed to test the case when the input is not on the gpu
         # but the output is moved to the gpu.
-        gpu_f2 = theano.function([], tcn.gpu_from_host(v2 + theano.dot(m, v1)),
-                                 mode=mode_with_gpu)
+        gpu_f2 = theano.function(
+            [], tcn.gpu_from_host(v2 + theano.dot(m, v1)),
+            mode=mode_with_gpu)
 
         # Assert they produce the same output
         assert numpy.allclose(no_gpu_f(), gpu_f(), atol=self.atol)
@@ -548,16 +557,17 @@ class TestVectorMatrixDot(TestCase):
         v1 = theano.shared(numpy.array(numpy.random.rand(5), dtype='float32'))
         v2 = tensor._shared(numpy.array(numpy.random.rand(2), dtype='float32'))
         m = theano.shared(numpy.array(numpy.random.rand(5, 2),
                                       dtype='float32'))
         no_gpu_f = theano.function([], v2 + theano.dot(v1, m),
                                    mode=mode_without_gpu)
         gpu_f = theano.function([], v2 + theano.dot(v1, m),
                                 mode=mode_with_gpu)
         # gpu_f2 is needed to test the case when the input is not on the gpu
         # but the output is moved to the gpu.
-        gpu_f2 = theano.function([], tcn.gpu_from_host(v2 + theano.dot(v1, m)),
-                                 mode=mode_with_gpu)
+        gpu_f2 = theano.function(
+            [], tcn.gpu_from_host(v2 + theano.dot(v1, m)),
+            mode=mode_with_gpu)
 
         # Assert they produce the same output
         assert numpy.allclose(no_gpu_f(), gpu_f(), atol=self.atol)