Skip to content
项目
群组
代码片段
帮助
当前项目
正在载入...
登录 / 注册
切换导航面板
P
pytensor
项目
项目
详情
活动
周期分析
仓库
仓库
文件
提交
分支
标签
贡献者
图表
比较
统计图
议题
0
议题
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
CI / CD
CI / CD
流水线
作业
日程
统计图
Wiki
Wiki
代码片段
代码片段
成员
成员
折叠边栏
关闭边栏
活动
图像
聊天
创建新问题
作业
提交
问题看板
Open sidebar
testgroup
pytensor
Commits
1548d7e0
提交
1548d7e0
authored
10月 02, 2015
作者:
Frédéric Bastien
浏览文件
操作
浏览文件
下载
差异文件
Merge pull request #3414 from harmdevries89/mult_argmax2
support for multiple axes in MaxAndArgMaxOp
上级
c74aa4cf
77e5267c
隐藏空白字符变更
内嵌
并排
正在显示
3 个修改的文件
包含
95 行增加
和
63 行删除
+95
-63
basic.py
theano/tensor/basic.py
+64
-50
opt_uncanonicalize.py
theano/tensor/opt_uncanonicalize.py
+4
-1
test_basic.py
theano/tensor/tests/test_basic.py
+27
-12
没有找到文件。
theano/tensor/basic.py
浏览文件 @
1548d7e0
...
...
@@ -109,7 +109,8 @@ if 0:
# - JB 20100226
def
as_cuda_or_tensor_variable
(
x
,
name
=
None
,
ndim
=
None
):
"""
Do the same as_tensor_variable, but do not transfer the value on the gpu.
Do the same as_tensor_variable,
but do not transfer the value on the gpu.
"""
if
hasattr
(
x
,
'_as_CudaNdarrayVariable'
):
# TODO: pass name and ndim arguments
...
...
@@ -516,7 +517,8 @@ def _allclose(a, b, rtol=None, atol=None):
if
atol
is
not
None
:
atol_
=
atol
# Work around bug in Numpy, see http://projects.scipy.org/numpy/ticket/1684
# Work around bug in Numpy, see
# http://projects.scipy.org/numpy/ticket/1684
if
str
(
b
.
dtype
)
in
int_dtypes
and
(
numpy
.
absolute
(
b
)
<
0
)
.
any
():
b
=
theano
.
_asarray
(
b
,
dtype
=
'float64'
)
...
...
@@ -1287,27 +1289,14 @@ class MaxAndArgmax(Op):
def
make_node
(
self
,
x
,
axis
=
None
):
x
=
_as_tensor_variable
(
x
)
if
isinstance
(
axis
,
(
tuple
,
list
)):
axis
=
[
int
(
a
)
for
a
in
axis
]
if
len
(
axis
)
!=
1
:
axis
=
list
(
axis
)
for
idx
in
xrange
(
len
(
axis
)):
if
axis
[
idx
]
<
0
:
axis
[
idx
]
+=
x
.
type
.
ndim
axis
.
sort
()
if
axis
==
list
(
range
(
-
x
.
type
.
ndim
,
0
,
1
)):
axis
=
list
(
range
(
x
.
type
.
ndim
))
assert
axis
==
list
(
range
(
x
.
type
.
ndim
)),
(
"MaxAndArgmax does not support multiple"
" axes. the max fct supports it. Got
%
s"
%
axis
)
axis
=
None
else
:
axis
=
axis
[
0
]
if
isinstance
(
axis
,
(
int
,
numpy
.
integer
)):
axis
=
int
(
axis
)
axis
=
[
int
(
axis
)]
elif
isinstance
(
axis
,
numpy
.
ndarray
)
and
axis
.
ndim
==
0
:
axis
=
int
(
axis
)
axis
=
[
int
(
axis
)]
elif
isinstance
(
axis
,
(
tuple
,
list
,
numpy
.
ndarray
)):
axis
=
[
int
(
a
)
for
a
in
axis
]
if
axis
==
list
(
range
(
x
.
type
.
ndim
)):
axis
=
None
elif
isinstance
(
axis
,
Variable
):
if
NoneConst
.
equals
(
axis
):
axis
=
None
...
...
@@ -1317,30 +1306,40 @@ class MaxAndArgmax(Op):
else
:
assert
(
axis
.
dtype
.
startswith
(
"int"
)
or
axis
.
dtype
.
startswith
(
"uint"
))
axis
=
int
(
axis
.
data
)
# we make the axis all positive to make the infer_shape work
# with negative axis
if
x
.
type
.
ndim
>
0
and
axis
is
not
None
:
if
axis
<
0
:
if
-
axis
>
x
.
type
.
ndim
:
raise
ValueError
(
'axis out of range'
)
axis
=
x
.
type
.
ndim
+
axis
# Verify that the axis is valid.
all_axes
=
set
()
if
axis
is
not
None
:
if
axis
<
0
or
axis
>=
x
.
type
.
ndim
:
raise
ValueError
(
'Invalid axis:
%
s (the number of dimensions of the '
'input is:
%
s)'
%
(
axis
,
x
.
type
.
ndim
))
all_axes
.
add
(
axis
)
if
isinstance
(
axis
.
data
,
(
int
,
numpy
.
integer
))
or
\
(
isinstance
(
axis
.
data
,
numpy
.
ndarray
)
and
axis
.
data
.
ndim
==
0
):
axis
=
[
int
(
axis
.
data
)]
elif
isinstance
(
axis
.
data
,
(
list
,
numpy
.
ndarray
)):
axis
=
[
int
(
i
)
for
i
in
axis
.
data
]
# Make axis entries non-negative, and sort them
if
isinstance
(
axis
,
list
):
for
idx
in
xrange
(
len
(
axis
)):
if
axis
[
idx
]
<
0
:
axis
[
idx
]
+=
x
.
type
.
ndim
axis
.
sort
()
# Verify that axes are valid
all_axes
=
[]
if
isinstance
(
axis
,
list
):
for
ax
in
axis
:
if
ax
<
0
or
ax
>=
x
.
type
.
ndim
:
raise
ValueError
(
'Invalid axis:
%
s (the number of dimensions of the '
'input is:
%
s)'
%
(
ax
,
x
.
type
.
ndim
))
if
ax
not
in
all_axes
:
all_axes
.
append
(
ax
)
else
:
all_axes
=
list
(
range
(
x
.
ndim
))
if
axis
is
None
:
if
axis
is
None
or
axis
==
list
(
range
(
x
.
type
.
ndim
)):
axis
=
NoneConst
.
clone
()
else
:
axis
=
_as_tensor_variable
(
a
xi
s
)
assert
axis
.
ndim
==
0
axis
=
_as_tensor_variable
(
a
ll_axe
s
)
assert
axis
.
ndim
==
1
inputs
=
[
x
,
axis
]
# We keep the original broadcastable flags for dimensions on which
# we do not perform the max / argmax.
broadcastable
=
[
b
for
i
,
b
in
enumerate
(
x
.
type
.
broadcastable
)
...
...
@@ -1350,25 +1349,41 @@ class MaxAndArgmax(Op):
return
Apply
(
self
,
inputs
,
outputs
)
def
perform
(
self
,
node
,
inp
,
outs
):
x
,
ax
i
s
=
inp
x
,
ax
e
s
=
inp
max
,
max_idx
=
outs
max
[
0
]
=
theano
.
_asarray
(
numpy
.
max
(
x
,
axis
),
if
axes
is
None
:
axes
=
tuple
(
range
(
x
.
ndim
))
else
:
axes
=
tuple
(
axes
)
max
[
0
]
=
theano
.
_asarray
(
numpy
.
max
(
x
,
axes
),
dtype
=
node
.
outputs
[
0
]
.
dtype
)
max_idx
[
0
]
=
theano
.
_asarray
(
numpy
.
argmax
(
x
,
axis
),
dtype
=
'int64'
)
# Numpy does not support multiple axes for argmax
# Work around
keep_axes
=
numpy
.
array
([
i
for
i
in
range
(
x
.
ndim
)
if
i
not
in
axes
])
# Not-reduced axes in front
transposed_x
=
numpy
.
transpose
(
x
,
numpy
.
concatenate
((
keep_axes
,
axes
)))
reshaped_x
=
transposed_x
.
reshape
(
transposed_x
.
shape
[:
len
(
keep_axes
)]
+
(
-
1
,))
max_idx
[
0
]
=
theano
.
_asarray
(
numpy
.
argmax
(
reshaped_x
,
axis
=-
1
),
dtype
=
'int64'
)
def
c_code
(
self
,
node
,
name
,
inp
,
out
,
sub
):
x
,
axis
=
inp
max
,
argmax
=
out
fail
=
sub
[
"fail"
]
if
NoneConst
.
equals
(
node
.
inputs
[
1
]):
axis_code
=
"axis = NPY_MAXDIMS;"
else
:
assert
node
.
inputs
[
1
]
.
ndim
==
0
assert
node
.
inputs
[
1
]
.
ndim
==
1
# Fall back to perform() if there are multiple axes
if
len
(
node
.
inputs
[
1
]
.
data
)
>
1
:
raise
NotImplementedError
()
axis_code
=
"""
axis = ((dtype_
%(axis)
s*)PyArray_DATA(
%(axis)
s))[0];
if(axis > PyArray_NDIM(
%(x)
s)-1 || axis < -PyArray_NDIM(
%(x)
s)){
PyErr_SetString(PyExc_ValueError, "MaxAndArgmax, bad axis argument");
PyErr_SetString(PyExc_ValueError,
"MaxAndArgmax, bad axis argument");
%(fail)
s
}
"""
%
locals
()
...
...
@@ -1420,10 +1435,10 @@ class MaxAndArgmax(Op):
def
infer_shape
(
self
,
node
,
shapes
):
ishape
,
axis_shape
=
shapes
axis
=
node
.
inputs
[
1
]
if
node
.
inputs
[
1
]
.
data
is
None
:
if
axis
.
data
is
None
:
return
[(),
()]
rval
=
tuple
([
ishape
[
i
]
for
(
i
,
b
)
in
enumerate
(
node
.
inputs
[
0
]
.
type
.
broadcastable
)
if
i
!=
axis
.
data
])
node
.
inputs
[
0
]
.
type
.
broadcastable
)
if
i
not
in
axis
.
data
])
return
[
rval
,
rval
]
def
R_op
(
self
,
inputs
,
eval_points
):
...
...
@@ -1492,7 +1507,7 @@ class MaxAndArgmax(Op):
# We are taking the max/argmax over all dimensions.
axis
=
None
for
i
in
xrange
(
x
.
ndim
):
if
axis
is
None
or
i
==
axis
.
data
:
if
axis
is
None
or
i
in
axis
.
data
:
pattern
.
append
(
'x'
)
else
:
pattern
.
append
(
out_dim
)
...
...
@@ -1632,7 +1647,6 @@ def argmax(x, axis=None, keepdims=False):
# In python (using MaxAndArgmax.perform()) this leads to a wasteful
# implementation that goes through the data twice instead of once
# but when Argmax.c_impl() is in place, it should be fine.
argout
=
max_and_argmax
(
x
,
axis
)[
1
]
if
keepdims
:
...
...
theano/tensor/opt_uncanonicalize.py
浏览文件 @
1548d7e0
...
...
@@ -62,7 +62,10 @@ def local_max_and_argmax(node):
try
:
axis
=
get_scalar_constant_value
(
node
.
inputs
[
1
])
except
NotScalarConstantError
:
return
False
axis
=
node
.
inputs
[
1
]
if
not
isinstance
(
axis
,
T
.
TensorConstant
):
return
False
axis
=
axis
.
data
new
=
CAReduce
(
scal
.
maximum
,
axis
)(
node
.
inputs
[
0
])
return
[
new
,
None
]
...
...
theano/tensor/tests/test_basic.py
浏览文件 @
1548d7e0
...
...
@@ -2641,7 +2641,7 @@ def _approx_eq(a, b, eps=1.0e-4):
if
_approx_eq
.
debug
:
print
(
a
,
b
)
return
False
return
True
return
True
_approx_eq
.
debug
=
0
...
...
@@ -2799,10 +2799,10 @@ class T_max_and_argmax(unittest.TestCase):
def
test2
(
self
):
data
=
rand
(
2
,
3
)
n
=
as_tensor_variable
(
data
)
for
(
axis
,
np_axis
)
in
[(
-
1
,
-
1
),
(
0
,
0
),
(
1
,
1
),
(
None
,
None
),
([
0
,
1
],
None
),
([
1
,
0
],
None
),
(
NoneConst
.
clone
(),
None
),
(
constant
(
0
),
0
)]:
for
(
axis
,
np_axis
)
in
[(
-
1
,
-
1
),
(
0
,
0
),
(
1
,
1
),
(
None
,
None
),
([
0
,
1
],
None
),
([
1
,
0
],
None
),
(
NoneConst
.
clone
(),
None
),
(
constant
(
0
),
0
)]:
v
,
i
=
eval_outputs
(
max_and_argmax
(
n
,
axis
))
assert
i
.
dtype
==
'int64'
self
.
assertTrue
(
numpy
.
all
(
v
==
numpy
.
max
(
data
,
np_axis
)))
...
...
@@ -2860,8 +2860,8 @@ class T_max_and_argmax(unittest.TestCase):
def
test3
(
self
):
data
=
rand
(
2
,
3
,
4
)
n
=
as_tensor_variable
(
data
)
for
(
axis
,
np_axis
)
in
[(
-
1
,
-
1
),
(
0
,
0
),
(
1
,
1
),
(
None
,
None
),
([
0
,
1
,
2
],
None
),
([
1
,
2
,
0
],
None
)]:
for
(
axis
,
np_axis
)
in
[(
-
1
,
-
1
),
(
0
,
0
),
(
1
,
1
),
(
None
,
None
),
([
0
,
1
,
2
],
None
),
([
1
,
2
,
0
],
None
)]:
v
,
i
=
eval_outputs
(
max_and_argmax
(
n
,
axis
))
assert
i
.
dtype
==
'int64'
self
.
assertTrue
(
numpy
.
all
(
v
==
numpy
.
max
(
data
,
np_axis
)))
...
...
@@ -2922,8 +2922,8 @@ class T_max_and_argmax(unittest.TestCase):
z
[
argmax
]
+=
1
else
:
for
id
,
v
in
enumerate
(
argmax
):
z
[
v
*
numpy
.
prod
(
data
.
shape
[
data
.
ndim
-
1
:
axis
:
-
1
])
+
id
]
+=
1
z
[
v
*
numpy
.
prod
(
data
.
shape
[
data
.
ndim
-
1
:
axis
:
-
1
])
+
id
]
+=
1
z
=
z
.
reshape
(
data
.
shape
)
assert
numpy
.
all
(
max_grad_data
==
z
)
...
...
@@ -2931,11 +2931,11 @@ class T_max_and_argmax(unittest.TestCase):
for
axis
in
(
-
1
,
0
,
1
,
None
):
for
j
in
xrange
(
2
):
safe_verify_grad
(
lambda
v
:
max_and_argmax
(
v
,
axis
=
axis
)[
j
],
[
data
])
[
data
])
if
axis
!=
1
:
safe_verify_grad
(
lambda
v
:
max_and_argmax
(
v
.
flatten
(),
axis
=
axis
)[
j
],
[
data
])
axis
=
axis
)[
j
],
[
data
])
if
axis
in
(
0
,
None
):
check_grad_max
(
data
,
eval_outputs
(
grad
(
max_and_argmax
(
n
,
axis
=
axis
)[
0
]
.
sum
(),
n
)),
axis
=
axis
)
...
...
@@ -2956,6 +2956,11 @@ class T_max_and_argmax(unittest.TestCase):
safe_verify_grad
(
lambda
v
:
max_and_argmax
(
v
,
axis
=
[
i
])[
0
],
[
data
])
safe_verify_grad
(
lambda
v
:
max_and_argmax
(
v
,
axis
=
[
i
])[
1
],
[
data
])
# Test grad with multiple axes
for
i
in
[[
0
,
1
],
[
0
,
0
]]:
safe_verify_grad
(
lambda
v
:
max_and_argmax
(
v
,
axis
=
i
)[
0
],
[
data
])
safe_verify_grad
(
lambda
v
:
max_and_argmax
(
v
,
axis
=
i
)[
1
],
[
data
])
def
test_preserve_broadcastable
(
self
):
"""
Ensure the original broadcastable flags are preserved by Max/Argmax.
...
...
@@ -2964,6 +2969,16 @@ class T_max_and_argmax(unittest.TestCase):
y
=
x
.
max
(
axis
=
1
)
assert
y
.
type
.
broadcastable
==
(
True
,
True
,
False
,
True
)
def
test_multiple_axes
(
self
):
data
=
numpy
.
arange
(
24
)
.
reshape
(
3
,
2
,
4
)
x
=
as_tensor_variable
(
data
)
v
,
i
=
eval_outputs
(
max_and_argmax
(
x
,
[
1
,
-
1
]))
assert
numpy
.
all
(
v
==
numpy
.
array
([
7
,
15
,
23
]))
assert
numpy
.
all
(
i
==
numpy
.
array
([
7
,
7
,
7
]))
v
=
eval_outputs
(
max_and_argmax
(
x
,
[
1
,
-
1
])[
0
]
.
shape
)
assert
tuple
(
v
)
==
numpy
.
max
(
data
,
(
1
,
-
1
))
.
shape
class
T_argmin_argmax
(
unittest
.
TestCase
):
def
setUp
(
self
):
...
...
编写
预览
Markdown
格式
0%
重试
或
添加新文件
添加附件
取消
您添加了
0
人
到此讨论。请谨慎行事。
请先完成此评论的编辑!
取消
请
注册
或者
登录
后发表评论