Skip to content
项目
群组
代码片段
帮助
当前项目
正在载入...
登录 / 注册
切换导航面板
P
pytensor
项目
项目
详情
活动
周期分析
仓库
仓库
文件
提交
分支
标签
贡献者
图表
比较
统计图
议题
0
议题
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
CI / CD
CI / CD
流水线
作业
日程
统计图
Wiki
Wiki
代码片段
代码片段
成员
成员
折叠边栏
关闭边栏
活动
图像
聊天
创建新问题
作业
提交
问题看板
Open sidebar
testgroup
pytensor
Commits
1548d7e0
提交
1548d7e0
authored
10月 02, 2015
作者:
Frédéric Bastien
浏览文件
操作
浏览文件
下载
差异文件
Merge pull request #3414 from harmdevries89/mult_argmax2
support for multiple axes in MaxAndArgMaxOp
上级
c74aa4cf
77e5267c
隐藏空白字符变更
内嵌
并排
正在显示
3 个修改的文件
包含
95 行增加
和
63 行删除
+95
-63
basic.py
theano/tensor/basic.py
+64
-50
opt_uncanonicalize.py
theano/tensor/opt_uncanonicalize.py
+4
-1
test_basic.py
theano/tensor/tests/test_basic.py
+27
-12
没有找到文件。
theano/tensor/basic.py
浏览文件 @
1548d7e0
...
@@ -109,7 +109,8 @@ if 0:
...
@@ -109,7 +109,8 @@ if 0:
# - JB 20100226
# - JB 20100226
def
as_cuda_or_tensor_variable
(
x
,
name
=
None
,
ndim
=
None
):
def
as_cuda_or_tensor_variable
(
x
,
name
=
None
,
ndim
=
None
):
"""
"""
Do the same as_tensor_variable, but do not transfer the value on the gpu.
Do the same as_tensor_variable,
but do not transfer the value on the gpu.
"""
"""
if
hasattr
(
x
,
'_as_CudaNdarrayVariable'
):
if
hasattr
(
x
,
'_as_CudaNdarrayVariable'
):
# TODO: pass name and ndim arguments
# TODO: pass name and ndim arguments
...
@@ -516,7 +517,8 @@ def _allclose(a, b, rtol=None, atol=None):
...
@@ -516,7 +517,8 @@ def _allclose(a, b, rtol=None, atol=None):
if
atol
is
not
None
:
if
atol
is
not
None
:
atol_
=
atol
atol_
=
atol
# Work around bug in Numpy, see http://projects.scipy.org/numpy/ticket/1684
# Work around bug in Numpy, see
# http://projects.scipy.org/numpy/ticket/1684
if
str
(
b
.
dtype
)
in
int_dtypes
and
(
numpy
.
absolute
(
b
)
<
0
)
.
any
():
if
str
(
b
.
dtype
)
in
int_dtypes
and
(
numpy
.
absolute
(
b
)
<
0
)
.
any
():
b
=
theano
.
_asarray
(
b
,
dtype
=
'float64'
)
b
=
theano
.
_asarray
(
b
,
dtype
=
'float64'
)
...
@@ -1287,27 +1289,14 @@ class MaxAndArgmax(Op):
...
@@ -1287,27 +1289,14 @@ class MaxAndArgmax(Op):
def
make_node
(
self
,
x
,
axis
=
None
):
def
make_node
(
self
,
x
,
axis
=
None
):
x
=
_as_tensor_variable
(
x
)
x
=
_as_tensor_variable
(
x
)
if
isinstance
(
axis
,
(
tuple
,
list
)):
axis
=
[
int
(
a
)
for
a
in
axis
]
if
len
(
axis
)
!=
1
:
axis
=
list
(
axis
)
for
idx
in
xrange
(
len
(
axis
)):
if
axis
[
idx
]
<
0
:
axis
[
idx
]
+=
x
.
type
.
ndim
axis
.
sort
()
if
axis
==
list
(
range
(
-
x
.
type
.
ndim
,
0
,
1
)):
axis
=
list
(
range
(
x
.
type
.
ndim
))
assert
axis
==
list
(
range
(
x
.
type
.
ndim
)),
(
"MaxAndArgmax does not support multiple"
" axes. the max fct supports it. Got
%
s"
%
axis
)
axis
=
None
else
:
axis
=
axis
[
0
]
if
isinstance
(
axis
,
(
int
,
numpy
.
integer
)):
if
isinstance
(
axis
,
(
int
,
numpy
.
integer
)):
axis
=
int
(
axis
)
axis
=
[
int
(
axis
)]
elif
isinstance
(
axis
,
numpy
.
ndarray
)
and
axis
.
ndim
==
0
:
elif
isinstance
(
axis
,
numpy
.
ndarray
)
and
axis
.
ndim
==
0
:
axis
=
int
(
axis
)
axis
=
[
int
(
axis
)]
elif
isinstance
(
axis
,
(
tuple
,
list
,
numpy
.
ndarray
)):
axis
=
[
int
(
a
)
for
a
in
axis
]
if
axis
==
list
(
range
(
x
.
type
.
ndim
)):
axis
=
None
elif
isinstance
(
axis
,
Variable
):
elif
isinstance
(
axis
,
Variable
):
if
NoneConst
.
equals
(
axis
):
if
NoneConst
.
equals
(
axis
):
axis
=
None
axis
=
None
...
@@ -1317,30 +1306,40 @@ class MaxAndArgmax(Op):
...
@@ -1317,30 +1306,40 @@ class MaxAndArgmax(Op):
else
:
else
:
assert
(
axis
.
dtype
.
startswith
(
"int"
)
or
assert
(
axis
.
dtype
.
startswith
(
"int"
)
or
axis
.
dtype
.
startswith
(
"uint"
))
axis
.
dtype
.
startswith
(
"uint"
))
axis
=
int
(
axis
.
data
)
if
isinstance
(
axis
.
data
,
(
int
,
numpy
.
integer
))
or
\
# we make the axis all positive to make the infer_shape work
(
isinstance
(
axis
.
data
,
numpy
.
ndarray
)
and
# with negative axis
axis
.
data
.
ndim
==
0
):
if
x
.
type
.
ndim
>
0
and
axis
is
not
None
:
axis
=
[
int
(
axis
.
data
)]
if
axis
<
0
:
elif
isinstance
(
axis
.
data
,
(
list
,
numpy
.
ndarray
)):
if
-
axis
>
x
.
type
.
ndim
:
axis
=
[
int
(
i
)
for
i
in
axis
.
data
]
raise
ValueError
(
'axis out of range'
)
axis
=
x
.
type
.
ndim
+
axis
# Make axis entries non-negative, and sort them
# Verify that the axis is valid.
if
isinstance
(
axis
,
list
):
all_axes
=
set
()
for
idx
in
xrange
(
len
(
axis
)):
if
axis
is
not
None
:
if
axis
[
idx
]
<
0
:
if
axis
<
0
or
axis
>=
x
.
type
.
ndim
:
axis
[
idx
]
+=
x
.
type
.
ndim
raise
ValueError
(
axis
.
sort
()
'Invalid axis:
%
s (the number of dimensions of the '
'input is:
%
s)'
%
(
axis
,
x
.
type
.
ndim
))
# Verify that axes are valid
all_axes
.
add
(
axis
)
all_axes
=
[]
if
isinstance
(
axis
,
list
):
for
ax
in
axis
:
if
ax
<
0
or
ax
>=
x
.
type
.
ndim
:
raise
ValueError
(
'Invalid axis:
%
s (the number of dimensions of the '
'input is:
%
s)'
%
(
ax
,
x
.
type
.
ndim
))
if
ax
not
in
all_axes
:
all_axes
.
append
(
ax
)
else
:
else
:
all_axes
=
list
(
range
(
x
.
ndim
))
all_axes
=
list
(
range
(
x
.
ndim
))
if
axis
is
None
:
if
axis
is
None
or
axis
==
list
(
range
(
x
.
type
.
ndim
)):
axis
=
NoneConst
.
clone
()
axis
=
NoneConst
.
clone
()
else
:
else
:
axis
=
_as_tensor_variable
(
a
xi
s
)
axis
=
_as_tensor_variable
(
a
ll_axe
s
)
assert
axis
.
ndim
==
0
assert
axis
.
ndim
==
1
inputs
=
[
x
,
axis
]
inputs
=
[
x
,
axis
]
# We keep the original broadcastable flags for dimensions on which
# We keep the original broadcastable flags for dimensions on which
# we do not perform the max / argmax.
# we do not perform the max / argmax.
broadcastable
=
[
b
for
i
,
b
in
enumerate
(
x
.
type
.
broadcastable
)
broadcastable
=
[
b
for
i
,
b
in
enumerate
(
x
.
type
.
broadcastable
)
...
@@ -1350,25 +1349,41 @@ class MaxAndArgmax(Op):
...
@@ -1350,25 +1349,41 @@ class MaxAndArgmax(Op):
return
Apply
(
self
,
inputs
,
outputs
)
return
Apply
(
self
,
inputs
,
outputs
)
def
perform
(
self
,
node
,
inp
,
outs
):
def
perform
(
self
,
node
,
inp
,
outs
):
x
,
ax
i
s
=
inp
x
,
ax
e
s
=
inp
max
,
max_idx
=
outs
max
,
max_idx
=
outs
max
[
0
]
=
theano
.
_asarray
(
numpy
.
max
(
x
,
axis
),
if
axes
is
None
:
axes
=
tuple
(
range
(
x
.
ndim
))
else
:
axes
=
tuple
(
axes
)
max
[
0
]
=
theano
.
_asarray
(
numpy
.
max
(
x
,
axes
),
dtype
=
node
.
outputs
[
0
]
.
dtype
)
dtype
=
node
.
outputs
[
0
]
.
dtype
)
max_idx
[
0
]
=
theano
.
_asarray
(
numpy
.
argmax
(
x
,
axis
),
dtype
=
'int64'
)
# Numpy does not support multiple axes for argmax
# Work around
keep_axes
=
numpy
.
array
([
i
for
i
in
range
(
x
.
ndim
)
if
i
not
in
axes
])
# Not-reduced axes in front
transposed_x
=
numpy
.
transpose
(
x
,
numpy
.
concatenate
((
keep_axes
,
axes
)))
reshaped_x
=
transposed_x
.
reshape
(
transposed_x
.
shape
[:
len
(
keep_axes
)]
+
(
-
1
,))
max_idx
[
0
]
=
theano
.
_asarray
(
numpy
.
argmax
(
reshaped_x
,
axis
=-
1
),
dtype
=
'int64'
)
def
c_code
(
self
,
node
,
name
,
inp
,
out
,
sub
):
def
c_code
(
self
,
node
,
name
,
inp
,
out
,
sub
):
x
,
axis
=
inp
x
,
axis
=
inp
max
,
argmax
=
out
max
,
argmax
=
out
fail
=
sub
[
"fail"
]
fail
=
sub
[
"fail"
]
if
NoneConst
.
equals
(
node
.
inputs
[
1
]):
if
NoneConst
.
equals
(
node
.
inputs
[
1
]):
axis_code
=
"axis = NPY_MAXDIMS;"
axis_code
=
"axis = NPY_MAXDIMS;"
else
:
else
:
assert
node
.
inputs
[
1
]
.
ndim
==
0
assert
node
.
inputs
[
1
]
.
ndim
==
1
# Fall back to perform() if there are multiple axes
if
len
(
node
.
inputs
[
1
]
.
data
)
>
1
:
raise
NotImplementedError
()
axis_code
=
"""
axis_code
=
"""
axis = ((dtype_
%(axis)
s*)PyArray_DATA(
%(axis)
s))[0];
axis = ((dtype_
%(axis)
s*)PyArray_DATA(
%(axis)
s))[0];
if(axis > PyArray_NDIM(
%(x)
s)-1 || axis < -PyArray_NDIM(
%(x)
s)){
if(axis > PyArray_NDIM(
%(x)
s)-1 || axis < -PyArray_NDIM(
%(x)
s)){
PyErr_SetString(PyExc_ValueError, "MaxAndArgmax, bad axis argument");
PyErr_SetString(PyExc_ValueError,
"MaxAndArgmax, bad axis argument");
%(fail)
s
%(fail)
s
}
}
"""
%
locals
()
"""
%
locals
()
...
@@ -1420,10 +1435,10 @@ class MaxAndArgmax(Op):
...
@@ -1420,10 +1435,10 @@ class MaxAndArgmax(Op):
def
infer_shape
(
self
,
node
,
shapes
):
def
infer_shape
(
self
,
node
,
shapes
):
ishape
,
axis_shape
=
shapes
ishape
,
axis_shape
=
shapes
axis
=
node
.
inputs
[
1
]
axis
=
node
.
inputs
[
1
]
if
node
.
inputs
[
1
]
.
data
is
None
:
if
axis
.
data
is
None
:
return
[(),
()]
return
[(),
()]
rval
=
tuple
([
ishape
[
i
]
for
(
i
,
b
)
in
enumerate
(
rval
=
tuple
([
ishape
[
i
]
for
(
i
,
b
)
in
enumerate
(
node
.
inputs
[
0
]
.
type
.
broadcastable
)
if
i
!=
axis
.
data
])
node
.
inputs
[
0
]
.
type
.
broadcastable
)
if
i
not
in
axis
.
data
])
return
[
rval
,
rval
]
return
[
rval
,
rval
]
def
R_op
(
self
,
inputs
,
eval_points
):
def
R_op
(
self
,
inputs
,
eval_points
):
...
@@ -1492,7 +1507,7 @@ class MaxAndArgmax(Op):
...
@@ -1492,7 +1507,7 @@ class MaxAndArgmax(Op):
# We are taking the max/argmax over all dimensions.
# We are taking the max/argmax over all dimensions.
axis
=
None
axis
=
None
for
i
in
xrange
(
x
.
ndim
):
for
i
in
xrange
(
x
.
ndim
):
if
axis
is
None
or
i
==
axis
.
data
:
if
axis
is
None
or
i
in
axis
.
data
:
pattern
.
append
(
'x'
)
pattern
.
append
(
'x'
)
else
:
else
:
pattern
.
append
(
out_dim
)
pattern
.
append
(
out_dim
)
...
@@ -1632,7 +1647,6 @@ def argmax(x, axis=None, keepdims=False):
...
@@ -1632,7 +1647,6 @@ def argmax(x, axis=None, keepdims=False):
# In python (using MaxAndArgmax.perform()) this leads to a wasteful
# In python (using MaxAndArgmax.perform()) this leads to a wasteful
# implementation that goes through the data twice instead of once
# implementation that goes through the data twice instead of once
# but when Argmax.c_impl() is in place, it should be fine.
# but when Argmax.c_impl() is in place, it should be fine.
argout
=
max_and_argmax
(
x
,
axis
)[
1
]
argout
=
max_and_argmax
(
x
,
axis
)[
1
]
if
keepdims
:
if
keepdims
:
...
...
theano/tensor/opt_uncanonicalize.py
浏览文件 @
1548d7e0
...
@@ -62,7 +62,10 @@ def local_max_and_argmax(node):
...
@@ -62,7 +62,10 @@ def local_max_and_argmax(node):
try
:
try
:
axis
=
get_scalar_constant_value
(
node
.
inputs
[
1
])
axis
=
get_scalar_constant_value
(
node
.
inputs
[
1
])
except
NotScalarConstantError
:
except
NotScalarConstantError
:
return
False
axis
=
node
.
inputs
[
1
]
if
not
isinstance
(
axis
,
T
.
TensorConstant
):
return
False
axis
=
axis
.
data
new
=
CAReduce
(
scal
.
maximum
,
axis
)(
node
.
inputs
[
0
])
new
=
CAReduce
(
scal
.
maximum
,
axis
)(
node
.
inputs
[
0
])
return
[
new
,
None
]
return
[
new
,
None
]
...
...
theano/tensor/tests/test_basic.py
浏览文件 @
1548d7e0
...
@@ -2641,7 +2641,7 @@ def _approx_eq(a, b, eps=1.0e-4):
...
@@ -2641,7 +2641,7 @@ def _approx_eq(a, b, eps=1.0e-4):
if
_approx_eq
.
debug
:
if
_approx_eq
.
debug
:
print
(
a
,
b
)
print
(
a
,
b
)
return
False
return
False
return
True
return
True
_approx_eq
.
debug
=
0
_approx_eq
.
debug
=
0
...
@@ -2799,10 +2799,10 @@ class T_max_and_argmax(unittest.TestCase):
...
@@ -2799,10 +2799,10 @@ class T_max_and_argmax(unittest.TestCase):
def
test2
(
self
):
def
test2
(
self
):
data
=
rand
(
2
,
3
)
data
=
rand
(
2
,
3
)
n
=
as_tensor_variable
(
data
)
n
=
as_tensor_variable
(
data
)
for
(
axis
,
np_axis
)
in
[(
-
1
,
-
1
),
(
0
,
0
),
(
1
,
1
),
(
None
,
None
),
for
(
axis
,
np_axis
)
in
[(
-
1
,
-
1
),
(
0
,
0
),
(
1
,
1
),
(
None
,
None
),
([
0
,
1
],
None
),
([
1
,
0
],
None
),
([
0
,
1
],
None
),
([
1
,
0
],
None
),
(
NoneConst
.
clone
(),
None
),
(
NoneConst
.
clone
(),
None
),
(
constant
(
0
),
0
)]:
(
constant
(
0
),
0
)]:
v
,
i
=
eval_outputs
(
max_and_argmax
(
n
,
axis
))
v
,
i
=
eval_outputs
(
max_and_argmax
(
n
,
axis
))
assert
i
.
dtype
==
'int64'
assert
i
.
dtype
==
'int64'
self
.
assertTrue
(
numpy
.
all
(
v
==
numpy
.
max
(
data
,
np_axis
)))
self
.
assertTrue
(
numpy
.
all
(
v
==
numpy
.
max
(
data
,
np_axis
)))
...
@@ -2860,8 +2860,8 @@ class T_max_and_argmax(unittest.TestCase):
...
@@ -2860,8 +2860,8 @@ class T_max_and_argmax(unittest.TestCase):
def
test3
(
self
):
def
test3
(
self
):
data
=
rand
(
2
,
3
,
4
)
data
=
rand
(
2
,
3
,
4
)
n
=
as_tensor_variable
(
data
)
n
=
as_tensor_variable
(
data
)
for
(
axis
,
np_axis
)
in
[(
-
1
,
-
1
),
(
0
,
0
),
(
1
,
1
),
(
None
,
None
),
for
(
axis
,
np_axis
)
in
[(
-
1
,
-
1
),
(
0
,
0
),
(
1
,
1
),
(
None
,
None
),
([
0
,
1
,
2
],
None
),
([
1
,
2
,
0
],
None
)]:
([
0
,
1
,
2
],
None
),
([
1
,
2
,
0
],
None
)]:
v
,
i
=
eval_outputs
(
max_and_argmax
(
n
,
axis
))
v
,
i
=
eval_outputs
(
max_and_argmax
(
n
,
axis
))
assert
i
.
dtype
==
'int64'
assert
i
.
dtype
==
'int64'
self
.
assertTrue
(
numpy
.
all
(
v
==
numpy
.
max
(
data
,
np_axis
)))
self
.
assertTrue
(
numpy
.
all
(
v
==
numpy
.
max
(
data
,
np_axis
)))
...
@@ -2922,8 +2922,8 @@ class T_max_and_argmax(unittest.TestCase):
...
@@ -2922,8 +2922,8 @@ class T_max_and_argmax(unittest.TestCase):
z
[
argmax
]
+=
1
z
[
argmax
]
+=
1
else
:
else
:
for
id
,
v
in
enumerate
(
argmax
):
for
id
,
v
in
enumerate
(
argmax
):
z
[
v
*
numpy
.
prod
(
data
.
shape
[
data
.
ndim
-
1
:
axis
:
-
1
])
z
[
v
*
numpy
.
prod
(
data
.
shape
[
data
.
ndim
-
1
:
axis
:
-
1
])
+
+
id
]
+=
1
id
]
+=
1
z
=
z
.
reshape
(
data
.
shape
)
z
=
z
.
reshape
(
data
.
shape
)
assert
numpy
.
all
(
max_grad_data
==
z
)
assert
numpy
.
all
(
max_grad_data
==
z
)
...
@@ -2931,11 +2931,11 @@ class T_max_and_argmax(unittest.TestCase):
...
@@ -2931,11 +2931,11 @@ class T_max_and_argmax(unittest.TestCase):
for
axis
in
(
-
1
,
0
,
1
,
None
):
for
axis
in
(
-
1
,
0
,
1
,
None
):
for
j
in
xrange
(
2
):
for
j
in
xrange
(
2
):
safe_verify_grad
(
lambda
v
:
max_and_argmax
(
v
,
axis
=
axis
)[
j
],
safe_verify_grad
(
lambda
v
:
max_and_argmax
(
v
,
axis
=
axis
)[
j
],
[
data
])
[
data
])
if
axis
!=
1
:
if
axis
!=
1
:
safe_verify_grad
(
lambda
v
:
max_and_argmax
(
v
.
flatten
(),
safe_verify_grad
(
lambda
v
:
max_and_argmax
(
v
.
flatten
(),
axis
=
axis
)[
j
],
axis
=
axis
)[
j
],
[
data
])
[
data
])
if
axis
in
(
0
,
None
):
if
axis
in
(
0
,
None
):
check_grad_max
(
data
,
eval_outputs
(
grad
(
check_grad_max
(
data
,
eval_outputs
(
grad
(
max_and_argmax
(
n
,
axis
=
axis
)[
0
]
.
sum
(),
n
)),
axis
=
axis
)
max_and_argmax
(
n
,
axis
=
axis
)[
0
]
.
sum
(),
n
)),
axis
=
axis
)
...
@@ -2956,6 +2956,11 @@ class T_max_and_argmax(unittest.TestCase):
...
@@ -2956,6 +2956,11 @@ class T_max_and_argmax(unittest.TestCase):
safe_verify_grad
(
lambda
v
:
max_and_argmax
(
v
,
axis
=
[
i
])[
0
],
[
data
])
safe_verify_grad
(
lambda
v
:
max_and_argmax
(
v
,
axis
=
[
i
])[
0
],
[
data
])
safe_verify_grad
(
lambda
v
:
max_and_argmax
(
v
,
axis
=
[
i
])[
1
],
[
data
])
safe_verify_grad
(
lambda
v
:
max_and_argmax
(
v
,
axis
=
[
i
])[
1
],
[
data
])
# Test grad with multiple axes
for
i
in
[[
0
,
1
],
[
0
,
0
]]:
safe_verify_grad
(
lambda
v
:
max_and_argmax
(
v
,
axis
=
i
)[
0
],
[
data
])
safe_verify_grad
(
lambda
v
:
max_and_argmax
(
v
,
axis
=
i
)[
1
],
[
data
])
def
test_preserve_broadcastable
(
self
):
def
test_preserve_broadcastable
(
self
):
"""
"""
Ensure the original broadcastable flags are preserved by Max/Argmax.
Ensure the original broadcastable flags are preserved by Max/Argmax.
...
@@ -2964,6 +2969,16 @@ class T_max_and_argmax(unittest.TestCase):
...
@@ -2964,6 +2969,16 @@ class T_max_and_argmax(unittest.TestCase):
y
=
x
.
max
(
axis
=
1
)
y
=
x
.
max
(
axis
=
1
)
assert
y
.
type
.
broadcastable
==
(
True
,
True
,
False
,
True
)
assert
y
.
type
.
broadcastable
==
(
True
,
True
,
False
,
True
)
def
test_multiple_axes
(
self
):
data
=
numpy
.
arange
(
24
)
.
reshape
(
3
,
2
,
4
)
x
=
as_tensor_variable
(
data
)
v
,
i
=
eval_outputs
(
max_and_argmax
(
x
,
[
1
,
-
1
]))
assert
numpy
.
all
(
v
==
numpy
.
array
([
7
,
15
,
23
]))
assert
numpy
.
all
(
i
==
numpy
.
array
([
7
,
7
,
7
]))
v
=
eval_outputs
(
max_and_argmax
(
x
,
[
1
,
-
1
])[
0
]
.
shape
)
assert
tuple
(
v
)
==
numpy
.
max
(
data
,
(
1
,
-
1
))
.
shape
class
T_argmin_argmax
(
unittest
.
TestCase
):
class
T_argmin_argmax
(
unittest
.
TestCase
):
def
setUp
(
self
):
def
setUp
(
self
):
...
...
编写
预览
Markdown
格式
0%
重试
或
添加新文件
添加附件
取消
您添加了
0
人
到此讨论。请谨慎行事。
请先完成此评论的编辑!
取消
请
注册
或者
登录
后发表评论