Commit 9fb9dea1, authored Mar 10, 2016 by Pascal Lamblin

    Merge pull request #3991 from vmichals/keep_stack_trace_in_opt

    keep stack trace in optimizations of nnet folder

Parents: f902e1b3, 8328b2a5

Showing 8 changed files with 112 additions and 12 deletions.
theano/tensor/nnet/conv3d2d.py             +10  -2
theano/tensor/nnet/nnet.py                  +3  -2
theano/tensor/nnet/opt.py                   +2  -0
theano/tensor/nnet/sigm.py                 +19  -4
theano/tensor/nnet/tests/test_conv3d2d.py   +8  -0
theano/tensor/nnet/tests/test_nnet.py      +40  -4
theano/tensor/nnet/tests/test_opt.py        +2  -0
theano/tensor/nnet/tests/test_sigm.py      +28  -0
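Every hunk below applies the same pattern: when a local graph optimization replaces a variable, the replacement is now tagged with the stack trace of the variable it replaces, via theano.tensor.opt.copy_stack_trace, so error messages emitted after optimization still point at the line of user code that built the original expression. A minimal sketch of the helper's effect, assuming a standard Theano install (the variables here are illustrative, not taken from the diff):

    import theano.tensor as T
    from theano.tensor.opt import copy_stack_trace

    x = T.vector('x')
    old = T.nnet.sigmoid(x)      # Theano records a creation trace in old.tag.trace
    new = 1 / (1 + T.exp(-x))    # a hand-built equivalent replacement
    # What the optimizers in this commit now do before returning a
    # replacement: carry the old variable's trace over to the new one.
    copy_stack_trace(old, new)
    assert hasattr(new.tag, 'trace')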
theano/tensor/nnet/conv3d2d.py

@@ -3,6 +3,7 @@ from theano.gradient import DisconnectedType
 from theano.gof import Op, Apply, TopoOptimizer
 from theano import tensor
 import theano.sandbox.cuda as cuda
+from theano.tensor.opt import copy_stack_trace


 def get_diagonal_subtensor_view(x, i0, i1):
@@ -328,7 +329,11 @@ def make_gpu_optimizer(op, to_gpu):
             new_inp = list(node.inputs)
             for idx in to_gpu:
                 new_inp[idx] = cuda.gpu_from_host(new_inp[idx])
-            return [cuda.host_from_gpu(op()(*new_inp))]
+            result_node = op()(*new_inp)
+            copy_stack_trace(node.outputs[0], result_node)
+            transfer_node = cuda.host_from_gpu(result_node)
+            copy_stack_trace(node.outputs[0], transfer_node)
+            return [transfer_node]
         if node.op == cuda.gpu_from_host:
             # gpu_from_host(op) -> op(gpu_from_host)
             host_input = node.inputs[0]
@@ -338,7 +343,9 @@ def make_gpu_optimizer(op, to_gpu):
                 new_inp = list(op_node.inputs)
                 for idx in to_gpu:
                     new_inp[idx] = cuda.gpu_from_host(new_inp[idx])
-                return [op()(*new_inp)]
+                new_node = op()(*new_inp)
+                copy_stack_trace(host_input, new_node)
+                return [new_node]
         return False
     local_to_gpu.__name__ = "local_to_gpu_" + op.__name__
     cuda.opt.register_opt()(local_to_gpu)
@@ -355,6 +362,7 @@ def local_inplace_DiagonalSubtensor(node):
             not node.op.inplace):
         new_op = node.op.__class__(inplace=True)
         new_node = new_op(*node.inputs)
+        copy_stack_trace(node.outputs[0], new_node)
         return [new_node]
     return False

 theano.compile.optdb.register(
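Note that in the host/GPU transfer case above the trace is copied onto both newly created variables: the bare GPU op result and the host_from_gpu node wrapped around it each receive the trace of node.outputs[0], presumably because either of them can surface in a later error message.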
theano/tensor/nnet/nnet.py

@@ -752,7 +752,8 @@ def local_logsoftmax(node):
         inVars = node.inputs[0].owner.inputs[0]
         new_op = LogSoftmax()
         ret = new_op(inVars)
         ret.tag.values_eq_approx = values_eq_approx_remove_inf
+        copy_stack_trace([node.inputs[0], node.outputs[0]], ret)
         return [ret]
@@ -785,9 +786,9 @@ def local_logsoftmax_grad(node):
         grads = node.inputs[0].owner.inputs[0]
         if grads.broadcastable[1] and not sm.broadcastable[1]:
             grads = tensor.alloc(grads, grads.shape[0], sm.shape[1])
         ret = grads - tensor.sum(grads, axis=1, keepdims=True) * sm
         ret.tag.values_eq_approx = values_eq_approx_remove_nan
+        copy_stack_trace(node.outputs[0], ret)
         return [ret]
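The local_logsoftmax hunk also shows that copy_stack_trace accepts a list of source variables: the new LogSoftmax output is handed the traces of both node.inputs[0] (the softmax being logged) and node.outputs[0] (the log being replaced), since the rewrite collapses two user-visible operations into one node.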
theano/tensor/nnet/opt.py

@@ -36,6 +36,7 @@ def local_inplace_sparse_block_gemv(node):
     """
     if isinstance(node.op, SparseBlockGemv) and not node.op.inplace:
         new_node = sparse_block_gemv_inplace(*node.inputs)
+        copy_stack_trace(node.outputs[0], new_node)
         return [new_node]
     return False

 compile.optdb.register('local_inplace_sparse_block_gemv',
@@ -52,6 +53,7 @@ def local_inplace_sparse_block_outer(node):
     """
     if isinstance(node.op, SparseBlockOuter) and not node.op.inplace:
         new_node = sparse_block_outer_inplace(*node.inputs)
+        copy_stack_trace(node.outputs[0], new_node)
         return [new_node]
     return False

 compile.optdb.register('local_inplace_sparse_block_outer',
theano/tensor/nnet/sigm.py

@@ -18,13 +18,14 @@ from theano.printing import pprint
 from theano.tensor import basic as tensor
 from theano.tensor import elemwise, opt, NotScalarConstantError
 from theano.tensor.type import values_eq_approx_remove_inf
+from theano.tensor.opt import copy_stack_trace

 ############
 #
 # SCALAR OPS
 #

 class ScalarSigmoid(scalar.UnaryScalarOp):
     """
     This is just speed opt. Not for stability.
@@ -262,6 +263,7 @@ def local_ultra_fast_sigmoid(node):
     if (isinstance(node.op, tensor.Elemwise) and
             node.op.scalar_op == scalar_sigmoid):
         out = ultra_fast_sigmoid(node.inputs[0])
+        copy_stack_trace(node.outputs[0], out)

         def values_eq_approx_remove_low_prec(a, b):
             # atol is found by trial/error.
@@ -301,6 +303,7 @@ def local_hard_sigmoid(node):
     if (isinstance(node.op, tensor.Elemwise) and
             node.op.scalar_op == scalar_sigmoid):
         out = hard_sigmoid(node.inputs[0])
+        copy_stack_trace(node.outputs[0], out)

         def values_eq_approx_remove_low_prec(a, b):
             # atol is found by trial/error.
@@ -925,7 +928,10 @@ def local_sigm_times_exp(node):
         # get rid of them.
         mul_tree = simplify_mul(mul_tree)
         # Recompute final output based on the updated tree.
-        return [compute_mul(mul_tree)]
+        out = compute_mul(mul_tree)
+        # keep the stack trace
+        copy_stack_trace(node.outputs[0], out)
+        return [out]

 @opt.register_stabilize
@@ -946,10 +952,17 @@ def local_inv_1_plus_exp(node):
         if len(nonconsts) == 1:
             if nonconsts[0].owner and nonconsts[0].owner.op == tensor.exp:
                 if scalars and numpy.allclose(numpy.sum(scalars), 1):
-                    return opt._fill_chain(
+                    out = opt._fill_chain(
                         sigmoid(tensor.neg(nonconsts[0].owner.inputs[0])),
                         scalar_inputs)
+                    # keep combined stack traces of
+                    #   exp(x):           nonconsts[0],
+                    #   1 + exp(x):       inv_arg,
+                    #   1 / (1 + exp(x)): node.outputs[0]
+                    copy_stack_trace(
+                        [nonconsts[0], inv_arg, node.outputs[0]], out)
+                    return out

 # Registration is below, and conditional.
@@ -970,7 +983,9 @@ def local_1msigmoid(node):
     except Exception:
         return
     if numpy.allclose(numpy.sum(val_l), 1):
-        return [sigmoid(-sub_r.owner.inputs[0])]
+        out = sigmoid(-sub_r.owner.inputs[0])
+        copy_stack_trace([sub_r, node.outputs[0]], out)
+        return [out]

 register_local_1msigmoid = False
 # This is False because the Stabilize pattern above
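local_inv_1_plus_exp goes one step further and combines three traces, as its added comment spells out: the single sigmoid that replaces the chain exp(x), then 1 + exp(x), then 1 / (1 + exp(x)) inherits the traces of nonconsts[0], inv_arg, and node.outputs[0].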
theano/tensor/nnet/tests/test_conv3d2d.py

@@ -73,6 +73,10 @@ def pyconv3d(signals, filters):
             r_i += o_i[Tf2:o_i_sh0 - Tf2, Hf2:-Hf2, Wf2:-Wf2]
     return rval

+def check_diagonal_subtensor_view_traces(fn):
+    for apply_node in fn.maker.fgraph.apply_nodes:
+        if isinstance(apply_node.op, (DiagonalSubtensor, IncDiagonalSubtensor)):
+            assert hasattr(apply_node.outputs[0].tag, 'trace')

 def test_conv3d(mode=mode_without_gpu, shared=theano.tensor._shared):
     if ndimage is None:
@@ -100,6 +104,7 @@ def test_conv3d(mode=mode_without_gpu, shared=theano.tensor._shared):
                                 updates={s_output: out},
                                 mode=mode)
+    check_diagonal_subtensor_view_traces(newconv3d)
     t0 = time.time()
     newconv3d()
     print(time.time() - t0)
@@ -110,6 +115,7 @@ def test_conv3d(mode=mode_without_gpu, shared=theano.tensor._shared):
                                   (s_signals, gsignals)],
                                  mode=mode,
                                  name='grad')
+    check_diagonal_subtensor_view_traces(gnewconv3d)
     t0 = time.time()
     gnewconv3d()
@@ -144,6 +150,7 @@ def test_conv3d(mode=mode_without_gpu, shared=theano.tensor._shared):
     newconv3d = theano.function([], [],
                                 updates={s_output: out},
                                 mode=mode)
+    check_diagonal_subtensor_view_traces(newconv3d)
     t0 = time.time()
     newconv3d()
@@ -155,6 +162,7 @@ def test_conv3d(mode=mode_without_gpu, shared=theano.tensor._shared):
                                   (s_signals, gsignals)],
                                  mode=mode,
                                  name='grad')
+    check_diagonal_subtensor_view_traces(gnewconv3d)
     t0 = time.time()
     gnewconv3d()
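The new helper above, and the hasattr assertions added throughout the test files below, all check the same post-condition. A minimal standalone version of the check, assuming a standard Theano install:

    import theano
    import theano.tensor as T

    x = T.vector('x')
    # Compiling runs the optimizer pipeline, which rewrites the graph.
    f = theano.function([x], T.nnet.sigmoid(x))
    # With this commit, rewritten output variables still carry a 'trace'
    # tag pointing back at the code that built the original expression.
    assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')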
theano/tensor/nnet/tests/test_nnet.py

@@ -139,6 +139,15 @@ class T_SoftmaxWithBias(utt.InferShapeTester):
         f([0, 1, 0])
         # print f.maker.fgraph.toposort()

+    def test_softmax_with_bias_trace(self):
+        a = theano.shared(numpy.random.randn(3).astype(config.floatX))
+        b = theano.shared(numpy.float32(numpy.random.randn()))
+        sm = T.nnet.softmax(a + b)
+        f = theano.function([], sm)
+        self.assertTrue(hasattr(f.maker.fgraph.outputs[0].tag, 'trace'))
+        print('f.maker.fgraph.outputs[0]: {0}'.format(
+            f.maker.fgraph.outputs[0],))
+
     def test_infer_shape(self):
         admat = matrix()
         advec = vector()
@@ -201,11 +210,11 @@ class T_LogSoftmax(utt.InferShapeTester):
         # numerically stable log-softmax with crossentropy
         logsm = tensor.nnet.logsoftmax(x)
         sm2 = tensor.exp(logsm)  # just used to show equivalence with sm
         cm2 = -tensor.sum(y * logsm, axis=1)
         grad = tensor.grad(cm2.mean(), x)

         # create some inputs into a softmax that are large and labels
         a = numpy.exp(10 * numpy.random.rand(5, 10).astype(theano.config.floatX))
         # create some one-hot coded labels
         b = numpy.eye(5, 10).astype(theano.config.floatX)
@@ -242,6 +251,7 @@ class T_LogSoftmax(utt.InferShapeTester):
         sm = tensor.nnet.softmax(x)
         logsm = tensor.log(sm)
         f = theano.function([x], logsm)
+        self.assertTrue(hasattr(f.maker.fgraph.outputs[0].tag, 'trace'))
         assert isinstance(f.maker.fgraph.outputs[0].owner.op,
                           theano.tensor.nnet.nnet.LogSoftmax)
@@ -257,7 +267,7 @@ class T_LogSoftmax(utt.InferShapeTester):
         m.check_isfinite = False
         # some inputs that are large to make the gradient explode in the non
         # optimized case
         a = numpy.exp(10 * numpy.random.rand(5, 10).astype(theano.config.floatX))

         def myfunc(x):
             sm = tensor.nnet.softmax(x)
@@ -265,6 +275,8 @@ class T_LogSoftmax(utt.InferShapeTester):
             return logsm
         # We set step to 0.1 because for big values we need a big epsilon
         utt.verify_grad(myfunc, [a], eps=0.1, mode=m)
+        f = theano.function([], myfunc(a))
+        self.assertTrue(hasattr(f.maker.fgraph.outputs[0].tag, 'trace'))

 class T_SoftmaxGrad(utt.InferShapeTester):
@@ -642,6 +654,7 @@ class T_CrossentropyCategorical1Hot(utt.InferShapeTester):
         fgraph = gof.FunctionGraph(
             [x, one_of_n],
             [g_x])
+        self.assertTrue(hasattr(fgraph.outputs[0].tag, 'trace'))
         # print 'BEFORE'
         # for node in fgraph.toposort():
@@ -737,6 +750,7 @@ class T_CrossentropyCategorical1Hot(utt.InferShapeTester):
         for expr in expressions:
             # Verify the optimizer worked on the expressions
             f = theano.function([x, y], expr, mode=mode)
+            self.assertTrue(hasattr(f.maker.fgraph.outputs[0].tag, 'trace'))
             if verbose:
                 theano.printing.debugprint(f)
             try:
@@ -752,6 +766,7 @@ class T_CrossentropyCategorical1Hot(utt.InferShapeTester):
             # Also verify the gradient wrt x
             g = theano.function([x, y], T.grad(expr, x), mode=mode)
+            self.assertTrue(hasattr(g.maker.fgraph.outputs[0].tag, 'trace'))
             if verbose:
                 theano.printing.debugprint(g)
             try:
@@ -774,6 +789,7 @@ class T_CrossentropyCategorical1Hot(utt.InferShapeTester):
         for expr in bias_expressions:
             f = theano.function([x, b, y], expr, mode=mode)
+            self.assertTrue(hasattr(f.maker.fgraph.outputs[0].tag, 'trace'))
             if verbose:
                 theano.printing.debugprint(f)
             try:
@@ -785,6 +801,7 @@ class T_CrossentropyCategorical1Hot(utt.InferShapeTester):
                 theano.printing.debugprint(f)
                 raise
             g = theano.function([x, b, y], T.grad(expr, x), mode=mode)
+            self.assertTrue(hasattr(g.maker.fgraph.outputs[0].tag, 'trace'))
             if verbose:
                 theano.printing.debugprint(g)
             try:
@@ -807,6 +824,7 @@ class T_CrossentropyCategorical1Hot(utt.InferShapeTester):
         for expr in mean_expressions:
             f = theano.function([x, y], expr, mode=mode)
+            self.assertTrue(hasattr(f.maker.fgraph.outputs[0].tag, 'trace'))
             if verbose:
                 theano.printing.debugprint(f)
             try:
@@ -821,6 +839,7 @@ class T_CrossentropyCategorical1Hot(utt.InferShapeTester):
                 raise
             g = theano.function([x, y], T.grad(expr, x), mode=mode)
+            self.assertTrue(hasattr(g.maker.fgraph.outputs[0].tag, 'trace'))
             if verbose:
                 theano.printing.debugprint(g)
             try:
@@ -844,6 +863,7 @@ class T_CrossentropyCategorical1Hot(utt.InferShapeTester):
         for expr in mean_bias_expressions:
             f = theano.function([x, b, y], expr, mode=mode)
+            self.assertTrue(hasattr(f.maker.fgraph.outputs[0].tag, 'trace'))
             if verbose:
                 theano.printing.debugprint(f)
             try:
@@ -856,6 +876,7 @@ class T_CrossentropyCategorical1Hot(utt.InferShapeTester):
                 theano.printing.debugprint(f)
                 raise
             g = theano.function([x, b, y], T.grad(expr, x), mode=mode)
+            self.assertTrue(hasattr(g.maker.fgraph.outputs[0].tag, 'trace'))
             if verbose:
                 theano.printing.debugprint(g)
             try:
@@ -1269,6 +1290,7 @@ def test_argmax_pushdown():
     fgraph = gof.FunctionGraph(
         [x],
         [out])
+    assert hasattr(fgraph.outputs[0].tag, 'trace')
     backup = config.warn.argmax_pushdown_bug
     config.warn.argmax_pushdown_bug = False
@@ -1297,6 +1319,8 @@ def test_argmax_pushdown_bias():
     fgraph = gof.FunctionGraph(
         [x, b],
         [out])
+    f = theano.function([x, b], out)
+    assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
     theano.compile.mode.optdb.query(
         theano.compile.mode.OPT_FAST_RUN).optimize(fgraph)
@@ -1316,6 +1340,8 @@ def test_argmax_pushdown_bias():
     fgraph = gof.FunctionGraph(
         [x, b],
         [out])
+    f = theano.function([x, b], out)
+    assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
     backup = config.warn.argmax_pushdown_bug
     config.warn.argmax_pushdown_bug = False
@@ -1405,6 +1431,9 @@ class Test_softmax_opt:
         # test that function contains softmax and no div.
         f = theano.function([c], p_y, mode=self.mode)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         f_ops = [n.op for n in f.maker.fgraph.toposort()]
         # print '--- f ='
         # printing.debugprint(f)
@@ -1419,6 +1448,9 @@ class Test_softmax_opt:
         # test that function contains softmax and no div.
         f = theano.function([c], p_y, mode=self.mode)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         f_ops = [n.op for n in f.maker.fgraph.toposort()]
         # print '--- f ='
         # printing.debugprint(f)
@@ -1437,6 +1469,7 @@ class Test_softmax_opt:
         config.warn.sum_div_dimshuffle_bug = False
         try:
             g = theano.function([c, w], T.grad((p_y * w).sum(), c))
+            hasattr(g.maker.fgraph.outputs[0].tag, 'trace')
         finally:
             config.warn.sum_div_dimshuffle_bug = backup
         g_ops = [n.op for n in g.maker.fgraph.toposort()]
@@ -1464,6 +1497,7 @@ class Test_softmax_opt:
         config.warn.sum_div_dimshuffle_bug = False
         try:
             g = theano.function([c], T.grad(p_y.sum(), c))
+            hasattr(g.maker.fgraph.outputs[0].tag, 'trace')
         finally:
             config.warn.sum_div_dimshuffle_bug = backup
         # printing.debugprint(g)
@@ -1476,6 +1510,7 @@ class Test_softmax_opt:
         # test that function contains softmax and no div.
         f = theano.function([c], p_y)
+        hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         # printing.debugprint(f)
         # test that function contains softmax and no div.
@@ -1483,6 +1518,7 @@ class Test_softmax_opt:
         config.warn.sum_div_dimshuffle_bug = False
         try:
             g = theano.function([c], T.grad(p_y.sum(), c))
+            hasattr(g.maker.fgraph.outputs[0].tag, 'trace')
         finally:
             config.warn.sum_div_dimshuffle_bug = backup
         # printing.debugprint(g)
@@ -1522,6 +1558,7 @@ def test_stabilize_log_softmax():
     z = theano.tensor.log(y)
     f = theano.function([x], z, mode=mode)
+    assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
     # check that the softmax has been optimized out
     for node in f.maker.fgraph.toposort():
@@ -1621,7 +1658,6 @@ def test_h_softmax():
     #############
     x_mat = numpy.random.normal(size=(batch_size, input_size)).astype(floatX)
     y_mat = numpy.random.randint(0, output_size, batch_size).astype('int32')
     tg_output = fun_output_tg(x_mat, y_mat)
     all_outputs = fun_output(x_mat)
theano/tensor/nnet/tests/test_opt.py

@@ -13,6 +13,7 @@ def test_blocksparse_inplace_gemv_opt():
     o = sparse_block_dot(W, h, iIdx, b, oIdx)
     f = theano.function([W, h, iIdx, b, oIdx], o)
+    assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
     if theano.config.mode == "FAST_COMPILE":
         assert not f.maker.fgraph.toposort()[-1].op.inplace
@@ -33,6 +34,7 @@ def test_blocksparse_inplace_outer_opt():
     f = theano.function([W, h, iIdx, b, oIdx],
                         [o, tensor.grad(o.sum(), wrt=W)])
+    assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
     if theano.config.mode == "FAST_COMPILE":
         assert not f.maker.fgraph.toposort()[-1].op.inplace
theano/tensor/nnet/tests/test_sigm.py

@@ -126,32 +126,40 @@ class T_sigmoid_opts(unittest.TestCase):
         # tests inv_1_plus_exp
         f = theano.function([x], T.fill(x, 1.0) / (1 + T.exp(-x)), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         assert [node.op for node in f.maker.fgraph.toposort()] == [sigmoid]
         f(data)
         f = theano.function([x], T.fill(x, 1.0) / (2 + T.exp(-x)), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         assert [node.op for node in f.maker.fgraph.toposort()] != [sigmoid]
         f(data)
         f = theano.function([x], T.fill(x, 1.0) / (1 - T.exp(-x)), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         assert [node.op for node in f.maker.fgraph.toposort()] != [sigmoid]
         f(data)
         f = theano.function([x], T.fill(x, 1.1) / (1 + T.exp(-x)), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         assert [node.op for node in f.maker.fgraph.toposort()] != [sigmoid]
         f(data)

         # tests inv_1_plus_exp with neg
         f = theano.function([x], T.fill(x, -1.0) / (1 + T.exp(-x)), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         assert [node.op for node in f.maker.fgraph.toposort()] == [sigmoid,
                 theano.tensor.inplace.neg_inplace]
         f(data)
         f = theano.function([x], T.fill(x, -1.0) / (1 - T.exp(-x)), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         assert [node.op for node in f.maker.fgraph.toposort()] != [sigmoid,
                 theano.tensor.inplace.neg_inplace]
         f(data)
         f = theano.function([x], T.fill(x, -1.0) / (2 + T.exp(-x)), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         assert [node.op for node in f.maker.fgraph.toposort()] != [sigmoid,
                 theano.tensor.inplace.neg_inplace]
         f(data)
         f = theano.function([x], T.fill(x, -1.1) / (1 + T.exp(-x)), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         assert [node.op for node in f.maker.fgraph.toposort()] != [sigmoid,
                 theano.tensor.inplace.neg_inplace]
         f(data)
@@ -162,31 +170,37 @@ class T_sigmoid_opts(unittest.TestCase):
         # = - (sigm(x) * sigm(x))
         f = theano.function([x], (T.fill(x, -1.0) * T.exp(x)) /
                             ((1 + T.exp(x)) * (1 + T.exp(-x))), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         assert [node.op for node in f.maker.fgraph.toposort()] == [sigmoid,
                                                                    T.mul]
         f(data)
         f = theano.function([x], (T.fill(x, -1.1) * T.exp(x)) /
                             ((1 + T.exp(x)) * (1 + T.exp(-x))), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         assert [node.op for node in f.maker.fgraph.toposort()] != [sigmoid,
                 T.mul, theano.tensor.inplace.neg_inplace]
         f(data)
         f = theano.function([x], (T.fill(x, -1.0) * T.exp(x)) /
                             ((2 + T.exp(x)) * (1 + T.exp(-x))), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         assert [node.op for node in f.maker.fgraph.toposort()] != [sigmoid,
                 T.mul, theano.tensor.inplace.neg_inplace]
         f(data)
         f = theano.function([x], (T.fill(x, -1.0) * T.exp(x)) /
                             ((1 + T.exp(x)) * (2 + T.exp(-x))), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         assert [node.op for node in f.maker.fgraph.toposort()] != [sigmoid,
                 T.mul, theano.tensor.inplace.neg_inplace]
         f(data)
         f = theano.function([x], (T.fill(x, -1.0) * T.exp(x)) /
                             ((1 + T.exp(x)) * (1 + T.exp(x))), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         assert [node.op for node in f.maker.fgraph.toposort()] != [sigmoid,
                 T.mul, theano.tensor.inplace.neg_inplace]
         f(data)
         f = theano.function([x], (T.fill(x, -1.0) * T.exp(x)) /
                             ((1 + T.exp(x)) * (2 + T.exp(-x))), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         assert [node.op for node in f.maker.fgraph.toposort()] != [sigmoid,
                 T.mul, theano.tensor.inplace.neg_inplace]
         f(data)
@@ -204,11 +218,13 @@ class T_sigmoid_opts(unittest.TestCase):
         # tests exp_over_1_plus_exp
         f = theano.function([x], 1 - T.exp(x) / (1 + T.exp(x)), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         assert [node.op for node in f.maker.fgraph.toposort()] == [
             tensor.neg, sigmoid_inplace]

         # tests inv_1_plus_exp
         f = theano.function([x], 1 - T.fill(x, 1.0) / (1 + T.exp(-x)), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         assert [node.op for node in f.maker.fgraph.toposort()] == [tensor.neg,
                                                                    sigmoid_inplace]
@@ -225,12 +241,15 @@ class T_sigmoid_opts(unittest.TestCase):
         x, y = tensor.vectors('x', 'y')
         f = theano.function([x], sigmoid(-x) * tensor.exp(x), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         match(f, [sigmoid])
         f = theano.function([x], sigmoid(x) * tensor.exp(-x), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         match(f, [tensor.neg, sigmoid])
         f = theano.function([x], -(-(-(sigmoid(x)))) * tensor.exp(-x), mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         match(f, [tensor.neg, sigmoid, tensor.neg])
         f = theano.function(
@@ -238,6 +257,7 @@ class T_sigmoid_opts(unittest.TestCase):
             (sigmoid(x) * sigmoid(-y) * -tensor.exp(-x) *
              tensor.exp(x * y) * tensor.exp(y)),
             mode=m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         match(f, [sigmoid, tensor.mul, tensor.neg, tensor.exp, sigmoid,
                   tensor.mul])
@@ -298,6 +318,7 @@ class T_sigmoid_opts(unittest.TestCase):
         mode = self.get_mode()
         if not isinstance(mode, theano.compile.DebugMode):
             f = theano.function([x, lr], ux, mode=mode)
+            assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
             ux_v = f([[50]], 0.1)
             assert not numpy.isnan(ux_v)
@@ -307,12 +328,14 @@ class T_sigmoid_opts(unittest.TestCase):
         mode = self.get_mode('local_ultra_fast_sigmoid')
         f = theano.function([x], s, mode=mode)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         topo = f.maker.fgraph.toposort()
         assert len(topo) == 1
         assert topo[0].op == sigmoid
         mode = self.get_mode().including('local_ultra_fast_sigmoid')
         f = theano.function([x], s, mode=mode)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         topo = f.maker.fgraph.toposort()
         assert topo[0].op == ultra_fast_sigmoid
         assert len(topo) == 1
@@ -324,12 +347,14 @@ class T_sigmoid_opts(unittest.TestCase):
         mode = self.get_mode('local_hard_sigmoid')
         f = theano.function([x], s, mode=mode)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         topo = f.maker.fgraph.toposort()
         assert topo[0].op == sigmoid
         assert len(topo) == 1
         mode = self.get_mode().including('local_hard_sigmoid')
         f = theano.function([x], s, mode=mode)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         topo = f.maker.fgraph.toposort()
         assert len(topo) > 1
         assert not any([n.op == sigmoid for n in topo])
@@ -352,6 +377,7 @@ class T_softplus_opts(unittest.TestCase):
         out = T.log(sigmoid(x))
         f = theano.function([x], out, mode=self.m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         topo = f.maker.fgraph.toposort()
         assert len(topo) == 3
         assert isinstance(topo[0].op.scalar_op, theano.scalar.Neg)
@@ -375,6 +401,7 @@ class T_softplus_opts(unittest.TestCase):
         # Same test with a flatten
         out = T.log(1 - T.flatten(sigmoid(x)))
         f = theano.function([x], out, mode=self.m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         topo = f.maker.fgraph.toposort()
         assert len(topo) == 3
         assert tensor.is_flat(topo[0].outputs[0])
@@ -403,6 +430,7 @@ class T_softplus_opts(unittest.TestCase):
         out = T.log(1 + T.exp(x))
         f = theano.function([x], out, mode=self.m)
+        assert hasattr(f.maker.fgraph.outputs[0].tag, 'trace')
         topo = f.maker.fgraph.toposort()
         assert len(topo) == 1
         assert isinstance(topo[0].op.scalar_op,