提交 639b0871 authored 作者: Ricardo Vieira's avatar Ricardo Vieira 提交者: Ricardo Vieira

Get rid of redundant checks in tracked node_rewriters

上级 cb2c40ba
...@@ -328,7 +328,7 @@ def local_func_inv(fgraph, node): ...@@ -328,7 +328,7 @@ def local_func_inv(fgraph, node):
@register_canonicalize @register_canonicalize
@register_specialize @register_specialize
@node_rewriter([Elemwise]) @node_rewriter([log, log1p, exp, expm1])
def local_exp_log(fgraph, node): def local_exp_log(fgraph, node):
x = node.inputs[0] x = node.inputs[0]
...@@ -368,7 +368,7 @@ def local_exp_log(fgraph, node): ...@@ -368,7 +368,7 @@ def local_exp_log(fgraph, node):
@register_specialize @register_specialize
@node_rewriter([Elemwise]) @node_rewriter([exp, expm1])
def local_exp_log_nan_switch(fgraph, node): def local_exp_log_nan_switch(fgraph, node):
# Rewrites of the kind exp(log...(x)) that require a `nan` switch # Rewrites of the kind exp(log...(x)) that require a `nan` switch
x = node.inputs[0] x = node.inputs[0]
...@@ -431,11 +431,7 @@ def local_sumsqr2dot(fgraph, node): ...@@ -431,11 +431,7 @@ def local_sumsqr2dot(fgraph, node):
``pt.sqr(W.dimshuffle("x", 0, 1) * G.dimshuffle(0, "x", 1) ).sum(axis=(1, 2))`` ``pt.sqr(W.dimshuffle("x", 0, 1) * G.dimshuffle(0, "x", 1) ).sum(axis=(1, 2))``
and converts it to ``pt.dot(pt.sqr(G), pt.sqr(W).sum(axis=0))``. and converts it to ``pt.dot(pt.sqr(G), pt.sqr(W).sum(axis=0))``.
""" """
if ( if node.op.axis == (1, 2):
isinstance(node.op, Sum)
and isinstance(node.op.scalar_op, ps.Add)
and node.op.axis == (1, 2)
):
in1 = node.inputs[0] in1 = node.inputs[0]
out = node.outputs[0] out = node.outputs[0]
...@@ -479,7 +475,7 @@ def local_mul_exp_to_exp_add(fgraph, node): ...@@ -479,7 +475,7 @@ def local_mul_exp_to_exp_add(fgraph, node):
n.owner.inputs[0] n.owner.inputs[0]
for n in node.inputs for n in node.inputs
if n.owner if n.owner
and hasattr(n.owner.op, "scalar_op") and isinstance(n.owner.op, Elemwise)
and isinstance(n.owner.op.scalar_op, ps.Exp) and isinstance(n.owner.op.scalar_op, ps.Exp)
] ]
# Can only do any rewrite if there are at least two exp-s # Can only do any rewrite if there are at least two exp-s
...@@ -523,7 +519,7 @@ def local_mul_pow_to_pow_add(fgraph, node): ...@@ -523,7 +519,7 @@ def local_mul_pow_to_pow_add(fgraph, node):
for n in node.inputs: for n in node.inputs:
if ( if (
n.owner n.owner
and hasattr(n.owner.op, "scalar_op") and isinstance(n.owner.op, Elemwise)
and isinstance(n.owner.op.scalar_op, ps.Pow) and isinstance(n.owner.op.scalar_op, ps.Pow)
): ):
base_node = n.owner.inputs[0] base_node = n.owner.inputs[0]
...@@ -567,10 +563,9 @@ def local_mul_pow_to_pow_add(fgraph, node): ...@@ -567,10 +563,9 @@ def local_mul_pow_to_pow_add(fgraph, node):
@register_stabilize @register_stabilize
@register_specialize @register_specialize
@register_canonicalize @register_canonicalize
@node_rewriter([Elemwise]) @node_rewriter([sub])
def local_expm1(fgraph, node): def local_expm1(fgraph, node):
"""Detect ``exp(a) - 1`` and convert them to ``expm1(a)``.""" """Detect ``exp(a) - 1`` and convert them to ``expm1(a)``."""
if isinstance(node.op, Elemwise) and isinstance(node.op.scalar_op, ps.Sub):
in1, in2 = node.inputs in1, in2 = node.inputs
out = node.outputs[0] out = node.outputs[0]
...@@ -625,8 +620,6 @@ def local_mul_switch_sink(fgraph, node): ...@@ -625,8 +620,6 @@ def local_mul_switch_sink(fgraph, node):
part of the graph. part of the graph.
""" """
if node.op != mul:
return False
for idx, i in enumerate(node.inputs): for idx, i in enumerate(node.inputs):
if i.owner and i.owner.op == switch: if i.owner and i.owner.op == switch:
switch_node = i.owner switch_node = i.owner
...@@ -705,8 +698,6 @@ def local_div_switch_sink(fgraph, node): ...@@ -705,8 +698,6 @@ def local_div_switch_sink(fgraph, node):
See `local_mul_switch_sink` for more details. See `local_mul_switch_sink` for more details.
""" """
if node.op != true_div and node.op != int_div:
return False
op = node.op op = node.op
if node.inputs[0].owner and node.inputs[0].owner.op == switch: if node.inputs[0].owner and node.inputs[0].owner.op == switch:
switch_node = node.inputs[0].owner switch_node = node.inputs[0].owner
...@@ -1235,7 +1226,6 @@ register_canonicalize(local_mul_canonizer, "shape_unsafe", name="local_mul_canon ...@@ -1235,7 +1226,6 @@ register_canonicalize(local_mul_canonizer, "shape_unsafe", name="local_mul_canon
@register_canonicalize @register_canonicalize
@node_rewriter([neg]) @node_rewriter([neg])
def local_neg_to_mul(fgraph, node): def local_neg_to_mul(fgraph, node):
if node.op == neg:
return [mul(np.array(-1, dtype=node.inputs[0].dtype), node.inputs[0])] return [mul(np.array(-1, dtype=node.inputs[0].dtype), node.inputs[0])]
...@@ -1347,17 +1337,12 @@ def local_sum_of_neg_to_neg_of_sum(fgraph, node): ...@@ -1347,17 +1337,12 @@ def local_sum_of_neg_to_neg_of_sum(fgraph, node):
@register_specialize @register_specialize
@node_rewriter([Elemwise]) @node_rewriter([sub])
def local_elemwise_sub_zeros(fgraph, node): def local_elemwise_sub_zeros(fgraph, node):
""" """
Elemwise{sub}(X,X) -> zeros_like(X) Elemwise{sub}(X,X) -> zeros_like(X)
""" """
if ( if node.inputs[0] == node.inputs[1]:
isinstance(node.op, Elemwise)
and node.op.scalar_op.nin == 2
and node.op.scalar_op == ps.sub
and node.inputs[0] == node.inputs[1]
):
res = zeros_like(node.inputs[0]) res = zeros_like(node.inputs[0])
# Copy over stacktrace from previous output. # Copy over stacktrace from previous output.
# This could help for failures due to out-of-memory. # This could help for failures due to out-of-memory.
...@@ -1400,8 +1385,6 @@ def local_useless_elemwise_comparison(fgraph, node): ...@@ -1400,8 +1385,6 @@ def local_useless_elemwise_comparison(fgraph, node):
the graph easier to read. the graph easier to read.
""" """
if not isinstance(node.op, Elemwise):
return
if node.op.scalar_op.nin != 2: if node.op.scalar_op.nin != 2:
return return
...@@ -1590,7 +1573,6 @@ def local_sum_prod_all_to_none(fgraph, node): ...@@ -1590,7 +1573,6 @@ def local_sum_prod_all_to_none(fgraph, node):
Prod{0,1,...N} -> Prod{} Prod{0,1,...N} -> Prod{}
""" """
if isinstance(node.op, Sum) or isinstance(node.op, Prod):
op_type = Sum if isinstance(node.op, Sum) else Prod op_type = Sum if isinstance(node.op, Sum) else Prod
# if all the axes are named, then use None as a shorthand # if all the axes are named, then use None as a shorthand
# this permits more merging # this permits more merging
...@@ -1609,7 +1591,6 @@ def local_op_of_op(fgraph, node): ...@@ -1609,7 +1591,6 @@ def local_op_of_op(fgraph, node):
Sum(Sum()) -> single Sum() Sum(Sum()) -> single Sum()
""" """
if isinstance(node.op, Prod) or isinstance(node.op, Sum):
op_type = Sum if isinstance(node.op, Sum) else Prod op_type = Sum if isinstance(node.op, Sum) else Prod
(node_inps,) = node.inputs (node_inps,) = node.inputs
out_dtype = node.op.dtype out_dtype = node.op.dtype
...@@ -1669,11 +1650,7 @@ def local_reduce_join(fgraph, node): ...@@ -1669,11 +1650,7 @@ def local_reduce_join(fgraph, node):
where we join and reduce on the same set of axis. where we join and reduce on the same set of axis.
""" """
if ( if node.inputs[0].owner and isinstance(node.inputs[0].owner.op, Join):
isinstance(node.op, CAReduce)
and node.inputs[0].owner
and isinstance(node.inputs[0].owner.op, Join)
):
join_node = node.inputs[0].owner join_node = node.inputs[0].owner
if extract_constant(join_node.inputs[0], only_process_constants=True) != 0: if extract_constant(join_node.inputs[0], only_process_constants=True) != 0:
return return
...@@ -1732,7 +1709,6 @@ def local_reduce_join(fgraph, node): ...@@ -1732,7 +1709,6 @@ def local_reduce_join(fgraph, node):
@node_rewriter(ALL_REDUCE) @node_rewriter(ALL_REDUCE)
def local_useless_reduce(fgraph, node): def local_useless_reduce(fgraph, node):
"""Sum(a, axis=[]) -> a""" """Sum(a, axis=[]) -> a"""
if isinstance(node.op, CAReduce):
(summed,) = node.inputs (summed,) = node.inputs
# if reduce were doing anything, the output ndim would be reduced # if reduce were doing anything, the output ndim would be reduced
if summed.type == node.outputs[0].type: if summed.type == node.outputs[0].type:
...@@ -1745,7 +1721,6 @@ def local_useless_reduce(fgraph, node): ...@@ -1745,7 +1721,6 @@ def local_useless_reduce(fgraph, node):
@node_rewriter(ALL_REDUCE) @node_rewriter(ALL_REDUCE)
def local_reduce_broadcastable(fgraph, node): def local_reduce_broadcastable(fgraph, node):
"""Remove reduction over broadcastable dimensions.""" """Remove reduction over broadcastable dimensions."""
if isinstance(node.op, CAReduce):
(reduced,) = node.inputs (reduced,) = node.inputs
odtype = node.outputs[0].dtype odtype = node.outputs[0].dtype
if node.op.axis is None: if node.op.axis is None:
...@@ -1792,15 +1767,12 @@ def local_opt_alloc(fgraph, node): ...@@ -1792,15 +1767,12 @@ def local_opt_alloc(fgraph, node):
prod(alloc(constant,shapes...)) => constant**prod(shapes) prod(alloc(constant,shapes...)) => constant**prod(shapes)
""" """
if isinstance(node.op, Sum) or isinstance(node.op, Prod):
(node_inps,) = node.inputs (node_inps,) = node.inputs
if node_inps.owner and isinstance(node_inps.owner.op, Alloc): if node_inps.owner and isinstance(node_inps.owner.op, Alloc):
inp = node_inps.owner.inputs[0] inp = node_inps.owner.inputs[0]
shapes = node_inps.owner.inputs[1:] shapes = node_inps.owner.inputs[1:]
try: try:
val = get_underlying_scalar_constant_value( val = get_underlying_scalar_constant_value(inp, only_process_constants=True)
inp, only_process_constants=True
)
assert val.size == 1 assert val.size == 1
val = val.reshape(1)[0] val = val.reshape(1)[0]
# check which type of op # check which type of op
...@@ -1838,11 +1810,7 @@ def local_opt_alloc(fgraph, node): ...@@ -1838,11 +1810,7 @@ def local_opt_alloc(fgraph, node):
return [ return [
alloc( alloc(
val, val,
*[ *[shapes[i] for i in range(len(shapes)) if i not in node.op.axis],
shapes[i]
for i in range(len(shapes))
if i not in node.op.axis
],
) )
] ]
except NotScalarConstantError: except NotScalarConstantError:
...@@ -1858,7 +1826,6 @@ def local_neg_div_neg(fgraph, node): ...@@ -1858,7 +1826,6 @@ def local_neg_div_neg(fgraph, node):
Also performs - (c / b) -> ((-c) / b) when c is a scalar constant. Also performs - (c / b) -> ((-c) / b) when c is a scalar constant.
""" """
if node.op == neg:
if node.inputs[0].owner and node.inputs[0].owner.op == true_div: if node.inputs[0].owner and node.inputs[0].owner.op == true_div:
frac = node.inputs[0] frac = node.inputs[0]
num, denom = frac.owner.inputs num, denom = frac.owner.inputs
...@@ -1881,7 +1848,6 @@ def local_sub_neg_to_add(fgraph, node): ...@@ -1881,7 +1848,6 @@ def local_sub_neg_to_add(fgraph, node):
x - (-y) -> x + y x - (-y) -> x + y
""" """
if node.op == sub:
minuend, subtrahend = node.inputs minuend, subtrahend = node.inputs
if subtrahend.owner: if subtrahend.owner:
...@@ -1903,7 +1869,7 @@ def local_add_neg_to_sub(fgraph, node): ...@@ -1903,7 +1869,7 @@ def local_add_neg_to_sub(fgraph, node):
# `local_neg_to_mul` rewrite modifies the relevant pattern during canonicalization # `local_neg_to_mul` rewrite modifies the relevant pattern during canonicalization
# Rewrite is only applicable when there are two inputs to add # Rewrite is only applicable when there are two inputs to add
if node.op == add and len(node.inputs) == 2: if len(node.inputs) == 2:
# Look for pattern with either input order # Look for pattern with either input order
for first, second in (node.inputs, reversed(node.inputs)): for first, second in (node.inputs, reversed(node.inputs)):
if second.owner: if second.owner:
...@@ -1927,7 +1893,6 @@ def local_mul_zero(fgraph, node): ...@@ -1927,7 +1893,6 @@ def local_mul_zero(fgraph, node):
with zero. with zero.
""" """
if node.op == mul:
otype = node.outputs[0].type otype = node.outputs[0].type
for i in node.inputs: for i in node.inputs:
...@@ -1938,16 +1903,14 @@ def local_mul_zero(fgraph, node): ...@@ -1938,16 +1903,14 @@ def local_mul_zero(fgraph, node):
# print 'MUL by value', value, node.inputs # print 'MUL by value', value, node.inputs
if value == 0: if value == 0:
# print '... returning zeros' # print '... returning zeros'
return [ return [broadcast_arrays(_asarray(0, dtype=otype.dtype), *node.inputs)[0]]
broadcast_arrays(_asarray(0, dtype=otype.dtype), *node.inputs)[0]
]
# TODO: Add this to the canonicalization to reduce redundancy. # TODO: Add this to the canonicalization to reduce redundancy.
@register_specialize @register_specialize
@node_rewriter([true_div]) @node_rewriter([true_div])
def local_div_to_reciprocal(fgraph, node): def local_div_to_reciprocal(fgraph, node):
if node.op == true_div and np.all(get_constant(node.inputs[0]) == 1.0): if np.all(get_constant(node.inputs[0]) == 1.0):
out = node.outputs[0] out = node.outputs[0]
new_out = reciprocal(local_mul_canonizer.merge_num_denum(node.inputs[1:], [])) new_out = reciprocal(local_mul_canonizer.merge_num_denum(node.inputs[1:], []))
# The ones could have forced upcasting # The ones could have forced upcasting
...@@ -1957,30 +1920,22 @@ def local_div_to_reciprocal(fgraph, node): ...@@ -1957,30 +1920,22 @@ def local_div_to_reciprocal(fgraph, node):
if not out.type.is_super(new_out.type): if not out.type.is_super(new_out.type):
new_out = alloc_like(new_out, out, fgraph) new_out = alloc_like(new_out, out, fgraph)
return [new_out] return [new_out]
else:
return False
@register_canonicalize @register_canonicalize
@node_rewriter([reciprocal]) @node_rewriter([reciprocal])
def local_reciprocal_canon(fgraph, node): def local_reciprocal_canon(fgraph, node):
if node.op == reciprocal:
return [pt_pow(node.inputs[0], -1.0)] return [pt_pow(node.inputs[0], -1.0)]
else:
return False
@register_canonicalize @register_canonicalize
@node_rewriter([pt_pow]) @node_rewriter([pt_pow])
def local_pow_canonicalize(fgraph, node): def local_pow_canonicalize(fgraph, node):
if node.op == pt_pow:
cst = get_constant(node.inputs[1]) cst = get_constant(node.inputs[1])
if cst == 0: if cst == 0:
return [alloc_like(1, node.outputs[0], fgraph)] return [alloc_like(1, node.outputs[0], fgraph)]
if cst == 1: if cst == 1:
return [alloc_like(node.inputs[0], node.outputs[0], fgraph)] return [alloc_like(node.inputs[0], node.outputs[0], fgraph)]
else:
return False
@register_specialize @register_specialize
...@@ -1989,7 +1944,6 @@ def local_mul_to_sqr(fgraph, node): ...@@ -1989,7 +1944,6 @@ def local_mul_to_sqr(fgraph, node):
""" """
x*x -> sqr(x) x*x -> sqr(x)
""" """
if node.op == mul:
if len(node.inputs) == 2: if len(node.inputs) == 2:
if node.inputs[0] is node.inputs[1]: if node.inputs[0] is node.inputs[1]:
return [sqr(node.inputs[0])] return [sqr(node.inputs[0])]
...@@ -1999,10 +1953,7 @@ def local_mul_to_sqr(fgraph, node): ...@@ -1999,10 +1953,7 @@ def local_mul_to_sqr(fgraph, node):
@node_rewriter([int_div]) @node_rewriter([int_div])
def local_intdiv_by_one(fgraph, node): def local_intdiv_by_one(fgraph, node):
"""x // 1 -> x""" """x // 1 -> x"""
if node.op in [int_div]: if isinstance(node.inputs[1], TensorConstant) and np.all(node.inputs[1].value == 1):
if isinstance(node.inputs[1], TensorConstant) and np.all(
node.inputs[1].value == 1
):
return [node.inputs[0].astype(node.outputs[0].dtype)] return [node.inputs[0].astype(node.outputs[0].dtype)]
...@@ -2011,9 +1962,6 @@ def local_intdiv_by_one(fgraph, node): ...@@ -2011,9 +1962,6 @@ def local_intdiv_by_one(fgraph, node):
@node_rewriter([int_div, true_div]) @node_rewriter([int_div, true_div])
def local_zero_div(fgraph, node): def local_zero_div(fgraph, node):
"""0 / x -> 0""" """0 / x -> 0"""
if isinstance(node.op, Elemwise) and isinstance(
node.op.scalar_op, ps.IntDiv | ps.TrueDiv
):
if get_constant(node.inputs[0]) == 0: if get_constant(node.inputs[0]) == 0:
ret = alloc_like(0, node.outputs[0], fgraph) ret = alloc_like(0, node.outputs[0], fgraph)
ret.tag.values_eq_approx = values_eq_approx_remove_nan ret.tag.values_eq_approx = values_eq_approx_remove_nan
...@@ -2023,7 +1971,6 @@ def local_zero_div(fgraph, node): ...@@ -2023,7 +1971,6 @@ def local_zero_div(fgraph, node):
@register_specialize @register_specialize
@node_rewriter([pt_pow]) @node_rewriter([pt_pow])
def local_pow_specialize(fgraph, node): def local_pow_specialize(fgraph, node):
if node.op == pt_pow:
# the idea here is that we have pow(x, y) # the idea here is that we have pow(x, y)
odtype = node.outputs[0].dtype odtype = node.outputs[0].dtype
xsym = node.inputs[0] xsym = node.inputs[0]
...@@ -2052,8 +1999,6 @@ def local_pow_specialize(fgraph, node): ...@@ -2052,8 +1999,6 @@ def local_pow_specialize(fgraph, node):
rval[0] = cast(rval[0], odtype) rval[0] = cast(rval[0], odtype)
assert rval[0].type.dtype == node.outputs[0].type.dtype assert rval[0].type.dtype == node.outputs[0].type.dtype
return rval return rval
else:
return False
@register_specialize @register_specialize
...@@ -2138,7 +2083,6 @@ def local_mul_specialize(fgraph, node): ...@@ -2138,7 +2083,6 @@ def local_mul_specialize(fgraph, node):
""" """
# at this point [post canonicalize], mul() may have many inputs. # at this point [post canonicalize], mul() may have many inputs.
if node.op == mul:
# the idea here is that we have pow(x, y) # the idea here is that we have pow(x, y)
has_neg = False has_neg = False
new_inputs = [] new_inputs = []
...@@ -2276,7 +2220,7 @@ def local_abs_lift(fgraph, node): ...@@ -2276,7 +2220,7 @@ def local_abs_lift(fgraph, node):
This is needed for check_for_x_over_absX to apply in more case. This is needed for check_for_x_over_absX to apply in more case.
""" """
if node.op == pt_abs and node.inputs[0].owner: if node.inputs[0].owner:
assert node.nin == 1 assert node.nin == 1
if node.inputs[0].owner.op == mul: if node.inputs[0].owner.op == mul:
return [mul(*[pt_abs(i) for i in node.inputs[0].owner.inputs])] return [mul(*[pt_abs(i) for i in node.inputs[0].owner.inputs])]
...@@ -2328,7 +2272,6 @@ def local_abs_merge(fgraph, node): ...@@ -2328,7 +2272,6 @@ def local_abs_merge(fgraph, node):
def local_log1p(fgraph, node): def local_log1p(fgraph, node):
# log(1+x) -> log1p(x) # log(1+x) -> log1p(x)
# log(1-x) -> log1p(-x) # log(1-x) -> log1p(-x)
if node.op == log:
(log_arg,) = node.inputs (log_arg,) = node.inputs
if log_arg.owner and log_arg.owner.op == add: if log_arg.owner and log_arg.owner.op == add:
scalars, scalar_inputs, nonconsts = scalarconsts_rest( scalars, scalar_inputs, nonconsts = scalarconsts_rest(
...@@ -2365,7 +2308,6 @@ def local_log_add_exp(fgraph, node): ...@@ -2365,7 +2308,6 @@ def local_log_add_exp(fgraph, node):
TODO: in canonicalize, change log10 and log2 -> log TODO: in canonicalize, change log10 and log2 -> log
""" """
if node.op == log:
z = node.inputs[0] z = node.inputs[0]
if z.owner and z.owner.op == add: if z.owner and z.owner.op == add:
zi = z.owner.inputs zi = z.owner.inputs
...@@ -2393,9 +2335,6 @@ def local_log_add_exp(fgraph, node): ...@@ -2393,9 +2335,6 @@ def local_log_add_exp(fgraph, node):
def local_log_sum_exp(fgraph, node): def local_log_sum_exp(fgraph, node):
# log(sum_i(exp(x_i))) = x_max + log(sum_i(exp(x_i - x_max))) # log(sum_i(exp(x_i))) = x_max + log(sum_i(exp(x_i - x_max)))
if node.op != log:
return
sum_node = node.inputs[0].owner sum_node = node.inputs[0].owner
# If the sum has keepdims=True, there might be a dimshuffle # If the sum has keepdims=True, there might be a dimshuffle
if sum_node and isinstance(sum_node.op, DimShuffle): if sum_node and isinstance(sum_node.op, DimShuffle):
...@@ -2720,8 +2659,7 @@ def local_log_erfc(fgraph, node): ...@@ -2720,8 +2659,7 @@ def local_log_erfc(fgraph, node):
numpy.asarray([i],dtype='float32')))) for i in numpy.arange( numpy.asarray([i],dtype='float32')))) for i in numpy.arange(
10.0541948,10.0541951,.0000001)] 10.0541948,10.0541951,.0000001)]
""" """
if node.op != log:
return False
if not node.inputs[0].owner or node.inputs[0].owner.op != erfc: if not node.inputs[0].owner or node.inputs[0].owner.op != erfc:
return False return False
...@@ -2773,8 +2711,6 @@ def local_grad_log_erfc_neg(fgraph, node): ...@@ -2773,8 +2711,6 @@ def local_grad_log_erfc_neg(fgraph, node):
Make it so that the test does not generate an error in that case! Make it so that the test does not generate an error in that case!
""" """
if node.op != true_div:
return False
if not node.inputs[1].owner or node.inputs[1].owner.op != erfc: if not node.inputs[1].owner or node.inputs[1].owner.op != erfc:
return False return False
...@@ -3147,7 +3083,6 @@ def local_exp_over_1_plus_exp(fgraph, node): ...@@ -3147,7 +3083,6 @@ def local_exp_over_1_plus_exp(fgraph, node):
""" """
# This rewrite should be done for numerical stability # This rewrite should be done for numerical stability
# so we don't care to check client counts # so we don't care to check client counts
if node.op == true_div:
# find all the exp() terms in the numerator # find all the exp() terms in the numerator
num, denom = node.inputs num, denom = node.inputs
num_exp_x, num_rest, num_neg = partition_num_or_denom(num, is_exp) num_exp_x, num_rest, num_neg = partition_num_or_denom(num, is_exp)
...@@ -3498,9 +3433,6 @@ def local_sigm_times_exp(fgraph, node): ...@@ -3498,9 +3433,6 @@ def local_sigm_times_exp(fgraph, node):
todo: add stack traces to the intermediate variables todo: add stack traces to the intermediate variables
""" """
# Bail early if it is not a multiplication.
if node.op != mul:
return None
# Obtain tree of multiplications starting at this node. # Obtain tree of multiplications starting at this node.
mul_tree = parse_mul_tree(node.outputs[0]) mul_tree = parse_mul_tree(node.outputs[0])
did_something = perform_sigm_times_exp(mul_tree) did_something = perform_sigm_times_exp(mul_tree)
...@@ -3528,7 +3460,6 @@ def local_reciprocal_1_plus_exp(fgraph, node): ...@@ -3528,7 +3460,6 @@ def local_reciprocal_1_plus_exp(fgraph, node):
""" """
# This Rewrite should be done for numerical stability # This Rewrite should be done for numerical stability
# so we don't care to check client counts # so we don't care to check client counts
if node.op == reciprocal:
reciprocal_arg = node.inputs[0] reciprocal_arg = node.inputs[0]
if reciprocal_arg.owner and reciprocal_arg.owner.op == add: if reciprocal_arg.owner and reciprocal_arg.owner.op == add:
scalars_, scalar_inputs, nonconsts = scalarconsts_rest( scalars_, scalar_inputs, nonconsts = scalarconsts_rest(
......
Markdown 格式
0%
您添加了 0 到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 后发表评论