提交 29d3f9e0 authored 作者: lamblin's avatar lamblin

Merge pull request #425 from delallea/improved_set_subtensor

Fixed issues with advanced inc/set subtensor in some cases
...@@ -5097,6 +5097,7 @@ class AdvancedSubtensor1(Op): ...@@ -5097,6 +5097,7 @@ class AdvancedSubtensor1(Op):
def __hash__(self): def __hash__(self):
return hash(type(self)) return hash(type(self))
def __eq__(self, other): def __eq__(self, other):
return type(self) == type(other) return type(self) == type(other)
...@@ -5115,7 +5116,7 @@ class AdvancedSubtensor1(Op): ...@@ -5115,7 +5116,7 @@ class AdvancedSubtensor1(Op):
x, i = inp x, i = inp
out, = out_ out, = out_
# Copy always implied by numpy advanced indexing semantic. # Copy always implied by numpy advanced indexing semantic.
if out[0] is not None and out[0].shape==(len(i),)+x.shape[1:]: if out[0] is not None and out[0].shape == (len(i),) + x.shape[1:]:
o = out[0] o = out[0]
else: else:
o = None o = None
...@@ -5131,8 +5132,9 @@ class AdvancedSubtensor1(Op): ...@@ -5131,8 +5132,9 @@ class AdvancedSubtensor1(Op):
def grad(self, inputs, grads): def grad(self, inputs, grads):
gz, = grads gz, = grads
assert len(inputs)==2 assert len(inputs) == 2
return [advanced_inc_subtensor1(zeros_like(inputs[0]),gz,inputs[1])]+[None]*(len(inputs)-1) rval1 = [advanced_inc_subtensor1(zeros_like(inputs[0]), gz, inputs[1])]
return rval1 + [None] * (len(inputs) - 1)
def R_op(self, inputs, eval_points): def R_op(self, inputs, eval_points):
if eval_points[0] is None: if eval_points[0] is None:
...@@ -5141,10 +5143,11 @@ class AdvancedSubtensor1(Op): ...@@ -5141,10 +5143,11 @@ class AdvancedSubtensor1(Op):
def infer_shape(self, node, ishapes): def infer_shape(self, node, ishapes):
x, ilist = ishapes x, ilist = ishapes
return [ilist+x[1:]] return [ilist + x[1:]]
advanced_subtensor1 = AdvancedSubtensor1() advanced_subtensor1 = AdvancedSubtensor1()
class AdvancedIncSubtensor1(Op): class AdvancedIncSubtensor1(Op):
"""Increments a subtensor using advanced slicing (list of index)""" """Increments a subtensor using advanced slicing (list of index)"""
def __init__(self, inplace=False, set_instead_of_inc=False): def __init__(self, inplace=False, set_instead_of_inc=False):
...@@ -5173,10 +5176,13 @@ class AdvancedIncSubtensor1(Op): ...@@ -5173,10 +5176,13 @@ class AdvancedIncSubtensor1(Op):
if x_.type.ndim == 0: if x_.type.ndim == 0:
raise TypeError('cannot index into a scalar') raise TypeError('cannot index into a scalar')
if y_.type.ndim > x_.type.ndim: if y_.type.ndim > x_.type.ndim:
if self.set_instead_of_inc:
opname = 'set'
else:
opname = 'increment' opname = 'increment'
raise TypeError('cannot %s x subtensor with ndim=%s' raise TypeError('cannot %s x subtensor with ndim=%s'
' by y with ndim=%s to x subtensor with ndim=%s '%( ' by y with ndim=%s to x subtensor with ndim=%s ' % (
opname, x_.type.ndim, y_.type.ndim )) opname, x_.type.ndim, y_.type.ndim))
return Apply(self, [x_, y_, ilist_], [x_.type()]) return Apply(self, [x_, y_, ilist_], [x_.type()])
...@@ -5186,19 +5192,19 @@ class AdvancedIncSubtensor1(Op): ...@@ -5186,19 +5192,19 @@ class AdvancedIncSubtensor1(Op):
out, = out_ out, = out_
if not self.inplace: if not self.inplace:
x = x.copy() x = x.copy()
# x[idx] += y don't work if the same index is present many times. # In Numpy, x[idx] += y doesn't work if the same index is present
# It do it only once # many times: it does it only once. Is it a bug? In any case, for
# -- Numpy also behaves this way, is it a bug in numpy? # this reason we implement our own 'inc' iteration.
if self.set_instead_of_inc: if self.set_instead_of_inc:
if y.ndim: x[idx] = y
for (j,i) in enumerate(idx):
x[i] = y[j]
else:
for i in idx:
x[i] = y
else: else:
if y.ndim: # If `y` has as many dimensions as `x`, then we want to iterate
for (j,i) in enumerate(idx): # jointly on `x` and `y`. Otherwise, it means `y` should be
# broadcasted to fill all relevant rows of `x`.
assert y.ndim <= x.ndim # Should be guaranteed by `make_node`
if y.ndim == x.ndim:
assert len(y) == len(idx)
for (j, i) in enumerate(idx):
x[i] += y[j] x[i] += y[j]
else: else:
for i in idx: for i in idx:
...@@ -5215,7 +5221,6 @@ class AdvancedIncSubtensor1(Op): ...@@ -5215,7 +5221,6 @@ class AdvancedIncSubtensor1(Op):
return self.make_node(eval_points[0], eval_points[1], return self.make_node(eval_points[0], eval_points[1],
*inputs[2:]).outputs *inputs[2:]).outputs
def grad(self, inputs, grads): def grad(self, inputs, grads):
g_output, = grads g_output, = grads
x, y = inputs[:2] x, y = inputs[:2]
...@@ -5228,6 +5233,7 @@ class AdvancedIncSubtensor1(Op): ...@@ -5228,6 +5233,7 @@ class AdvancedIncSubtensor1(Op):
advanced_inc_subtensor1 = AdvancedIncSubtensor1() advanced_inc_subtensor1 = AdvancedIncSubtensor1()
class AdvancedSubtensor(Op): class AdvancedSubtensor(Op):
"""Return a subtensor copy, using advanced indexing. """Return a subtensor copy, using advanced indexing.
""" """
...@@ -5235,10 +5241,10 @@ class AdvancedSubtensor(Op): ...@@ -5235,10 +5241,10 @@ class AdvancedSubtensor(Op):
# AdvancedSubtensor(args)(self, *args), # AdvancedSubtensor(args)(self, *args),
# if args contains and advanced indexing pattern # if args contains and advanced indexing pattern
def __init__(self, args): #idx_list? def __init__(self, args): # idx_list?
# For the moment, __init__ will be passed the whole list of arguments # For the moment, __init__ will be passed the whole list of arguments
#TODO: see what's the best solution #TODO: see what's the best solution
self.args = args #? self.args = args # ?
#FIXME: do not store variables in the class instance #FIXME: do not store variables in the class instance
...@@ -5590,6 +5596,7 @@ class TensorDotGrad(Op): ...@@ -5590,6 +5596,7 @@ class TensorDotGrad(Op):
tensordot_grad = TensorDotGrad tensordot_grad = TensorDotGrad
class TensorDot(Op): class TensorDot(Op):
"""Compute tensor-tensor products over the given axes. """Compute tensor-tensor products over the given axes.
See numpy documentation for details. See numpy documentation for details.
...@@ -5600,21 +5607,23 @@ class TensorDot(Op): ...@@ -5600,21 +5607,23 @@ class TensorDot(Op):
@classmethod @classmethod
def parse_axes(cls, axes): def parse_axes(cls, axes):
if not numpy.isscalar(axes) and len(axes)!=2: if not numpy.isscalar(axes) and len(axes) != 2:
raise ValueError("Axes should be scalar valued or a list/tuple of len 2.") raise ValueError("Axes should be scalar valued or a list/tuple of "
"len 2.")
if isinstance(axes,(list,tuple)): if isinstance(axes, (list, tuple)):
axes_out = [] axes_out = []
# cast axes[0] and axes[1] to tuples # cast axes[0] and axes[1] to tuples
for i,a in enumerate(axes): for i, a in enumerate(axes):
if numpy.isscalar(a): if numpy.isscalar(a):
axes_out.append((a,)) axes_out.append((a,))
else: else:
axes_out.append(tuple(a)) axes_out.append(tuple(a))
# these should be of same length # these should be of same length
if len(axes_out[0])!=len(axes_out[1]): if len(axes_out[0]) != len(axes_out[1]):
raise ValueError("Elements of the axes list/tuple need to be of the same size.") raise ValueError("Elements of the axes list/tuple need to be "
"of the same size.")
axes = tuple(axes_out) axes = tuple(axes_out)
...@@ -5631,22 +5640,23 @@ class TensorDot(Op): ...@@ -5631,22 +5640,23 @@ class TensorDot(Op):
def make_node(self, x, y): def make_node(self, x, y):
op = self op = self
if isinstance(self.axes,int): if isinstance(self.axes, int):
axes = [range(x.ndim-self.axes,x.ndim),range(self.axes)] axes = [range(x.ndim - self.axes, x.ndim), range(self.axes)]
op = TensorDot(axes) op = TensorDot(axes)
axesdim = numpy.size(op.axes)/2 axesdim = numpy.size(op.axes) / 2
x, y = map(as_tensor_variable, [x, y]) x, y = map(as_tensor_variable, [x, y])
if axesdim > x.type.ndim or axesdim > y.type.ndim: if axesdim > x.type.ndim or axesdim > y.type.ndim:
raise TypeError('Cannot sum over more dimensions than input. %i > %i,%i' % raise TypeError('Cannot sum over more dimensions than input. '
axesdim, x.type.ndim, y.type.ndim) '%i > %i,%i' %
(axesdim, x.type.ndim, y.type.ndim))
outdim = x.type.ndim + y.type.ndim - 2*axesdim outdim = x.type.ndim + y.type.ndim - 2 * axesdim
output = tensor(dtype=scal.upcast(x.dtype, y.dtype), output = tensor(dtype=scal.upcast(x.dtype, y.dtype),
broadcastable=[False]*outdim); broadcastable=[False] * outdim)
return Apply(op, inputs=[x,y], outputs=[output,]) return Apply(op, inputs=[x, y], outputs=[output, ])
def perform(self, node, inp, out): def perform(self, node, inp, out):
x, y = inp x, y = inp
...@@ -5654,7 +5664,8 @@ class TensorDot(Op): ...@@ -5654,7 +5664,8 @@ class TensorDot(Op):
try: try:
z[0] = numpy.asarray(numpy.tensordot(x, y, self.axes)) z[0] = numpy.asarray(numpy.tensordot(x, y, self.axes))
except ValueError, e: except ValueError, e:
# The error raised by numpy has no shape information, we mean to add that # The error raised by numpy has no shape information, we mean to
# add that.
e.args = e.args + (x.shape, y.shape, self.axes) e.args = e.args + (x.shape, y.shape, self.axes)
raise raise
...@@ -5667,13 +5678,15 @@ class TensorDot(Op): ...@@ -5667,13 +5678,15 @@ class TensorDot(Op):
def __str__(self): def __str__(self):
return "tensordot" return "tensordot"
def tensordot(x, y=None, axes=2): def tensordot(x, y=None, axes=2):
if y==None: if y is None:
raise NotImplementedError('The interface to tensordot has changed from '\ raise NotImplementedError(
'tensor.tensordot(axes)(x,y) to tensor.tensordot(x,y,axes). Please '\ 'The interface to tensordot has changed from '
'modify your code accordingly.') 'tensor.tensordot(axes)(x,y) to tensor.tensordot(x,y,axes). '
'Please modify your code accordingly.')
if x.ndim==0 or y.ndim==0: if x.ndim == 0 or y.ndim == 0:
raise ValueError('Cannot perform tensordot of 0-d inputs.') raise ValueError('Cannot perform tensordot of 0-d inputs.')
axes = TensorDot.parse_axes(axes) axes = TensorDot.parse_axes(axes)
...@@ -5682,16 +5695,16 @@ def tensordot(x, y=None, axes=2): ...@@ -5682,16 +5695,16 @@ def tensordot(x, y=None, axes=2):
if numpy.isscalar(axes): if numpy.isscalar(axes):
if axes >= x.ndim or axes >= y.ndim: if axes >= x.ndim or axes >= y.ndim:
raise ValueError('axes should be smaller than the dimension of '\ raise ValueError('axes should be smaller than the dimension of '\
'x and y (x.ndim=%i, y.ndim=%i)' % (x.ndim,y.ndim)) 'x and y (x.ndim=%i, y.ndim=%i)' % (x.ndim, y.ndim))
elif isinstance(axes, (list,tuple)): elif isinstance(axes, (list, tuple)):
if isinstance(axes[0],(list,tuple)) and \ if isinstance(axes[0], (list, tuple)) and \
(len(axes[0]) > x.ndim or (numpy.array(axes[0]) >= x.ndim).any()): (len(axes[0]) > x.ndim or (numpy.array(axes[0]) >= x.ndim).any()):
raise ValueError('axes[0] should be array_like, of length smaller'\ raise ValueError('axes[0] should be array_like, of length smaller'\
' than the dimension of x (x.ndim=%i, len(axes[0])=%i).' % ' than the dimension of x (x.ndim=%i, len(axes[0])=%i).' %
(x.ndim, len(axes[0]))) (x.ndim, len(axes[0])))
if isinstance(axes[1],(list,tuple)) and \ if isinstance(axes[1], (list, tuple)) and \
(len(axes[1]) > y.ndim or (numpy.array(axes[1]) >= y.ndim).any()): (len(axes[1]) > y.ndim or (numpy.array(axes[1]) >= y.ndim).any()):
raise ValueError('axes[1] should be array_like, of length smaller'\ raise ValueError('axes[1] should be array_like, of length smaller'\
'than the dimension of y (y.ndim=%i, len(axes[1])=%i).' % 'than the dimension of y (y.ndim=%i, len(axes[1])=%i).' %
......
Markdown 格式
0%
您添加了 0 到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 后发表评论