Commit 90c3833e authored by nouiz

Merge pull request #242 from nouiz/max_default

change the default of theano.{max,min,argmax,argmin,max_and_argmax} to t...
@@ -18,13 +18,6 @@ from theano.gof import Container, Variable, generic

_logger = logging.getLogger('theano.compile.sharedvalue')

-AddConfigVar('shared.value_borrows',
-        ("DEPRECATED. You should not use the 'value' property of shared"
-         " variables, but use the .get_value() and .set_value() methods."
-         " False: shared variables 'value' property is guaranteed to not"
-         " alias theano-managed memory. True: no guarantee, but faster."),
-        BoolParam(True),
-        in_c_key=False)

class SharedVariable(Variable):
    """
@@ -125,29 +118,6 @@ class SharedVariable(Variable):
        cp.tag = copy.copy(self.tag)
        return cp

-    def _value_get(self):
-        warnings.warn(("The .value property of shared variables is deprecated."
-                       " You should use the .get_value() method instead."),
-                      stacklevel=2)
-        return self.get_value(borrow=config.shared.value_borrows,
-                              return_internal_type=False)
-
-    def _value_set(self, new_value):
-        warnings.warn(("The .value property of shared variables is deprecated."
-                       " You should use the .set_value() method instead."),
-                      stacklevel=2)
-        return self.set_value(new_value, borrow=config.shared.value_borrows)
-
-    # TODO: USE A CONFIG VARIABLE TO set these get/set methods to the
-    # non-borrowing versions. Semantically things are clearer when using
-    # the non-borrow versions; that should be the default. The default
-    # supports transparently (if slowly) the case when the 'raw' value is
-    # in a different memory space (e.g. GPU or other machine).
-    value = property(_value_get, _value_set,
-                     doc=("DEPRECATED. Shortcut for self.get_value() and "
-                          "self.set_value(). "
-                          "The `borrow` argument to these methods is read from "
-                          "`theano.config.shared.value_borrows`. "
-                          "You should call get_value() and set_value() directly."))

    def filter_update(self, update):
        """
        When this shared variable is updated by a pfunc, the update value
        will be run through this function.
...
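With the `value` property gone, user code has to migrate to the explicit accessors. A minimal migration sketch (variable names are just for illustration):

    import numpy
    import theano

    s = theano.shared(numpy.zeros(3))
    # Old, removed style:  s.value
    v = s.get_value()                  # borrow=False: returns a copy
    s.set_value(v + 1)                 # borrow=False: copies the new value
    alias = s.get_value(borrow=True)   # may alias internal storage; read-only use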
@@ -1795,6 +1795,7 @@ shape = Shape()
_shape = shape  # was used in the past, now use shape directly.
pprint.assign(_shape, printing.MemberPrinter('shape'))


class SpecifyShape(Op):
    """
    L{Op} that puts the user-provided shape into the graph.
@@ -1808,14 +1809,18 @@ class SpecifyShape(Op):
    @note: We currently don't support specifying partial shape information.
    """
    view_map = {0: [0]}

    def __hash__(self):
        return hash(type(self))

    def __eq__(self, other):
        return type(self) == type(other)

    def __str__(self):
        return self.__class__.__name__

    def make_node(self, x, shape):
        if not isinstance(x, Variable):
            x = as_tensor_variable(x)
        shape = as_tensor_variable(shape)
        return Apply(self, [x, shape], [x.type()])
@@ -1823,22 +1828,22 @@ class SpecifyShape(Op):
    def perform(self, node, inp, out_):
        x, shape = inp
        out, = out_
        assert numpy.all(x.shape == shape), ("got shape", x.shape,
                                             "expected", shape)
        out[0] = x

    def infer_shape(self, node, shapes):
        xshape, sshape = shapes
        new_shape = []
        for dim in xrange(node.inputs[0].ndim):
            try:
                s = get_constant_value(node.inputs[1][dim])
                s = as_tensor_variable(s)
                new_shape.append(s)
            except TypeError, e:
                new_shape.append(node.inputs[1][dim])
        assert len(new_shape) == len(xshape)
        return [new_shape]

    def grad(self, inp, grads):
@@ -1847,9 +1852,10 @@ class SpecifyShape(Op):
        # Should I set a SpecifyShape on gz? I think so,
        # but I don't do it now, as we would need an optimization
        # to remove that op from the graph so it doesn't block
        # other optimizations.
        # Should I write an optimizer that removes the SpecifyShape?
        # I think yes.
        return [gz, None]
        return [specify_shape(gz, s), None]

    def R_op(self, inputs, eval_points):
        if eval_points[0] is None:
@@ -1860,97 +1866,83 @@ class SpecifyShape(Op):

specify_shape = SpecifyShape()
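For orientation, a small usage sketch of this op (shapes chosen arbitrarily); since view_map = {0: [0]}, the output is a view of the input when the runtime check passes:

    import numpy
    import theano
    import theano.tensor as tensor

    x = tensor.matrix()
    y = tensor.specify_shape(x, (2, 3))  # asserts x.shape == (2, 3) at runtime
    f = theano.function([x], y)
    f(numpy.zeros((2, 3)))               # passes the assert in perform()
    # f(numpy.zeros((3, 3)))             # would trigger the assert in perform()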
class MaxAndArgmax(Op):
    """Calculate the max and argmax over a given axis.
-
-    .. note::
-
-        If axis is None, it means to calculate the max over the last
-        dimension, which is DIFFERENT FROM NUMPY!
-        To get numpy's behavior, flatten the input before passing the data
-        to this op. If the input to flatten is not c-contiguous, this will
-        make a copy to a contiguous version.
    """
    nin = 2  # tensor, axis
    nout = 2  # max val, max idx
    E_axis = 'invalid axis'

    def __eq__(self, other):
        return type(self) == type(other)

    def __hash__(self):
        return hash(type(self))

-    def make_node(self, x, axis='DEFAULT'):
+    def make_node(self, x, axis=None):
        x = _as_tensor_variable(x)
-        if x.type.ndim <= 1 and axis in ('DEFAULT', None):
-            # The old and new behavior are not different.
-            axis = 0
-        if axis == 'DEFAULT':
-            axis = x.type.ndim - 1
-            warnings.warn(("The default axis of MaxAndArgmax will change! "
-                "Now we return the max and the argmax over the last "
-                "dimension. It will change to be the same as numpy: the max "
-                "and argmax over all dimensions. To hide this warning and be "
-                "compatible with the future behavior, set axis to -1 to keep "
-                "the current behavior. MaxAndArgmax currently supports only "
-                "one axis, so you must flatten the tensor to get the future "
-                "behavior."), stacklevel=3)
-        elif axis is None:
-            axis = x.type.ndim - 1
-            warnings.warn(("The behavior of MaxAndArgmax when axis==None "
-                "will change! Now we return the max and argmax over the last "
-                "dimension. It will change to the max and argmax over all "
-                "dimensions, as numpy. To hide this warning and be "
-                "compatible with the future behavior, set axis to -1 to keep "
-                "the current behavior. MaxAndArgmax currently supports only "
-                "one axis, so you must flatten the tensor to get the future "
-                "behavior."), stacklevel=3)
        if isinstance(axis, int):
            axis = [axis]
        elif isinstance(axis, (tuple, list)):
-            assert len(axis) == 1, ("MaxAndArgmax doesn't support multiple "
-                                    "axes; the max fct supports it.")
+            if len(axis) != 1:
+                axis = list(axis)
+                axis.sort()
+                assert axis == range(x.type.ndim), (
+                    "MaxAndArgmax doesn't support multiple"
+                    " axes; the max fct supports it.")
        # we make the axes all positive to make infer_shape work
        # with negative axes
-        if x.type.ndim > 0:
+        if x.type.ndim > 0 and axis is not None:
            for id, a in enumerate(axis):
                if not isinstance(a, TensorVariable) and a < 0:
                    if -a > x.type.ndim:
                        raise ValueError('axis out of range')
                    axis[id] = x.type.ndim + a
-        axis = _as_tensor_variable(axis)
+        if axis is None:
+            axis = _as_tensor_variable(range(x.type.ndim))
+        else:
+            axis = _as_tensor_variable(axis)
        inputs = [x, axis]
-        #TODO: figure things out if axis is a constant
-        broadcastable = [False] * (x.type.ndim - 1)
+        broadcastable = [False] * (x.type.ndim - len(axis.data))
        outputs = [tensor(x.type.dtype, broadcastable, name='max'),
                   tensor('int32', broadcastable, name='argmax')]
        return Apply(self, inputs, outputs)

    def perform(self, node, inp, outs):
        x, axis = inp
        max, max_idx = outs
+        if len(axis) == 0 or python_all(axis == range(x.ndim)):
+            axis = None
        max[0] = numpy.asarray(numpy.max(x, axis))
        max_idx[0] = theano._asarray(numpy.argmax(x, axis), dtype='int32')

    def infer_shape(self, node, shapes):
        ishape, axis_shape = shapes
        axis = node.inputs[1]
-        if axis is None:
+        if python_all(axis.data == range(node.inputs[0].ndim)):
            return [(), ()]
        rval = tuple([ishape[i] for (i, b) in enumerate(
            node.inputs[0].type.broadcastable) if i != axis.data])
        return [rval, rval]

    def R_op(self, inputs, eval_points):
        if eval_points[0] is None:
            return [None, None]
        if not isinstance(inputs[1], theano.Constant):
            raise ValueError(('R_op supported for arg_max only for '
                              'constant axis!'))
        if inputs[1].data > 1:
            raise ValueError(('R_op supported for arg_max only when '
                              'axis is 0 or 1'))
        if inputs[0].ndim != 2:
            raise ValueError(('R_op supported for arg_max only when '
                              'input is a matrix'))
        max_vals, max_pos = self.make_node(*inputs).outputs
        if inputs[1].data == 0:
            return [eval_points[0][max_pos,
                                   arange(eval_points[0].shape[1])], None]
        else:
            return [eval_points[0][arange(eval_points[0].shape[0]),
                                   max_pos], None]
@@ -1987,112 +1979,48 @@ class MaxAndArgmax(Op):
    def __str__(self):
        return self.__class__.__name__


_max_and_argmax = MaxAndArgmax()
@_redefine_asRoutine(_max_and_argmax)
def max_and_argmax(a):
    pass
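With this commit, the default axis of max_and_argmax is None, i.e. the reduction is done over all dimensions, matching numpy; the argmax is then an index into the flattened tensor. A minimal sketch of the new contract:

    import numpy
    import theano
    import theano.tensor as tensor

    x = tensor.matrix()
    f = theano.function([x], list(tensor.max_and_argmax(x)))  # axis=None
    data = numpy.random.rand(2, 3)
    m, i = f(data)
    assert m == numpy.max(data)     # numpy also reduces over all dimensions
    assert i == numpy.argmax(data)  # index into data.ravel()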
@constructor
-def max(x, axis='DEFAULT'):
+def max(x, axis=None):
    """
    Return maximum elements obtained by iterating over given axis

-    Default axis is the last one. This will change.
+    Default axis is None: max over all dimensions.

    :note: as numpy does, we raise an error when we reduce a dim with a
        shape of 0
-    :note2: see the MaxAndArgmax note for a difference between numpy and
-        theano when axis==None
    """
-    if x.type.ndim <= 1 and axis in ('DEFAULT', None):
-        # The old and new behavior are not different.
-        axis = 0
-    elif axis == 'DEFAULT':
-        axis = x.type.ndim - 1
-        warnings.warn(("The default axis of max will change! Now we return "
-            "the max over the last dimension. It will change to be the same "
-            "as numpy: the max over all dimensions. To hide this warning and "
-            "be compatible with the future behavior, set axis to -1 to have "
-            "the current behavior. To have the future behavior, set axis to "
-            "range(nb dim), but this doesn't support the grad. To have the "
-            "grad, you must flatten the tensor before calling max()."),
-            stacklevel=2)
-    elif axis is None:
-        axis = x.type.ndim - 1
-        warnings.warn(("The behavior of max when axis==None will change! "
-            "Now we return the max over the last dimension. It will change "
-            "to the max over all dimensions, as numpy. To hide this warning "
-            "and be compatible with the future behavior, set axis to -1 to "
-            "have the current behavior. To have the future behavior, set "
-            "axis to range(nb dim), but this doesn't support the grad. To "
-            "have the grad, you must flatten the tensor before calling "
-            "max()."), stacklevel=2)
    if isinstance(axis, (list, tuple)) and len(axis) > 1:
        return CAReduce(scal.maximum, axis)(x)
    try:
        const = get_constant_value(axis)
        return CAReduce(scal.maximum, list(const))(x)
    except Exception:
        return max_and_argmax(x, axis)[0]
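Note the dispatch above: a list of more than one axis goes straight to CAReduce(scal.maximum, axis), bypassing MaxAndArgmax (whose gradient only supports a single axis). A small equivalence sketch:

    import numpy
    import theano
    import theano.tensor as tensor

    t = tensor.tensor3()
    m = tensor.max(t, axis=[0, 2])        # handled by the CAReduce branch
    f = theano.function([t], m)
    data = numpy.random.rand(2, 3, 4)
    assert numpy.allclose(f(data), data.max(axis=2).max(axis=0))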
@constructor
-def argmax(x, axis='DEFAULT'):
+def argmax(x, axis=None):
    """
    Return indexes of maximum elements obtained by iterating over
    given axis

-    Default axis is the last one. This will change.
+    When axis is None (the default value), the argmax is performed
+    over the flattened tensor.
    """
-    if x.type.ndim <= 1 and axis in ('DEFAULT', None):
-        # The old and new behavior are not different.
-        axis = 0
-    elif axis == 'DEFAULT':
-        axis = x.type.ndim - 1
-        warnings.warn(("The default axis of argmax will change! Now we "
-            "return the argmax over the last dimension. It will change to "
-            "be the same as numpy: the argmax over all dimensions. To hide "
-            "this warning and be compatible with the future behavior, set "
-            "axis to -1 to have the current behavior. To have the future "
-            "behavior, you must flatten the tensor before calling "
-            "argmax()."), stacklevel=2)
-    elif axis is None:
-        axis = x.type.ndim - 1
-        warnings.warn(("The behavior of argmax when axis==None will change! "
-            "Now we return the argmax over the last dimension. It will "
-            "change to the argmax over all dimensions, as numpy. To hide "
-            "this warning and be compatible with the future behavior, set "
-            "axis to -1 to have the current behavior. To have the future "
-            "behavior, you must flatten the tensor before calling "
-            "argmax()."), stacklevel=2)
    # In python (using MaxAndArgmax.perform()) this leads to a wasteful
    # implementation that goes through the data twice instead of once,
    # but when Argmax.c_impl() is in place, it should be fine.
    return max_and_argmax(x, axis)[1]
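Under the new default, argmax with axis=None matches numpy's convention of returning a position in the flattened array:

    import numpy
    import theano
    import theano.tensor as tensor

    x = tensor.matrix()
    f = theano.function([x], tensor.argmax(x))  # axis=None: flattened argmax
    data = numpy.random.rand(2, 3)
    assert f(data) == numpy.argmax(data)        # flat index, as in numpy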
@constructor
-def min(x, axis='DEFAULT'):
-    if x.type.ndim <= 1 and axis in ('DEFAULT', None):
-        # The old and new behavior are not different.
-        axis = 0
-    elif axis == 'DEFAULT':
-        axis = x.type.ndim - 1
-        warnings.warn(("The default axis of min will change! Now we return "
-            "the min over the last dimension. It will change to be the same "
-            "as numpy: the min over all dimensions. To hide this warning and "
-            "be compatible with the future behavior, set axis to -1 to have "
-            "the current behavior. To have the future behavior, set axis to "
-            "range(x.ndim), but this does not support the grad. To be able "
-            "to get the grad, you must flatten the tensor before calling "
-            "min()."), stacklevel=2)
-    elif axis is None:
-        axis = x.type.ndim - 1
-        warnings.warn(("The behavior of min when axis is None will change! "
-            "Now we return the min over the last dimension. It will change "
-            "to the min over all dimensions, as numpy. To hide this warning "
-            "and be compatible with the future behavior, set axis to -1 to "
-            "have the current behavior. To have the future behavior, set "
-            "axis to range(x.ndim), but this does not support the grad. To "
-            "be able to get the grad, you must flatten the tensor before "
-            "calling min()."), stacklevel=2)
+def min(x, axis=None):
    str_x_type = str(x.dtype)
    if str_x_type.startswith('float') or str_x_type in int_dtypes:
        return -max(-x, axis=axis)
@@ -2100,29 +2028,9 @@ def min(x, axis='DEFAULT'):
    # Be careful about unsigned integers and complex
    raise NotImplementedError()
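min delegates to -max(-x), which is exact for floats and signed ints; the dtype guard exists because wrap-around negation breaks the identity for unsigned types. A numpy illustration:

    import numpy

    a = numpy.array([3.0, -1.5, 2.0])
    assert -numpy.max(-a) == numpy.min(a)   # identity used for float/signed int

    u = numpy.array([0, 2, 3], dtype='uint8')
    # -u wraps to [0, 254, 253], so the identity silently breaks:
    assert -numpy.max(-u) != numpy.min(u)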
@constructor
-def argmin(x, axis='DEFAULT'):
-    if x.type.ndim <= 1 and axis in ('DEFAULT', None):
-        # The old and new behavior are not different.
-        axis = 0
-    elif axis == 'DEFAULT':
-        axis = x.type.ndim - 1
-        warnings.warn(("The default axis of argmin will change! Now we "
-            "return the argmin over the last dimension. It will change to "
-            "be the same as numpy: the argmin over all dimensions. To hide "
-            "this warning and be compatible with the future behavior, set "
-            "axis to -1 to have the current behavior. To have the future "
-            "behavior, you must flatten the tensor before calling "
-            "argmin()."), stacklevel=2)
-    elif axis is None:
-        axis = x.type.ndim - 1
-        warnings.warn(("The behavior of argmin when axis==None will change! "
-            "Now we return the argmin over the last dimension. It will "
-            "change to the argmin over all dimensions, as numpy. To hide "
-            "this warning and be compatible with the future behavior, set "
-            "axis to -1 to have the current behavior. To have the future "
-            "behavior, you must flatten the tensor before calling "
-            "argmin()."), stacklevel=2)
+def argmin(x, axis=None):
    str_x_type = str(x.dtype)
    if str_x_type.startswith('float') or str_x_type in int_dtypes:
        return argmax(-x, axis=axis)
@@ -2130,6 +2038,7 @@ def argmin(x, axis='DEFAULT'):
    # Be careful about unsigned integers and complex
    raise NotImplementedError()


@constructor
def smallest(*args):
    """Return the [elementwise] smallest of a variable number of
    arguments (like python's min)."""
...
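smallest is the elementwise counterpart of Python's min across several tensors, not a reduction over one tensor. A quick sketch:

    import numpy
    import theano
    import theano.tensor as tensor

    a = tensor.vector()
    b = tensor.vector()
    f = theano.function([a, b], tensor.smallest(a, b))
    assert numpy.allclose(f([1, 4], [2, 3]), [1, 3])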
@@ -57,7 +57,7 @@ class MaxAndArgmaxOptimizer(Optimizer):
        if len(node.outputs[1].clients) == 0:
            try:
                axis = get_constant_value(node.inputs[1])
-            except ValueError:
+            except (ValueError, TypeError), e:
                return False
            new = CAReduce(scal.maximum, axis)(node.inputs[0])
...
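The optimizer above rewrites a MaxAndArgmax node whose argmax output has no clients into a plain CAReduce. A sketch of how to observe the rewrite (it mirrors the tests below):

    import numpy
    import theano
    import theano.tensor as tensor
    from theano.tensor.elemwise import CAReduce

    mode = theano.compile.mode.get_default_mode().including(
        'canonicalize', 'fast_run')
    n = tensor.matrix()
    # Only the max output is used, so the argmax computation is dropped.
    f = theano.function([n], tensor.max_and_argmax(n, 0)[0], mode=mode)
    topo = f.maker.env.toposort()
    assert len(topo) == 1 and isinstance(topo[0].op, CAReduce)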
@@ -1449,6 +1449,7 @@ class T_Shape(unittest.TestCase):
        s = shape(numpy.ones((5, 3, 10)))
        self.assertTrue((eval_outputs([s]) == [5, 3, 10]).all())


class T_max_and_argmax(unittest.TestCase):
    def setUp(self):
        utt.seed_rng()
@@ -1456,108 +1457,91 @@ class T_max_and_argmax(unittest.TestCase):
    def test0(self):
        n = as_tensor_variable(5.0)
        v, i = eval_outputs(max_and_argmax(n))
        self.assertTrue(v == 5.0)
        self.assertTrue(i == 0)
        v = eval_outputs(max_and_argmax(n)[0].shape)
        assert len(v) == 0
        v = eval_outputs(max_and_argmax(n)[1].shape)
        assert len(v) == 0

    def test1(self):
        n = as_tensor_variable([1, 2, 3, 2, -6])
        v, i = eval_outputs(max_and_argmax(n))
        self.assertTrue(v == 3)
        self.assertTrue(i == 2)
        v = eval_outputs(max_and_argmax(n)[0].shape)
        assert len(v) == 0

    def test2(self):
        data = numpy.random.rand(2, 3)
        n = as_tensor_variable(data)
-        v, i = eval_outputs(max_and_argmax(n, -1))
-        self.assertTrue(numpy.all(v == numpy.max(data, -1)))
-        self.assertTrue(numpy.all(i == numpy.argmax(data, -1)))
-        v = eval_outputs(max_and_argmax(n, -1)[0].shape)
-        assert v == (2)
-
-    def test2b(self):
-        data = numpy.random.rand(2, 3)
-        n = as_tensor_variable(data)
-        v, i = eval_outputs(max_and_argmax(n, 0))
-        self.assertTrue(numpy.all(v == numpy.max(data, 0)))
-        self.assertTrue(numpy.all(i == numpy.argmax(data, 0)))
-        v = eval_outputs(max_and_argmax(n, 0)[0].shape)
-        assert v == (3)
-        v = eval_outputs(max_and_argmax(n, 1)[0].shape)
-        assert v == (2)
-        #currently not supported
-        #v = eval_outputs(max_and_argmax(n, [0, 1])[0].shape)
-        #assert v.size == 0
+        for (axis, np_axis) in [(-1, -1), (0, 0), (1, 1), (None, None),
+                                ([0, 1], None), ([1, 0], None)]:
+            v, i = eval_outputs(max_and_argmax(n, axis))
+            self.assertTrue(numpy.all(v == numpy.max(data, np_axis)))
+            self.assertTrue(numpy.all(i == numpy.argmax(data, np_axis)))
+            v_shape = eval_outputs(max_and_argmax(n, axis)[0].shape)
+            assert tuple(v_shape) == numpy.max(data, np_axis).shape

    def test2_invalid(self):
        n = as_tensor_variable(numpy.random.rand(2, 3))
        # Silence expected error messages
        _logger = logging.getLogger('theano.gof.opt')
        oldlevel = _logger.level
        _logger.setLevel(logging.CRITICAL)
        try:
            try:
                eval_outputs(max_and_argmax(n, 3))
                assert False
            except ValueError, e:
                pass
        finally:
            _logger.setLevel(oldlevel)

    def test2_invalid_neg(self):
        n = as_tensor_variable(numpy.random.rand(2, 3))
        old_stderr = sys.stderr
        sys.stderr = StringIO.StringIO()
        try:
            try:
                eval_outputs(max_and_argmax(n, -3))
                assert False
            except ValueError, e:
                pass
        finally:
            sys.stderr = old_stderr

    def test2_valid_neg(self):
        n = as_tensor_variable(numpy.random.rand(2, 3))
        v, i = eval_outputs(max_and_argmax(n, -1))
        self.assertTrue(v.shape == (2,))
        self.assertTrue(i.shape == (2,))
        self.assertTrue(numpy.all(v == numpy.max(n.value, -1)))
        self.assertTrue(numpy.all(i == numpy.argmax(n.value, -1)))
        v, i = eval_outputs(max_and_argmax(n, -2))
        self.assertTrue(v.shape == (3,))
        self.assertTrue(i.shape == (3,))
        self.assertTrue(numpy.all(v == numpy.max(n.value, -2)))
        self.assertTrue(numpy.all(i == numpy.argmax(n.value, -2)))
        v = eval_outputs(max_and_argmax(n, -1)[0].shape)
        assert v == (2)
        v = eval_outputs(max_and_argmax(n, -2)[0].shape)
        assert v == (3)

    def test3(self):
-        n = as_tensor_variable(numpy.random.rand(2, 3, 4))
-        v, i = eval_outputs(max_and_argmax(n, 0))
-        self.assertTrue(v.shape == (3, 4))
-        self.assertTrue(i.shape == (3, 4))
-        v, i = eval_outputs(max_and_argmax(n, 1))
-        self.assertTrue(v.shape == (2, 4))
-        self.assertTrue(i.shape == (2, 4))
-        v, i = eval_outputs(max_and_argmax(n, 2))
-        self.assertTrue(v.shape == (2, 3))
-        self.assertTrue(i.shape == (2, 3))
-        v = eval_outputs(max_and_argmax(n, 0)[0].shape)
-        assert tuple(v) == (3, 4)
-        v = eval_outputs(max_and_argmax(n, 1)[0].shape)
-        assert tuple(v) == (2, 4)
-        v = eval_outputs(max_and_argmax(n, 2)[0].shape)
-        assert tuple(v) == (2, 3)
+        data = numpy.random.rand(2, 3, 4)
+        n = as_tensor_variable(data)
+        for (axis, np_axis) in [(-1, -1), (0, 0), (1, 1), (None, None),
+                                ([0, 1, 2], None), ([1, 2, 0], None)]:
+            v, i = eval_outputs(max_and_argmax(n, axis))
+            self.assertTrue(numpy.all(v == numpy.max(data, np_axis)))
+            self.assertTrue(numpy.all(i == numpy.argmax(data, np_axis)))
+            v = eval_outputs(max_and_argmax(n, axis)[0].shape)
+            assert tuple(v) == numpy.max(data, np_axis).shape

    def test_grad(self):
        data = numpy.random.rand(2, 3)
        n = as_tensor_variable(data)

        def check_grad_max(data, max_grad_data, axis=None):
@@ -1565,35 +1549,39 @@ class T_max_and_argmax(unittest.TestCase):
            Why is this needed? Is verify_grad not enough?
            """
            #This works only for axis in [0, None]
            assert axis in [0, None]
            z = numpy.zeros_like(data)
            z = z.flatten()
            argmax = numpy.argmax(data, axis=axis)
            if argmax.ndim == 0:
                z[argmax] += 1
            else:
                for id, v in enumerate(argmax):
                    z[v * numpy.prod(data.shape[data.ndim - 1:axis:-1])
                      + id] += 1
            z = z.reshape(data.shape)
            assert numpy.all(max_grad_data == z)

        #test grad of max
        #axis is the last one
        utt.verify_grad(lambda v: max_and_argmax(v, axis=-1)[0], [data])
        utt.verify_grad(lambda v: max_and_argmax(v, axis=-1)[1], [data])

        utt.verify_grad(lambda v: max_and_argmax(v, axis=[0])[0], [data])
        utt.verify_grad(lambda v: max_and_argmax(v, axis=[0])[1], [data])
        check_grad_max(data, eval_outputs(grad(
            max_and_argmax(n, axis=0)[0].sum(), n)), axis=0)

        utt.verify_grad(lambda v: max_and_argmax(v, axis=[1])[0], [data])
        utt.verify_grad(lambda v: max_and_argmax(v, axis=[1])[1], [data])
        #check_grad_max(data, eval_outputs(grad(
        #    max_and_argmax(n, axis=1)[0], n)), axis=1)

        utt.verify_grad(lambda v: max_and_argmax(v.flatten())[0], [data])
        utt.verify_grad(lambda v: max_and_argmax(v.flatten())[1], [data])
        check_grad_max(data, eval_outputs(grad(
            max_and_argmax(n.flatten())[0], n)))

        # Test 4d inner dimensions
        data = numpy.random.rand(2, 3, 4, 5)
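check_grad_max above encodes the expected gradient of max: an indicator that routes the output gradient to the argmax position. For the flattened case it reduces to this numpy sketch:

    import numpy

    data = numpy.random.rand(2, 3)
    g = numpy.zeros_like(data).flatten()
    g[numpy.argmax(data)] += 1   # d(max)/dx is 1 at the argmax, 0 elsewhere
    g = g.reshape(data.shape)
    # g is what grad(max_and_argmax(n.flatten())[0], n) should evaluate to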
@@ -1608,60 +1596,48 @@ class T_argmin_argmax(unittest.TestCase):
        utt.seed_rng()
        MaxAndArgmax.debug = 0

-    def test0(self):
+    def test_scalar(self):
        for fct in [argmin, argmax]:
            n = as_tensor_variable(5.0)
            i = eval_outputs(fct(n))
            self.assertTrue(i == 0)
            v = eval_outputs(fct(n).shape)
            assert len(v) == 0

-    def test1(self):
+    def test_list(self):
        n = as_tensor_variable([1, 2, 3, 2, -6])
        i = eval_outputs(argmin(n))
        self.assertTrue(i == 4)
        v = eval_outputs(argmin(n).shape)
        assert len(v) == 0

        n = as_tensor_variable([1, 2, 3, 2, -6])
        i = eval_outputs(argmax(n))
        self.assertTrue(i == 2)
        v = eval_outputs(argmax(n).shape)
        assert len(v) == 0

    def test2(self):
-        for fct, nfct in [(argmax, numpy.argmax), (argmin, numpy.argmin)]:
-            data = numpy.random.rand(2, 3)
-            n = as_tensor_variable(data)
-            i = eval_outputs(fct(n, -1))
-            self.assertTrue(numpy.all(i == nfct(data, -1)))
-            v = eval_outputs(fct(n, -1).shape)
-            assert v == (2)
-
-    def test2b(self):
-        for fct, nfct in [(argmax, numpy.argmax), (argmin, numpy.argmin)]:
-            data = numpy.random.rand(2, 3)
-            n = as_tensor_variable(data)
-            i = eval_outputs(fct(n, 0))
-            self.assertTrue(numpy.all(i == nfct(data, 0)))
-            v = eval_outputs(fct(n, 0).shape)
-            assert v == (3)
-            v = eval_outputs(fct(n, 1).shape)
-            assert v == (2)
-            #currently not supported
-            #v = eval_outputs(fct(n, [0, 1]).shape)
-            #assert v.size == 0
+        data = numpy.random.rand(2, 3)
+        n = as_tensor_variable(data)
+        for fct, nfct in [(argmax, numpy.argmax), (argmin, numpy.argmin)]:
+            for (axis, np_axis) in [(-1, -1), (0, 0), (1, 1), (None, None),
+                                    ([0, 1], None), ([1, 0], None)]:
+                v = eval_outputs(fct(n, axis))
+                self.assertTrue(numpy.all(v == nfct(data, np_axis)))
+                v_shape = eval_outputs(fct(n, axis).shape)
+                assert tuple(v_shape) == nfct(data, np_axis).shape

    def test2_invalid(self):
        for fct, nfct in [(argmax, numpy.argmax), (argmin, numpy.argmin)]:
            n = as_tensor_variable(numpy.random.rand(2, 3))
            # Silence expected error messages
            _logger = logging.getLogger('theano.gof.opt')
            oldlevel = _logger.level
            _logger.setLevel(logging.CRITICAL)
            try:
                try:
                    eval_outputs(fct(n, 3))
                    assert False
                except ValueError, e:
                    pass
@@ -1669,13 +1645,13 @@ class T_argmin_argmax(unittest.TestCase):
                _logger.setLevel(oldlevel)

    def test2_invalid_neg(self):
        for fct, nfct in [(argmax, numpy.argmax), (argmin, numpy.argmin)]:
            n = as_tensor_variable(numpy.random.rand(2, 3))
            old_stderr = sys.stderr
            sys.stderr = StringIO.StringIO()
            try:
                try:
                    eval_outputs(fct(n, -3))
                    assert False
                except ValueError, e:
                    pass
@@ -1683,286 +1659,262 @@ class T_argmin_argmax(unittest.TestCase):
                sys.stderr = old_stderr

    def test2_valid_neg(self):
        for fct, nfct in [(argmax, numpy.argmax), (argmin, numpy.argmin)]:
            n = as_tensor_variable(numpy.random.rand(2, 3))
            i = eval_outputs(fct(n, -1))
            self.assertTrue(i.shape == (2,))
            self.assertTrue(numpy.all(i == nfct(n.value, -1)))
            i = eval_outputs(fct(n, -2))
            self.assertTrue(i.shape == (3,))
            self.assertTrue(numpy.all(i == nfct(n.value, -2)))
            v = eval_outputs(fct(n, -1).shape)
            assert v == (2)
            v = eval_outputs(fct(n, -2).shape)
            assert v == (3)

    def test3(self):
-        for fct, nfct in [(argmax, numpy.argmax), (argmin, numpy.argmin)]:
-            n = as_tensor_variable(numpy.random.rand(2, 3, 4))
-            i = eval_outputs(fct(n, 0))
-            self.assertTrue(i.shape == (3, 4))
-            self.assertTrue(numpy.all(i == nfct(n.value, 0)))
-            i = eval_outputs(fct(n, 1))
-            self.assertTrue(i.shape == (2, 4))
-            self.assertTrue(numpy.all(i == nfct(n.value, 1)))
-            i = eval_outputs(fct(n, 2))
-            self.assertTrue(i.shape == (2, 3))
-            self.assertTrue(numpy.all(i == nfct(n.value, 2)))
-            v = eval_outputs(fct(n, 0).shape)
-            assert tuple(v) == (3, 4)
-            v = eval_outputs(fct(n, 1).shape)
-            assert tuple(v) == (2, 4)
-            v = eval_outputs(fct(n, 2).shape)
-            assert tuple(v) == (2, 3)
+        data = numpy.random.rand(2, 3, 4)
+        n = as_tensor_variable(data)
+        for fct, nfct in [(argmax, numpy.argmax), (argmin, numpy.argmin)]:
+            for (axis, np_axis) in [(-1, -1), (0, 0), (1, 1), (2, 2),
+                                    (None, None), ([0, 1, 2], None),
+                                    ([1, 0, 2], None)]:
+                v = eval_outputs(fct(n, axis))
+                self.assertTrue(numpy.all(v == nfct(data, np_axis)))
+                v_shape = eval_outputs(fct(n, axis).shape)
+                assert tuple(v_shape) == nfct(data, np_axis).shape

    def test_grad_argmin(self):
        data = numpy.random.rand(2, 3)
        n = as_tensor_variable(data)

        #test grad of argmin
        utt.verify_grad(lambda v: argmin(v, axis=-1), [data])
        utt.verify_grad(lambda v: argmin(v, axis=[0]), [data])
        utt.verify_grad(lambda v: argmin(v, axis=[1]), [data])
        utt.verify_grad(lambda v: argmin(v.flatten()), [data])

        try:
            grad(argmin(n, axis=-1), n)
            raise Exception('Expected an error')
        except TypeError:
            pass

    def test_grad_argmax(self):
        data = numpy.random.rand(2, 3)
        n = as_tensor_variable(data)

        #test grad of argmax
        utt.verify_grad(lambda v: argmax(v, axis=-1), [data])
        utt.verify_grad(lambda v: argmax(v, axis=[0]), [data])
        utt.verify_grad(lambda v: argmax(v, axis=[1]), [data])
        utt.verify_grad(lambda v: argmax(v.flatten()), [data])

        try:
            grad(argmax(n, axis=-1), n)
            raise Exception('Expected an error')
        except TypeError:
            pass
class T_min_max(unittest.TestCase):
    def setUp(self):
        utt.seed_rng()
        MaxAndArgmax.debug = 0

-    def test0(self):
+    def test_scalar(self):
        for fct in [max, min]:
            n = as_tensor_variable(5.0)
            v = eval_outputs(fct(n))
            self.assertTrue(v == 5.0)
            v = eval_outputs(fct(n).shape)
            assert len(v) == 0

-    def test1(self):
+    def test_list(self):
        for fct, nfct in [(max, numpy.max), (min, numpy.min)]:
            n = as_tensor_variable([1, 2, 3, 2, -6])
            v = eval_outputs([fct(n)])
            self.assertTrue(v == nfct(n.value))
            v = eval_outputs(fct(n).shape)
            assert len(v) == 0

    def test2(self):
-        for fct, nfct in [(max, numpy.max), (min, numpy.min)]:
-            data = numpy.random.rand(2, 3)
-            n = as_tensor_variable(data)
-            v = eval_outputs(fct(n, -1))
-            self.assertTrue(numpy.all(v == nfct(data, -1)))
-            v = eval_outputs(fct(n, -1).shape)
-            assert v == (2)
-
-    def test2b(self):
-        for fct, nfct in [(max, numpy.max), (min, numpy.min)]:
-            data = numpy.random.rand(2, 3)
-            n = as_tensor_variable(data)
-            v = eval_outputs(fct(n, 0))
-            self.assertTrue(numpy.all(v == nfct(data, 0)))
-            v = eval_outputs(fct(n, 0).shape)
-            assert v == (3)
-            v = eval_outputs(fct(n, 1).shape)
-            assert v == (2)
-            v = eval_outputs(fct(n, [0, 1]).shape)
-            assert v.size == 0
+        data = numpy.random.rand(2, 3)
+        n = as_tensor_variable(data)
+        for fct, nfct in [(max, numpy.max), (min, numpy.min)]:
+            for (axis, np_axis) in [(-1, -1), (0, 0), (1, 1), (None, None),
+                                    ([0, 1], None), ([1, 0], None)]:
+                v = eval_outputs(fct(n, axis))
+                self.assertTrue(numpy.all(v == nfct(data, np_axis)))
+                v_shape = eval_outputs(fct(n, axis).shape)
+                assert tuple(v_shape) == nfct(data, np_axis).shape

    def test2_invalid(self):
        for fct in [max, min]:
            n = as_tensor_variable(numpy.random.rand(2, 3))
            # Silence expected error messages
            _logger = logging.getLogger('theano.gof.opt')
            oldlevel = _logger.level
            _logger.setLevel(logging.CRITICAL)
            try:
                try:
                    eval_outputs(fct(n, 3))
                    assert False
                except ValueError, e:
                    pass
            finally:
                _logger.setLevel(oldlevel)

    def test2_invalid_neg(self):
        for fct in [max, min]:
            n = as_tensor_variable(numpy.random.rand(2, 3))
            old_stderr = sys.stderr
            sys.stderr = StringIO.StringIO()
            try:
                try:
                    eval_outputs(fct(n, -3))
                    assert False
                except ValueError, e:
                    pass
            finally:
                sys.stderr = old_stderr

    def test2_valid_neg(self):
        for fct, nfct in [(max, numpy.max), (min, numpy.min)]:
            n = as_tensor_variable(numpy.random.rand(2, 3))
            v = eval_outputs(fct(n, -1))
            self.assertTrue(v.shape == (2,))
            self.assertTrue(numpy.all(v == nfct(n.value, -1)))
            v = eval_outputs(fct(n, -2))
            self.assertTrue(v.shape == (3,))
            self.assertTrue(numpy.all(v == nfct(n.value, -2)))
            v = eval_outputs(fct(n, -1).shape)
            assert v == (2)
            v = eval_outputs(fct(n, -2).shape)
            assert v == (3)

    def test3(self):
-        for fct, nfct in [(max, numpy.max), (min, numpy.min)]:
-            n = as_tensor_variable(numpy.random.rand(2, 3, 4))
-            v = eval_outputs(fct(n, 0))
-            self.assertTrue(v.shape == (3, 4))
-            self.assertTrue(numpy.all(v == nfct(n.value, 0)))
-            v = eval_outputs(fct(n, 1))
-            self.assertTrue(v.shape == (2, 4))
-            self.assertTrue(numpy.all(v == nfct(n.value, 1)))
-            v = eval_outputs(fct(n, 2))
-            self.assertTrue(v.shape == (2, 3))
-            self.assertTrue(numpy.all(v == nfct(n.value, 2)))
-            v = eval_outputs(fct(n, [0, 1]))
-            self.assertTrue(v.shape == (4,))
-            self.assertTrue(numpy.all(v == nfct(nfct(n.value, 1), 0)))
-            v = eval_outputs(fct(n, [0, 2]))
-            self.assertTrue(v.shape == (3,))
-            self.assertTrue(numpy.all(v == nfct(nfct(n.value, 2), 0)))
-            v = eval_outputs(fct(n, [1, 2]))
-            self.assertTrue(v.shape == (2,))
-            self.assertTrue(numpy.all(v == nfct(nfct(n.value, 2), 1)))
-            v = eval_outputs(fct(n, [0, 1, 2]))
-            self.assertTrue(v.shape == ())
-
-            v = eval_outputs(fct(n, 0).shape)
-            assert tuple(v) == (3, 4)
-            v = eval_outputs(fct(n, 1).shape)
-            assert tuple(v) == (2, 4)
-            v = eval_outputs(fct(n, 2).shape)
-            assert tuple(v) == (2, 3)
-            v = eval_outputs(fct(n, [0, 1]).shape)
-            self.assertTrue(v == (4,))
-            v = eval_outputs(fct(n, [0, 2]).shape)
-            self.assertTrue(v == (3,))
-            v = eval_outputs(fct(n, [1, 2]).shape)
-            self.assertTrue(v == (2,))
-            v = eval_outputs(fct(n, [0, 1, 2]).shape)
-            self.assertTrue(v.size == 0)
+        # Test with 1 axis or all axes out of 3 dims
+        data = numpy.random.rand(2, 3, 4)
+        n = as_tensor_variable(data)
+        for fct, nfct in [(max, numpy.max), (min, numpy.min)]:
+            for (axis, np_axis) in [(-1, -1), (0, 0), (1, 1), (2, 2),
+                                    (None, None), ([0, 1, 2], None),
+                                    ([1, 0, 2], None)]:
+                v = eval_outputs(fct(n, axis))
+                self.assertTrue(numpy.all(v == nfct(data, np_axis)))
+                v_shape = eval_outputs(fct(n, axis).shape)
+                assert tuple(v_shape) == nfct(data, np_axis).shape
+
+    def test3b(self):
+        # Test with 2 axes out of 3 dims
+        data = numpy.random.rand(2, 3, 4)
+        n = as_tensor_variable(data)
+        for fct, nfct in [(max, numpy.max), (min, numpy.min)]:
+            for axis in [[0, 1], [1, 2], [0, 2]]:
+                v = eval_outputs(fct(n, axis))
+                np_v = nfct(nfct(data, axis[1]), axis[0])
+                self.assertTrue(numpy.all(v == np_v))
+                v_shape = eval_outputs(fct(n, axis).shape)
+                assert tuple(v_shape) == np_v.shape
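test3b relies on reducing two axes being equal to two successive single-axis reductions, taking the higher axis first so the remaining axis numbering stays valid:

    import numpy

    data = numpy.random.rand(2, 3, 4)
    # Reduce axes [0, 2]: take axis 2 first, then axis 0.
    step = numpy.max(numpy.max(data, axis=2), axis=0)
    assert step.shape == (3,)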
    def test_grad_max(self):
        data = numpy.random.rand(2, 3)
        n = as_tensor_variable(data)

        def check_grad_max(data, max_grad_data, axis=None):
            #This works only for axis in [0, None]
            assert axis in [0, None]
            z = numpy.zeros_like(data)
            z = z.flatten()
            argmax = numpy.argmax(data, axis=axis)
            if argmax.ndim == 0:
                z[numpy.argmax(data, axis=axis)] += 1
            else:
                for id, v in enumerate(argmax):
                    z[v * numpy.prod(data.shape[data.ndim - 1:axis:-1])
                      + id] += 1
            z = z.reshape(data.shape)
            assert numpy.all(max_grad_data == z)

        #test grad of max
        #axis is the last one
        utt.verify_grad(lambda v: max(v, axis=-1), [data])

        utt.verify_grad(lambda v: max(v, axis=[0]), [data])
        check_grad_max(data, eval_outputs(grad(max(n, axis=0).sum(), n)),
                       axis=0)

        utt.verify_grad(lambda v: max(v, axis=[1]), [data])
        #check_grad_max(data, eval_outputs(grad(max(n, axis=1), n)), axis=1)

        utt.verify_grad(lambda v: max(v.flatten()), [data])
        check_grad_max(data, eval_outputs(grad(max(n.flatten()), n)))

    def test_grad_min(self):
        data = numpy.random.rand(2, 3)
        n = as_tensor_variable(data)

        def check_grad_min(data, min_grad_data, axis=None):
            #This works only for axis in [0, None]
            assert axis in [0, None]
            z = numpy.zeros_like(data)
            z = z.flatten()
            argmin = numpy.argmin(data, axis=axis)
            if argmin.ndim == 0:
                z[numpy.argmin(data, axis=axis)] += 1
            else:
                for id, v in enumerate(argmin):
                    z[v * numpy.prod(data.shape[data.ndim - 1:axis:-1])
                      + id] += 1
            z = z.reshape(data.shape)
            assert numpy.all(min_grad_data == z)

        #test grad of min
        #axis is the last one
        utt.verify_grad(lambda v: min(v, axis=-1), [data])

        utt.verify_grad(lambda v: min(v, axis=[0]), [data])
        check_grad_min(data, eval_outputs(grad(min(n, axis=0).sum(), n)),
                       axis=0)

        utt.verify_grad(lambda v: min(v, axis=[1]), [data])
        #check_grad_min(data, eval_outputs(grad(min(n, axis=1), n)), axis=1)

        utt.verify_grad(lambda v: min(v.flatten()), [data])
        check_grad_min(data, eval_outputs(grad(min(n.flatten()), n)))

    def _grad_list(self):
        """
        Test the gradient when we have multiple axes at the same time.

        This is not implemented, so we disable the test. See ticket:
        http://trac-hg.assembla.com/theano/ticket/511
        """
        data = numpy.random.rand(2, 3)
        n = as_tensor_variable(data)
        for fct in [max_and_argmax, max, min]:
            utt.verify_grad(lambda v: fct(v, axis=[0, 1]), [data])
        #check_grad_max(data, eval_outputs(grad(max_and_argmax(n,
        #    axis=1)[0], n)), axis=1)
class T_subtensor(unittest.TestCase):
    """
    This is built in a way that allows reuse for testing the
    equivalent GPU op.
    """
    def __init__(self, name, shared=_shared,
                 sub=tensor.Subtensor,
...
@@ -13,91 +13,95 @@ from theano.tests import unittest_tools as utt
class T_max_and_argmax(unittest.TestCase):
    def test_optimization(self):
        #If we use only the max output, we should replace this op with
        #a faster one.
        mode = theano.compile.mode.get_default_mode().including(
            'canonicalize', 'fast_run')

        for axis in [0, 1, -1]:
            data = numpy.asarray(numpy.random.rand(2, 3), dtype=config.floatX)
            n = tensor.matrix()

            f = function([n], tensor.max_and_argmax(n, axis)[0], mode=mode)
            topo = f.maker.env.toposort()
            assert len(topo) == 1
            assert isinstance(topo[0].op, CAReduce)

            f = function([n], tensor.max_and_argmax(n, axis), mode=mode)
            topo = f.maker.env.toposort()
            assert len(topo) == 1
            assert isinstance(topo[0].op, tensor.MaxAndArgmax)


class T_min_max(unittest.TestCase):
    def setUp(self):
        utt.seed_rng()
        self.mode = theano.compile.mode.get_default_mode().including(
            'canonicalize', 'fast_run')

    def test_optimization_max(self):
        data = numpy.asarray(numpy.random.rand(2, 3), dtype=config.floatX)
        n = tensor.matrix()

        for axis in [0, 1, -1]:
            f = function([n], tensor.max(n, axis), mode=self.mode)
            topo = f.maker.env.toposort()
            assert len(topo) == 1
            assert isinstance(topo[0].op, CAReduce)
            f(data)

            f = function([n], tensor.max(-n, axis), mode=self.mode)
            topo = f.maker.env.toposort()
            assert len(topo) == 2
            assert isinstance(topo[0].op, Elemwise)
            assert isinstance(topo[0].op.scalar_op, scalar.Neg)
            assert isinstance(topo[1].op, CAReduce)
            f(data)

            f = function([n], -tensor.max(n, axis), mode=self.mode)
            topo = f.maker.env.toposort()
            assert len(topo) == 2
            assert isinstance(topo[0].op, CAReduce)
            assert isinstance(topo[1].op, Elemwise)
            assert isinstance(topo[1].op.scalar_op, scalar.Neg)
            f(data)

            f = function([n], -tensor.max(-n, axis), mode=self.mode)
            topo = f.maker.env.toposort()
            assert len(topo) == 1
            assert isinstance(topo[0].op, CAReduce)  # min
            f(data)

    def test_optimization_min(self):
        data = numpy.asarray(numpy.random.rand(2, 3), dtype=config.floatX)
        n = tensor.matrix()

        for axis in [0, 1, -1]:
            f = function([n], tensor.min(n, axis), mode=self.mode)
            topo = f.maker.env.toposort()
            assert len(topo) == 1
            assert isinstance(topo[0].op, CAReduce)
            f(data)

            #test variant with neg to make sure we optimize correctly
            f = function([n], tensor.min(-n, axis), mode=self.mode)
            topo = f.maker.env.toposort()
            assert len(topo) == 2
            assert isinstance(topo[0].op, CAReduce)  # max
            assert isinstance(topo[1].op, Elemwise)
            assert isinstance(topo[1].op.scalar_op, scalar.Neg)
            f(data)

            f = function([n], -tensor.min(n, axis), mode=self.mode)
            topo = f.maker.env.toposort()
            assert len(topo) == 2
            assert isinstance(topo[0].op, Elemwise)
            assert isinstance(topo[0].op.scalar_op, scalar.Neg)
            assert isinstance(topo[1].op, CAReduce)  # max
            f(data)

            f = function([n], -tensor.min(-n, axis), mode=self.mode)
            topo = f.maker.env.toposort()
            assert len(topo) == 1
            assert isinstance(topo[0].op, CAReduce)  # max
            f(data)
@@ -350,27 +350,6 @@ def makeSharedTester(shared_constructor_,
        assert may_share_memory(old_data, x_shared.container.storage[0])
        x_shared.get_value(borrow=True)

-        # Test by .value
-        # As we know that .value is deprecated, we filter out the warning
-        warnings.filterwarnings(
-                action='ignore',
-                message='The .value property of shared variables is deprecated.'
-                )
-        try:
-            nd += 1
-            old_data = x_shared.container.storage[0]
-            x_shared.value = nd
-            assert numpy.allclose(self.ref_fct(x_shared.value),
-                                  self.ref_fct(self.cast_value(nd)))
-            assert may_share_memory(
-                old_data,
-                x_shared.container.storage[0]) == self.set_value_inplace
-        finally:
-            # Restore the default behavior.
-            # TODO There is a cleaner way to do this in Python 2.6, once
-            # Theano drops support of Python 2.4 and 2.5.
-            warnings.filterwarnings(
-                    action='default',
-                    message='The .value property of shared variables is deprecated.'
-                    )

        # Test by set_value with borrow=False
        nd += 1
        old_data = x_shared.container.storage[0]
...
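The remaining checks exercise the get_value/set_value borrow contract that replaces the removed .value tests. A minimal sketch of that contract:

    import numpy
    import theano

    s = theano.shared(numpy.ones(4))
    internal = s.container.storage[0]
    copied = s.get_value()            # borrow=False: never aliases internal storage
    assert not numpy.may_share_memory(copied, internal)
    maybe = s.get_value(borrow=True)  # may alias, depending on the backend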