Commit ab56ecc1 authored by Olivier Delalleau

Merge pull request #549 from lamblin/pep8

Pep8
from theano import gof
from theano import gradient as G
from function_module import orig_function
......@@ -33,16 +32,19 @@ class OpFromGraph(gof.Op):
e2 = op(x, y, z) + op(z, y, x)
fn = function([x, y, z], [e2])
"""
def __init__(self, inputs, outputs, grad_depth = 1, **kwargs):
def __init__(self, inputs, outputs, grad_depth=1, **kwargs):
if not isinstance(outputs, list):
raise TypeError('outputs must be list', outputs)
for i in inputs + outputs:
if not isinstance(i, gof.Variable):
raise TypeError('inputs and outputs must be Variable instances', i)
raise TypeError(
'inputs and outputs must be Variable instances', i)
if 'updates' in kwargs:
raise TypeError('updates are not allowed in kwargs')
# TODO: the graph may have implicit inputs like Value and SharedVariable instances.
# TODO: the graph may have implicit inputs like Value and
# SharedVariable instances.
# what impact do they have on the validity of this Op?
self.fn = orig_function(inputs, outputs, **kwargs)
self.inputs = inputs
......@@ -52,7 +54,8 @@ class OpFromGraph(gof.Op):
if grad_depth > 0:
output_grads = [t() for t in self.output_types]
gd = G.grad_sources_inputs(zip(self.outputs, output_grads), self.inputs)
gd = G.grad_sources_inputs(zip(self.outputs, output_grads),
self.inputs)
gs = map(gd.get, self.inputs)
self.grad_ops = []
for g in gs:
......@@ -63,8 +66,9 @@ class OpFromGraph(gof.Op):
# to compute the gradient, so we ignore them.
self.grad_ops.append(OpFromGraph(inputs + output_grads,
[g],
grad_depth = grad_depth - 1,
grad_depth=grad_depth - 1,
on_unused_input='ignore'))
def __eq__(self, other):
#TODO: recognize a copy
return self is other
......@@ -76,7 +80,8 @@ class OpFromGraph(gof.Op):
def make_node(self, *inputs):
for input, type in zip(inputs, self.input_types):
if not type == input.type:
raise TypeError("Wrong type, expected %s but got %s" % (type, input.type))
raise TypeError("Wrong type, expected %s but got %s"
% (type, input.type))
return gof.Apply(self,
inputs,
[type() for type in self.output_types])
......@@ -85,8 +90,8 @@ class OpFromGraph(gof.Op):
variables = self.fn(*inputs)
assert len(variables) == len(outputs)
for output, variable in zip(outputs, variables):
##TODO: when function's output-borrowing semantics are correct, we won't need this
# copy anymore
##TODO: when function's output-borrowing semantics are correct,
# we won't need this copy anymore
output[0] = variable.copy()
def grad(self, inputs, output_grads):
......@@ -94,5 +99,3 @@ class OpFromGraph(gof.Op):
return [go(*(inputs + output_grads)) for go in self.grad_ops]
else:
raise NotImplementedError
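# --- Hedged usage sketch (editor's addition, not part of this commit) ---
# A minimal, self-contained example of wrapping a small graph with the
# OpFromGraph class defined above, completing the docstring fragment.
# The scalar variables and the final `function` call mirror the docstring;
# the import line is an assumption about the Theano API of this era.
from theano import function, tensor

x, y, z = tensor.scalars('x', 'y', 'z')
e = x + y * z
op = OpFromGraph([x, y, z], [e])    # wrap e(x, y, z) as a single reusable Op
e2 = op(x, y, z) + op(z, y, x)      # apply the wrapped Op twice in a new graph
fn = function([x, y, z], [e2])      # compile as usual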
import sys
import numpy
from theano import config
......@@ -10,36 +9,43 @@ import theano.compile
from theano.tests import unittest_tools as utt
import unittest
def test0():
x = theano.tensor.dvector()
f = theano.function([x], (2.*x + 7) / 2., mode=debugmode.DebugMode())
print f([1,2])
f = theano.function([x], ((2. * x) + 7) / 2., mode=debugmode.DebugMode())
print f([1, 2])
class BROKEN_ON_PURPOSE_Add(gof.Op):
def __init__(self, py_offset):
gof.Op.__init__(self)
self.py_offset = py_offset
def __eq__(self, other):
return type(self) == type(other) and (self.py_offset == other.py_offset)
return (type(self) == type(other) and
(self.py_offset == other.py_offset))
def __hash__(self):
return 29834 ^ hash(type(self)) ^ hash(self.py_offset)
def make_node(self, a, b):
a = theano.tensor.as_tensor_variable(a)
b = theano.tensor.as_tensor_variable(b)
assert a.type.dtype == 'float64'
assert a.type.dtype == b.type.dtype
assert a.type.ndim==1
assert a.type.ndim == 1
r = gof.Apply(self, [a, b], [a.type()])
return r
def perform(self, node, inp, out_):
a, b = inp
out, = out_
z = a+b
z = a + b
#ERROR TO ADD THIS CRAPPY OFFSET
if self.py_offset:
out[0] = z+0.5
else: out[0] = z
out[0] = z + 0.5
else:
out[0] = z
def c_code(self, node, name, inp, out, sub):
a, b = inp
......@@ -76,26 +82,30 @@ class BROKEN_ON_PURPOSE_Add(gof.Op):
+ ((double*)PyArray_GETPTR1(%(b)s, m))[0] ;
}
}
"""% dict(locals(), **sub)
""" % dict(locals(), **sub)
# inconsistent is an invalid op, whose perform and c_code do not match
inconsistent = BROKEN_ON_PURPOSE_Add(False)
# off_by_half is a good op, that is different from theano.sparse.sd_csc
off_by_half = BROKEN_ON_PURPOSE_Add(True)
class WeirdBrokenOp(gof.Op):
"""
This op can be inplace if behaviour is 'times1_inplace'
This op can be destructive if behaviour is 'times2_inplace'
In both cases, it does not set the destroy_map or view_map correctly so it should raise an
error in DebugMode.
In both cases, it does not set the destroy_map or view_map correctly so
it should raise an error in DebugMode.
"""
def __init__(self, behaviour):
gof.Op.__init__(self)
self.behaviour = behaviour
def __eq__(self, other):
return type(self) == type(other) and (self.behaviour == other.behaviour)
return (type(self) == type(other)
and (self.behaviour == other.behaviour))
def __hash__(self):
return hash(type(self)) ^ hash(self.behaviour)
......@@ -168,7 +178,8 @@ class WeirdBrokenOp(gof.Op):
}
"""
total = (z_code + prep_vars + behaviour + prep_vars2)% dict(locals(), **sub)
total = ((z_code + prep_vars + behaviour + prep_vars2)
% dict(locals(), **sub))
return total
wb2i = WeirdBrokenOp('times2_inplace')
......@@ -176,6 +187,7 @@ wb2 = WeirdBrokenOp('times2')
wb1i = WeirdBrokenOp('times1_inplace')
wb1 = WeirdBrokenOp('times1')
def test_badclinkeroutput():
a = theano.tensor.dvector()
......@@ -184,20 +196,20 @@ def test_badclinkeroutput():
f_good = theano.function([a, b],
off_by_half(a, b),
mode=debugmode.DebugMode(check_c_code=True))
f_inconsistent = theano.function([a,b],
f_inconsistent = theano.function([a, b],
inconsistent(a, b),
mode=debugmode.DebugMode(check_c_code=True))
#this should evaluate with no error
f_good([1.0, 2.0, 3.0], [2,3,4])
f_good([1.0, 2.0, 3.0], [2, 3, 4])
try:
f_inconsistent([1.0, 2.0, 3.0], [2,3,4])
f_inconsistent([1.0, 2.0, 3.0], [2, 3, 4])
except debugmode.BadCLinkerOutput, e:
print repr(e)
assert e.r.owner.op is inconsistent
return #TEST PASS
return # TEST PASS
assert False #an error should have been detected
assert False # an error should have been detected
def test_badoptimization():
......@@ -213,22 +225,24 @@ def test_badoptimization():
a = theano.tensor.dvector()
b = theano.tensor.dvector()
f = theano.function([a, b], a+b,
f = theano.function([a, b], a + b,
mode=debugmode.DebugMode(optimizer=opt, check_c_code=True))
try:
rval = f([1.0, 2.0, 3.0], [2,3,4],)
f([1.0, 2.0, 3.0], [2, 3, 4],)
except debugmode.BadOptimization, e:
assert str(e.reason) == 'insert_broken_add'
return #TEST PASS
return # TEST PASS
assert False
def test_stochasticoptimization():
# this optimization alternates between triggering and not triggering.
last_time_replaced=[False]
last_time_replaced = [False]
@gof.local_optimizer([theano.tensor.add])
def insert_broken_add_sometimes(node):
if node.op == theano.tensor.add:
......@@ -236,32 +250,39 @@ def test_stochasticoptimization():
if last_time_replaced[0]:
return [off_by_half(*node.inputs)]
return False
edb = gof.EquilibriumDB()
edb.register('insert_broken_add_sometimes', insert_broken_add_sometimes, 'all')
edb.register(
'insert_broken_add_sometimes',
insert_broken_add_sometimes,
'all')
opt = edb.query('+all')
a = theano.tensor.dvector()
b = theano.tensor.dvector()
try:
f = theano.function([a, b],
theano.function([a, b],
theano.tensor.add(a, b),
mode=debugmode.DebugMode(optimizer=opt, check_c_code=True))
except debugmode.StochasticOrder:
return #TEST PASS
return # TEST PASS
assert False
def test_just_c_code():
x = theano.tensor.dvector()
f = theano.function([x], wb2(x), mode=debugmode.DebugMode(check_py_code=False))
assert numpy.all(f([1,2]) == [2, 4])
f = theano.function([x], wb2(x),
mode=debugmode.DebugMode(check_py_code=False))
assert numpy.all(f([1, 2]) == [2, 4])
def test_baddestroymap():
class BadAdd(gof.Op):
def make_node(self, a, b):
c = a.type()
return gof.Apply(self, [a,b], [c])
return gof.Apply(self, [a, b], [c])
def perform(self, node, inp, out):
a, b = inp
c, = out
......@@ -270,20 +291,22 @@ def test_baddestroymap():
x = theano.tensor.dvector()
y = theano.tensor.dvector()
f = theano.function([x, y], BadAdd()(x,y), mode='DEBUG_MODE')
f = theano.function([x, y], BadAdd()(x, y), mode='DEBUG_MODE')
try:
f([1,2], [3,4])
assert False #failed to raise error
f([1, 2], [3, 4])
assert False # failed to raise error
except debugmode.BadDestroyMap:
pass
def test_baddestroymap_c():
x = theano.tensor.dvector()
f = theano.function([x], wb2i(x), mode=debugmode.DebugMode(check_py_code=False))
f = theano.function([x], wb2i(x),
mode=debugmode.DebugMode(check_py_code=False))
try:
assert numpy.all(f([1,2]) == [2, 4])
assert False #failed to raise error
assert numpy.all(f([1, 2]) == [2, 4])
assert False # failed to raise error
except debugmode.BadDestroyMap:
pass
......@@ -293,7 +316,8 @@ class Test_ViewMap(unittest.TestCase):
class BadAddRef(gof.Op):
def make_node(self, a, b):
c = b.type()
return gof.Apply(self, [a,b], [c])
return gof.Apply(self, [a, b], [c])
def perform(self, node, inp, out):
a, b = inp
c, = out
......@@ -302,7 +326,8 @@ class Test_ViewMap(unittest.TestCase):
class BadAddSlice(gof.Op):
def make_node(self, a, b):
c = b.type()
return gof.Apply(self, [a,b], [c])
return gof.Apply(self, [a, b], [c])
def perform(self, node, inp, out):
a, b = inp
c, = out
......@@ -311,20 +336,21 @@ class Test_ViewMap(unittest.TestCase):
def test_badviewmap_ref(self):
x = theano.tensor.dvector()
y = theano.tensor.dvector()
f = theano.function([x, y], self.BadAddRef()(x,y), mode='DEBUG_MODE')
f = theano.function([x, y], self.BadAddRef()(x, y), mode='DEBUG_MODE')
try:
f([1,2], [3,4])
assert False #failed to raise error
f([1, 2], [3, 4])
assert False # failed to raise error
except debugmode.BadViewMap:
return
def test_badviewmap_slice(self):
x = theano.tensor.dvector()
y = theano.tensor.dvector()
f = theano.function([x, y], self.BadAddSlice()(x,y), mode='DEBUG_MODE')
f = theano.function([x, y], self.BadAddSlice()(x, y),
mode='DEBUG_MODE')
try:
f([1,2], [3,4])
assert False #failed to raise error
f([1, 2], [3, 4])
assert False # failed to raise error
except debugmode.BadViewMap:
return
......@@ -333,31 +359,34 @@ class Test_ViewMap(unittest.TestCase):
goodop.view_map = {0: [1]}
x = theano.tensor.dvector()
y = theano.tensor.dvector()
f = theano.function([x, y], goodop(x,y), mode='DEBUG_MODE')
f = theano.function([x, y], goodop(x, y), mode='DEBUG_MODE')
try:
f([1,5,1], [3,4,2,1,4])
f([1, 5, 1], [3, 4, 2, 1, 4])
return
except debugmode.BadViewMap:
assert False #failed to raise error
assert False # failed to raise error
def test_badviewmap_c(self):
x = theano.tensor.dvector()
f = theano.function([x], wb1i(x), mode=debugmode.DebugMode(check_py_code=False))
f = theano.function([x], wb1i(x),
mode=debugmode.DebugMode(check_py_code=False))
try:
f([1,2])
assert False #failed to raise error
f([1, 2])
assert False # failed to raise error
except debugmode.BadViewMap:
pass
def test_aliased_outputs_ok(self):
#here aliased outputs is ok because they are both aliased to an input as well
# here aliased outputs is ok because they are both aliased to an input
# as well
class CustomOp(gof.Op):
view_map = {0:[0], 1:[0]}
view_map = {0: [0], 1: [0]}
def make_node(self, a, b):
c = a.type()
d = a.type()
return gof.Apply(self, [a,b], [c,d])
return gof.Apply(self, [a, b], [c, d])
def perform(self, node, inp, out):
a, b = inp
c, d = out
......@@ -366,21 +395,22 @@ class Test_ViewMap(unittest.TestCase):
x = theano.tensor.dvector('x')
y = theano.tensor.dvector('y')
f = theano.function([x, y], CustomOp()(x,y), mode='DEBUG_MODE')
f = theano.function([x, y], CustomOp()(x, y), mode='DEBUG_MODE')
r0, r1 = f([1,2,3,4],[5,6,7,8])
r0, r1 = f([1, 2, 3, 4], [5, 6, 7, 8])
assert numpy.all(r0 == [1,2,3,4])
assert numpy.all(r1 == [2,3,4])
assert numpy.all(r0 == [1, 2, 3, 4])
assert numpy.all(r1 == [2, 3, 4])
def test_aliased_outputs_ok_output(self):
# here aliased outputs is ok because they are both outputs of the function as a whole and
# thus not destroy-able
# here aliased outputs is ok because they are both outputs of the
# function as a whole and thus not destroy-able
class CustomOp(gof.Op):
def make_node(self, a, b):
c = a.type()
d = a.type()
return gof.Apply(self, [a,b], [c,d])
return gof.Apply(self, [a, b], [c, d])
def perform(self, node, inp, out):
a, b = inp
c, d = out
......@@ -390,22 +420,23 @@ class Test_ViewMap(unittest.TestCase):
x = theano.tensor.dvector()
y = theano.tensor.dvector()
f = theano.function([x, y], CustomOp()(x,y), mode='DEBUG_MODE')
f = theano.function([x, y], CustomOp()(x, y), mode='DEBUG_MODE')
r0, r1 = f([1,2,3,4],[5,6,7,8])
r0, r1 = f([1, 2, 3, 4], [5, 6, 7, 8])
assert numpy.all(r0 == [2,4,6,8])
assert numpy.all(r1 == [4,6,8])
assert numpy.all(r0 == [2, 4, 6, 8])
assert numpy.all(r1 == [4, 6, 8])
def test_aliased_outputs_ok_shadow(self):
# here the alias between outputs is ok because one of them is not used for subsequent
# computation. This is like the case where we use one output as a memory buffer to serve
# another output.
# here the alias between outputs is ok because one of them is not used
# for subsequent computation. This is like the case where we use one
# output as a memory buffer to serve another output.
class CustomOp(gof.Op):
def make_node(self, a, b):
c = a.type()
d = a.type()
return gof.Apply(self, [a,b], [c,d])
return gof.Apply(self, [a, b], [c, d])
def perform(self, node, inp, out):
a, b = inp
c, d = out
......@@ -415,27 +446,29 @@ class Test_ViewMap(unittest.TestCase):
x = theano.tensor.dvector('x')
y = theano.tensor.dvector('y')
f = theano.function([x, y], CustomOp()(x,y)[0] * 2, mode='DEBUG_MODE')
f = theano.function([x, y], CustomOp()(x, y)[0] * 2, mode='DEBUG_MODE')
r0 = f([1,2,3,4],[5,6,7,8])
assert numpy.all(r0 == [2,4,6,8])
r0 = f([1, 2, 3, 4], [5, 6, 7, 8])
assert numpy.all(r0 == [2, 4, 6, 8])
def test_aliased_outputs_bad(self):
# here the alias between outputs is not ok because destroying one destroys the other, but
# there's no way to warn theano about it through the view_map mechanism.
# here the alias between outputs is not ok because destroying one
# destroys the other, but there's no way to warn theano about it
# through the view_map mechanism.
class CustomOp(gof.Op):
def make_node(self, a, b):
c = a.type()
d = a.type()
return gof.Apply(self, [a,b], [c,d])
return gof.Apply(self, [a, b], [c, d])
def perform(self, node, inp, out):
a, b = inp
c, d = out
r = a * 1
c[0] = r[:-1]
d[0] = r[1:]
custom_op = CustomOp()
x = theano.tensor.dvector()
......@@ -445,68 +478,78 @@ class Test_ViewMap(unittest.TestCase):
f = theano.function([x, y], out, mode='DEBUG_MODE')
try:
r0 = f([1,2,3,4],[5,6,7,8])
assert False # DebugMode should have caught the error
f([1, 2, 3, 4], [5, 6, 7, 8])
assert False # DebugMode should have caught the error
except debugmode.BadViewMap, e:
print e
pass
# the situation can be rescued by picking one of the inputs and pretending that it is
# aliased to both the outputs. This unfairly disables any destructive operations on the
# the situation can be rescued by picking one of the inputs and
# pretending that it is aliased to both the outputs.
# This unfairly disables any destructive operations on the
# input, but guarantees correctness.
#custom_op.view_map = {0:[0], 1:[1]}
#f([1,2,3,4],[5,6,7,8])
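# --- Hedged illustration (editor's addition, not part of this commit) ---
# Spelling out the commented-out rescue above (sketch only):
#
#     custom_op.view_map = {0: [0], 1: [1]}
#     f = theano.function([x, y], custom_op(x, y), mode='DEBUG_MODE')
#     f([1, 2, 3, 4], [5, 6, 7, 8])
#
# With the view_map declared, DebugMode no longer reports a BadViewMap for
# the aliased outputs, at the cost of forbidding destructive optimizations
# on the corresponding inputs.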
class Test_check_isfinite(unittest.TestCase):
def setUp(self):
self.old_ts = theano.tensor.TensorType.filter_checks_isfinite
self.old_dm = theano.compile.mode.predefined_modes['DEBUG_MODE'].check_isfinite
self.old_dm = theano.compile.mode.predefined_modes[
'DEBUG_MODE'].check_isfinite
def tearDown(self):
theano.tensor.TensorType.filter_checks_isfinite = self.old_ts
theano.compile.mode.predefined_modes['DEBUG_MODE'].check_isfinite = self.old_dm
theano.compile.mode.predefined_modes[
'DEBUG_MODE'].check_isfinite = self.old_dm
def test_check_isfinite(self):
x = theano.tensor.vector()
f = theano.function([x], (x+2) * 5, mode='DEBUG_MODE')
f = theano.function([x], (x + 2) * 5, mode='DEBUG_MODE')
g = theano.function([x], theano.tensor.log(x), mode='DEBUG_MODE')
# this should work
f(numpy.log([3, 4, 5]).astype(config.floatX))
# if TensorType.filter_checks_isfinite were true, these would raise ValueError
# if TensorType.filter_checks_isfinite were true, these would raise
# ValueError
# if not, DebugMode will check internally, and raise InvalidValueError
# passing an invalid value as an input should trigger ValueError
self.assertRaises(debugmode.InvalidValueError, f,
numpy.log([3, -4, 5]).astype(config.floatX))
self.assertRaises(debugmode.InvalidValueError, f,
(numpy.asarray([0, 1.0, 0])/0).astype(config.floatX))
(numpy.asarray([0, 1.0, 0]) / 0).astype(config.floatX))
self.assertRaises(debugmode.InvalidValueError, f,
(numpy.asarray([1.0, 1.0, 1.0])/0).astype(config.floatX))
(numpy.asarray([1.0, 1.0, 1.0]) / 0).astype(config.floatX))
# generating an invalid value internally should trigger InvalidValueError
# generating an invalid value internally should trigger
# InvalidValueError
self.assertRaises(debugmode.InvalidValueError, g,
numpy.asarray([3,-4,5], dtype=config.floatX))
numpy.asarray([3, -4, 5], dtype=config.floatX))
# this should disable the exception
theano.tensor.TensorType.filter_checks_isfinite = False
theano.compile.mode.predefined_modes['DEBUG_MODE'].check_isfinite = False
theano.compile.mode.predefined_modes[
'DEBUG_MODE'].check_isfinite = False
# insert several Inf
f(numpy.asarray(numpy.asarray([1.0, 1.0, 1.0])/0, dtype=config.floatX))
f(numpy.asarray(numpy.asarray([1.0, 1.0, 1.0]) / 0,
dtype=config.floatX))
def test_check_isfinite_disabled(self):
x = theano.tensor.dvector()
f = theano.function([x], (x+2) * 5, mode=debugmode.DebugMode(check_isfinite=False))
f = theano.function([x], (x + 2) * 5,
mode=debugmode.DebugMode(check_isfinite=False))
#nan should go through
f(numpy.log([3, -4, 5]))
#inf should go through
infs = numpy.asarray([1.0,1.,1.])/0
infs = numpy.asarray([1.0, 1., 1.]) / 0
print infs
f(infs)
return
class Test_preallocated_output(unittest.TestCase):
class BrokenCImplementationAdd(gof.Op):
......@@ -521,7 +564,7 @@ class Test_preallocated_output(unittest.TestCase):
b = theano.tensor.as_tensor_variable(b)
assert a.type.dtype == 'float32'
assert a.type.dtype == b.type.dtype
assert a.type.ndim==2
assert a.type.ndim == 2
r = gof.Apply(self, [a, b], [a.type()])
return r
......@@ -595,17 +638,18 @@ class Test_preallocated_output(unittest.TestCase):
}
}
}
"""% dict(locals(), **sub)
""" % dict(locals(), **sub)
def test_f_contiguous(self):
a = theano.tensor.fmatrix('a')
b = theano.tensor.fmatrix('b')
z = self.BrokenCImplementationAdd()(a, b)
out = theano.tensor.dot(z, numpy.eye(7)) # Needed so that z is not the output of the graph
# Needed so that z is not the output of the graph
out = theano.tensor.dot(z, numpy.eye(7))
rng = numpy.random.RandomState(seed=utt.fetch_seed())
a_val = rng.randn(7,7).astype('float32')
b_val = rng.randn(7,7).astype('float32')
a_val = rng.randn(7, 7).astype('float32')
b_val = rng.randn(7, 7).astype('float32')
init_conf_val = config.DebugMode.check_preallocated_output
try:
......
import numpy
import unittest
import copy
import theano
from theano.tensor import Tensor, TensorType
from theano.compile.sharedvalue import *
class Test_SharedVariable(unittest.TestCase):
def test_ctors(self):
if 0: #when using an implementation that handles scalars with Scalar type
if 0:
# when using an implementation that handles scalars with
# Scalar type
assert shared(7).type == Scalar('int64')
assert shared(7.0).type == Scalar('float64')
assert shared(7, dtype='float64').type == Scalar('float64')
......@@ -24,14 +26,16 @@ class Test_SharedVariable(unittest.TestCase):
assert shared(numpy.float32(7)).type == theano.tensor.fscalar
# test tensor constructor
b = shared(numpy.zeros((5,5), dtype='int32'))
assert b.type == TensorType('int32', broadcastable=[False,False])
b = shared(numpy.random.rand(4,5))
assert b.type == TensorType('float64', broadcastable=[False,False])
b = shared(numpy.random.rand(5,1,2))
assert b.type == TensorType('float64', broadcastable=[False,False,False])
b = shared(numpy.zeros((5, 5), dtype='int32'))
assert b.type == TensorType('int32', broadcastable=[False, False])
b = shared(numpy.random.rand(4, 5))
assert b.type == TensorType('float64', broadcastable=[False, False])
b = shared(numpy.random.rand(5, 1, 2))
assert b.type == TensorType('float64',
broadcastable=[False, False, False])
assert shared([]).type == generic
def badfunc():
shared(7, bad_kw=False)
self.assertRaises(TypeError, badfunc)
......@@ -70,7 +74,7 @@ class Test_SharedVariable(unittest.TestCase):
SharedVariable(
name='u',
type=Tensor(broadcastable=[False], dtype='float64'),
value=[1, 2], #different dtype and not a numpy array
value=[1, 2], # different dtype and not a numpy array
strict=False)
# here the value is not castable, and we're not strict about it,
......@@ -79,7 +83,7 @@ class Test_SharedVariable(unittest.TestCase):
SharedVariable(
name='u',
type=Tensor(broadcastable=[False], dtype='float64'),
value=dict(), #not an array by any stretch
value=dict(), # not an array by any stretch
strict=False)
assert 0
except TypeError:
......@@ -96,10 +100,10 @@ class Test_SharedVariable(unittest.TestCase):
strict=False)
# check that assignments to value are cast properly
u.set_value([3,4])
u.set_value([3, 4])
assert type(u.get_value()) is numpy.ndarray
assert str(u.get_value(borrow=True).dtype) == 'float64'
assert numpy.all(u.get_value() == [3,4])
assert numpy.all(u.get_value() == [3, 4])
# check that assignments of nonsense fail
try:
......@@ -109,7 +113,7 @@ class Test_SharedVariable(unittest.TestCase):
pass
# check that an assignment of a perfect value results in no copying
uval = theano._asarray([5,6,7,8], dtype='float64')
uval = theano._asarray([5, 6, 7, 8], dtype='float64')
u.set_value(uval, borrow=True)
assert u.get_value(borrow=True) is uval
......@@ -149,10 +153,8 @@ class Test_SharedVariable(unittest.TestCase):
assert b.type == theano.tensor.dscalar
self.assertRaises(TypeError, f, b, 8)
c = shared(numpy.zeros((5,5), dtype='float32'))
self.assertRaises(TypeError, f, b, numpy.random.rand(5,5))
b = shared(numpy.zeros((5, 5), dtype='float32'))
self.assertRaises(TypeError, f, b, numpy.random.rand(5, 5))
def test_tensor_strict(self):
def f(var, val):
......@@ -192,19 +194,16 @@ class Test_SharedVariable(unittest.TestCase):
# assert b.type == theano.tensor.dvector
# self.assertRaises(TypeError, f, b, 8)
c = shared(numpy.zeros((5,5), dtype='float32'))
self.assertRaises(TypeError, f, b, numpy.random.rand(5,5))
b = shared(numpy.zeros((5, 5), dtype='float32'))
self.assertRaises(TypeError, f, b, numpy.random.rand(5, 5))
def test_scalar_floatX(self):
#
# the test should assure that floatX is not used in the shared constructor for scalars
# Shared values can change, and since we don't know the range they might take, we
# should keep the same bit width / precision as the original value used to create the
# the test should assure that floatX is not used in the shared
# constructor for scalars Shared values can change, and since we don't
# know the range they might take, we should keep the same
# bit width / precision as the original value used to create the
# shared variable.
#
# Since downcasting of a value now raises an Exception,
......@@ -213,48 +212,46 @@ class Test_SharedVariable(unittest.TestCase):
b = shared(numpy.int64(7), allow_downcast=True)
assert b.type == theano.tensor.lscalar
f(b,8.23)
assert b.get_value()==8
f(b, 8.23)
assert b.get_value() == 8
b = shared(numpy.int32(7), allow_downcast=True)
assert b.type == theano.tensor.iscalar
f(b,8.23)
assert b.get_value()==8
f(b, 8.23)
assert b.get_value() == 8
b = shared(numpy.int16(7), allow_downcast=True)
assert b.type == theano.tensor.wscalar
f(b,8.23)
assert b.get_value()==8
f(b, 8.23)
assert b.get_value() == 8
b = shared(numpy.int8(7), allow_downcast=True)
assert b.type == theano.tensor.bscalar
f(b,8.23)
assert b.get_value()==8
f(b, 8.23)
assert b.get_value() == 8
b = shared(numpy.float64(7.234), allow_downcast=True)
assert b.type == theano.tensor.dscalar
f(b,8)
assert b.get_value()==8
f(b, 8)
assert b.get_value() == 8
b = shared(numpy.float32(7.234), allow_downcast=True)
assert b.type == theano.tensor.fscalar
f(b,8)
assert b.get_value()==8
f(b, 8)
assert b.get_value() == 8
b = shared(numpy.float(7.234), allow_downcast=True)
assert b.type == theano.tensor.dscalar
f(b,8)
assert b.get_value()==8
f(b, 8)
assert b.get_value() == 8
b = shared(7.234, allow_downcast=True)
assert b.type == theano.tensor.dscalar
f(b,8)
assert b.get_value()==8
c = shared(numpy.zeros((5,5), dtype='float32'), allow_downcast=True)
self.assertRaises(TypeError, f, b, numpy.random.rand(5,5))
f(b, 8)
assert b.get_value() == 8
b = shared(numpy.zeros((5, 5), dtype='float32'), allow_downcast=True)
self.assertRaises(TypeError, f, b, numpy.random.rand(5, 5))
def test_tensor_floatX(self):
def f(var, val):
......@@ -262,32 +259,32 @@ class Test_SharedVariable(unittest.TestCase):
b = shared(numpy.int64([7]), allow_downcast=True)
assert b.type == theano.tensor.lvector
f(b,[8.23])
f(b, [8.23])
assert b.get_value() == 8
b = shared(numpy.int32([7]), allow_downcast=True)
assert b.type == theano.tensor.ivector
f(b,[8.23])
f(b, [8.23])
assert b.get_value() == 8
b = shared(numpy.int16([7]), allow_downcast=True)
assert b.type == theano.tensor.wvector
f(b,[8.23])
f(b, [8.23])
assert b.get_value() == 8
b = shared(numpy.int8([7]), allow_downcast=True)
assert b.type == theano.tensor.bvector
f(b,[8.23])
f(b, [8.23])
assert b.get_value() == 8
b = shared(numpy.float64([7.234]), allow_downcast=True)
assert b.type == theano.tensor.dvector
f(b,[8])
f(b, [8])
assert b.get_value() == 8
b = shared(numpy.float32([7.234]), allow_downcast=True)
assert b.type == theano.tensor.fvector
f(b,[8])
f(b, [8])
assert b.get_value() == 8
#numpy.float([7.234]) don't work
......@@ -300,10 +297,12 @@ class Test_SharedVariable(unittest.TestCase):
# assert b.type == theano.tensor.dvector
# f(b,[8])
b = shared(numpy.asarray([7.234],dtype=theano.config.floatX), allow_downcast=True)
b = shared(numpy.asarray([7.234], dtype=theano.config.floatX),
allow_downcast=True)
assert b.dtype == theano.config.floatX
f(b,[8])
f(b, [8])
assert b.get_value() == 8
c = shared(numpy.zeros((5,5), dtype='float32'), allow_downcast=True)
self.assertRaises(TypeError, f, b, numpy.random.rand(5,5))
b = shared(numpy.zeros((5, 5), dtype='float32'),
allow_downcast=True)
self.assertRaises(TypeError, f, b, numpy.random.rand(5, 5))
......@@ -5,7 +5,6 @@ import cPickle
import logging
import operator
import os
import platform
import shutil
import stat
import StringIO
......@@ -17,18 +16,21 @@ import time
import distutils.sysconfig
import numpy.distutils #TODO: TensorType should handle this
import theano
import numpy.distutils # TODO: TensorType should handle this
from theano.configparser import config
from theano.gof.cc import hash_from_code, hash_from_file
import compilelock # we will abuse the lockfile mechanism when reading and writing the registry
from theano.gof.cc import hash_from_code
from theano.configparser import TheanoConfigParser, AddConfigVar, EnumStr, StrParam, IntParam, FloatParam, BoolParam
# we will abuse the lockfile mechanism when reading and writing the registry
import compilelock
from theano.configparser import AddConfigVar, BoolParam
AddConfigVar('cmodule.mac_framework_link',
"If set to true, breaks certain mac installations with the infamous Bus Error",
("If set to true, breaks certain mac installations with the infamous "
"Bus Error"),
BoolParam(False))
def local_bitwidth():
"""
Return 32 for 32bit arch, 64 for 64bit arch
......@@ -42,6 +44,7 @@ def local_bitwidth():
# 'P' denotes a void*, and the size is expressed in bytes.
return struct.calcsize('P') * 8
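# (Editor's note, not part of this commit.) For example, on a 64-bit
# platform struct.calcsize('P') == 8, so this returns 64; on a 32-bit
# platform it returns 32.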
def python_int_bitwidth():
"""
Return the bit width of Python int (C long int).
......@@ -51,11 +54,12 @@ def python_int_bitwidth():
# 'l' denotes a C long int, and the size is expressed in bytes.
return struct.calcsize('l') * 8
_logger=logging.getLogger("theano.gof.cmodule")
_logger = logging.getLogger("theano.gof.cmodule")
_logger.setLevel(logging.WARNING)
METH_VARARGS="METH_VARARGS"
METH_NOARGS="METH_NOARGS"
METH_VARARGS = "METH_VARARGS"
METH_NOARGS = "METH_NOARGS"
def debug_counter(name, every=1):
"""Debug counter to know how often we go through some piece of code.
......@@ -68,6 +72,7 @@ def debug_counter(name, every=1):
if n % every == 0:
print >>sys.stderr, "debug_counter [%s]: %s" % (name, n)
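# --- Hedged usage sketch (editor's addition, not part of this commit) ---
# Typical use is to drop a call into a hot code path, e.g.
#
#     debug_counter('Op.perform calls', every=100)
#
# which prints a running count to stderr on every 100th call. The counter
# name here is purely illustrative.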
class ExtFunction(object):
"""A C function to put into a DynamicModule """
......@@ -75,14 +80,18 @@ class ExtFunction(object):
"""string - function's name"""
code_block = ""
"""string - the entire code for the function. Has the form ``static PyObject*
<name>([...]){ ... }
"""string - the entire code for the function.
Has the form ``static PyObject* <name>([...]){ ... }
See Python's C API Reference for how to write c functions for python modules.
See Python's C API Reference for how to write c functions for python
modules.
"""
method = ""
"""str - calling method for this function (i.e. 'METH_VARARGS', 'METH_NOARGS')"""
"""
str - calling method for this function (i.e. 'METH_VARARGS', 'METH_NOARGS')
"""
doc = ""
"""str - documentation string for this function"""
......@@ -94,8 +103,14 @@ class ExtFunction(object):
self.doc = doc
def method_decl(self):
"""Returns the signature for this function that goes into the DynamicModule's method table"""
return '\t{"%s", %s, %s, "%s"}' %(self.name, self.name, self.method, self.doc)
"""
Returns the signature for this function.
It goes into the DynamicModule's method table.
"""
return '\t{"%s", %s, %s, "%s"}' % (
self.name, self.name, self.method, self.doc)
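# --- Hedged illustration (editor's addition, not part of this commit) ---
# For a hypothetical ExtFunction named 'times2' with method 'METH_VARARGS'
# and doc 'double the input', method_decl() returns the method-table entry
#
#     \t{"times2", times2, METH_VARARGS, "double the input"}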
class DynamicModule(object):
def __init__(self, name):
......@@ -103,8 +118,12 @@ class DynamicModule(object):
self.support_code = []
self.functions = []
self.includes = ["<Python.h>", "<iostream>"]
self.includes.append('<numpy/arrayobject.h>') #TODO: this should come from TensorType
self.init_blocks = ['import_array();'] #TODO: from TensorType
#TODO: this should come from TensorType
self.includes.append('<numpy/arrayobject.h>')
#TODO: from TensorType
self.init_blocks = ['import_array();']
def print_methoddef(self, stream):
print >> stream, "static PyMethodDef MyMethods[] = {"
......@@ -117,22 +136,23 @@ class DynamicModule(object):
print >> stream, "PyMODINIT_FUNC init%s(void){" % self.name
for b in self.init_blocks:
print >> stream, ' ', b
print >> stream, ' ', '(void) Py_InitModule("%s", MyMethods);' % self.name
print >> stream, ' ', ('(void) Py_InitModule("%s", MyMethods);'
% self.name)
print >> stream, "}"
def add_include(self, str):
self.includes.append(str)
def add_init_code(self, code):
self.init_blocks.append(code)
def add_support_code(self, code):
if code not in self.support_code: #TODO: KLUDGE
if code not in self.support_code: # TODO: KLUDGE
self.support_code.append(code)
def add_function(self, fn):
self.functions.append(fn)
def code(self):
sio = StringIO.StringIO()
for inc in self.includes:
......@@ -141,23 +161,23 @@ class DynamicModule(object):
if inc[0] == '<' or inc[0] == '"':
print >> sio, "#include", inc
else:
print >> sio, '#include "%s"'%inc
print >> sio, '#include "%s"' % inc
print >> sio, "//////////////////////"
print >> sio, "//// Support Code"
print >> sio, "//////////////////////"
print >> sio, "//////////////////////"
print >> sio, "//// Support Code"
print >> sio, "//////////////////////"
for sc in self.support_code:
print >> sio, sc
print >> sio, "//////////////////////"
print >> sio, "//// Functions"
print >> sio, "//////////////////////"
print >> sio, "//////////////////////"
print >> sio, "//// Functions"
print >> sio, "//////////////////////"
for f in self.functions:
print >> sio, f.code_block
print >> sio, "//////////////////////"
print >> sio, "//// Module init"
print >> sio, "//////////////////////"
print >> sio, "//////////////////////"
print >> sio, "//// Module init"
print >> sio, "//////////////////////"
self.print_methoddef(sio)
self.print_init(sio)
......@@ -166,17 +186,19 @@ class DynamicModule(object):
def list_code(self, ofile=sys.stdout):
"""Print out the code with line numbers to `ofile` """
for i, line in enumerate(self.code().split('\n')):
print >> ofile, '%4i'%(i+1), line
print >> ofile, ('%4i' % (i + 1)), line
ofile.flush()
#TODO: add_type
def dlimport(fullpath, suffix=None):
"""Dynamically load a .so, .pyd, .dll, or .py file
:type fullpath: string
:param fullpath: a fully-qualified path do a compiled python module
:param suffix: a suffix to strip from the end of fullpath to get the import name
:param suffix: a suffix to strip from the end of fullpath to get the
import name
:type suffix: string
:returns: the dynamically loaded module (from __import__)
......@@ -200,12 +222,12 @@ def dlimport(fullpath, suffix=None):
module_name = '.'.join(fullpath.split(os.path.sep)[-2:])[:-len(suffix)]
else:
raise ValueError('path has wrong suffix', (fullpath, suffix))
workdir = fullpath[:-len(module_name)- 1 - len(suffix)]
workdir = fullpath[:-len(module_name) - 1 - len(suffix)]
_logger.debug("WORKDIR %s", workdir)
_logger.debug("module_name %s", module_name)
sys.path[0:0] = [workdir] #insert workdir at beginning (temporarily)
sys.path[0:0] = [workdir] # insert workdir at beginning (temporarily)
try:
rval = __import__(module_name, {}, {}, [module_name])
if not rval:
......@@ -216,20 +238,32 @@ def dlimport(fullpath, suffix=None):
assert fullpath.startswith(rval.__file__)
return rval
def dlimport_workdir(basedir):
"""Return a directory where you should put your .so file for dlimport to be able to load
it, given a basedir which should normally be config.compiledir"""
"""
Return a directory where you should put your .so file for dlimport
to be able to load it, given a basedir which should normally be
config.compiledir
"""
return tempfile.mkdtemp(dir=basedir)
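# --- Hedged usage sketch (editor's addition, not part of this commit) ---
# The intended pattern is roughly:
#
#     workdir = dlimport_workdir(config.compiledir)        # fresh temp dir
#     # ... compile the module into workdir as 'mod.<ext>' ...
#     module = dlimport(os.path.join(workdir,
#                                    'mod.' + get_lib_extension()))
#
# The compilation step in the middle is elided; only the directory handling
# and loading are illustrated here.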
def last_access_time(path):
"""Return the number of seconds since the epoch of the last access of a given file"""
"""
Return the number of seconds since the epoch of the last access of a
given file.
"""
return os.stat(path)[stat.ST_ATIME]
def module_name_from_dir(dirname):
"""Scan the contents of a cache directory and return full path of the dynamic lib in it.
"""
Scan the contents of a cache directory and return full path of the
dynamic lib in it.
"""
files = os.listdir(dirname)
name, = [file for file in files if file.endswith('.so') or file.endswith('.pyd')]
name, = [file for file in files
if file.endswith('.so') or file.endswith('.pyd')]
return os.path.join(dirname, name)
......@@ -322,7 +356,8 @@ def get_safe_part(key):
# Find the md5 hash part.
c_link_key = key[1]
for key_element in c_link_key[1:]:
if isinstance(key_element, basestring) and key_element.startswith('md5:'):
if (isinstance(key_element, basestring)
and key_element.startswith('md5:')):
md5 = key_element[4:]
break
......@@ -375,7 +410,8 @@ class KeyData(object):
cPickle.dump(self, open(self.key_pkl, 'wb'),
protocol=cPickle.HIGHEST_PROTOCOL)
except cPickle.PicklingError:
_logger.warning("Cache leak due to unpickle-able key data %s", self.keys)
_logger.warning("Cache leak due to unpickle-able key data %s",
self.keys)
os.remove(self.key_pkl)
raise
......@@ -411,9 +447,9 @@ class KeyData(object):
class ModuleCache(object):
"""Interface to the cache of dynamically compiled modules on disk
Note that this interface does not assume exclusive use of the cache directory.
It is built to handle the case where multiple programs are also using instances of this
class to manage the same directory.
Note that this interface does not assume exclusive use of the cache
directory. It is built to handle the case where multiple programs are also
using instances of this class to manage the same directory.
The cache works on the basis of keys. Each key is mapped to only one
dynamic module, but multiple keys may be mapped to the same module (see
......@@ -475,7 +511,9 @@ class ModuleCache(object):
"""Maps a module hash to its corresponding KeyData object."""
stats = []
"""A list with counters for the number of hits, loads, compiles issued by module_from_key()
"""
A list with counters for the number of hits, loads, compiles issued by
module_from_key()
"""
loaded_key_pkl = set()
......@@ -504,7 +542,7 @@ class ModuleCache(object):
if do_refresh:
self.refresh()
age_thresh_use = 60*60*24*24 # 24 days
age_thresh_use = 60 * 60 * 24 * 24 # 24 days
"""
The default age threshold (in seconds) for cache files we want to use.
......@@ -552,10 +590,11 @@ class ModuleCache(object):
elif 'key.pkl' in files:
try:
entry = module_name_from_dir(root)
except ValueError: # there is a key but no dll!
except ValueError: # there is a key but no dll!
if not root.startswith("/tmp"):
# Under /tmp, file are removed periodically by the os.
# So it is normal that this happens from time to time.
# Under /tmp, file are removed periodically by the
# os. So it is normal that this happens from time
# to time.
_logger.warning("ModuleCache.refresh() Found key "
"without dll in cache, deleting it. %s",
key_pkl)
......@@ -564,9 +603,11 @@ class ModuleCache(object):
continue
if (time_now - last_access_time(entry)) < age_thresh_use:
_logger.debug('refresh adding %s', key_pkl)
def unpickle_failure():
_logger.info("ModuleCache.refresh() Failed to "
"unpickle cache file %s", key_pkl)
try:
key_data = cPickle.load(open(key_pkl, 'rb'))
except EOFError:
......@@ -632,12 +673,14 @@ class ModuleCache(object):
# TODO: check if this can happen at all
to_del = [key for key in key_data.keys if not key[0]]
if to_del:
_logger.warning("ModuleCache.refresh() Found unversioned "
_logger.warning(
"ModuleCache.refresh() Found unversioned "
"key in cache, removing it. %s", key_pkl)
# Since the version is in the module hash, all
# keys should be unversioned.
if len(to_del) != len(key_data.keys):
_logger.warning('Found a mix of unversioned and '
_logger.warning(
'Found a mix of unversioned and '
'versioned keys for the same '
'module %s', key_pkl)
_rmtree(root, ignore_nocleanup=True,
......@@ -726,14 +769,15 @@ class ModuleCache(object):
key_data.delete_keys_from(self.entry_from_key)
del self.module_hash_to_key_data[module_hash]
if key[0]:
# this is a versioned entry, so should have been on disk
# Something weird happened to cause this, so we are responding by
# printing a warning, removing evidence that we ever saw this mystery
# key.
# this is a versioned entry, so should have been on
# disk. Something weird happened to cause this, so we
# are responding by printing a warning, removing
# evidence that we ever saw this mystery key.
pkl_file_to_remove = key_data.key_pkl
if not root.startswith("/tmp"):
# Under /tmp, file are removed periodically by the os.
# So it is normal that this happen from time to time.
# Under /tmp, file are removed periodically by the
# os. So it is normal that this happen from time to
# time.
_logger.warning("Removing key file %s because the "
"corresponding module is gone from the "
"file system.",
......@@ -813,8 +857,8 @@ class ModuleCache(object):
try:
compile_steps = fn(location=location).__iter__()
# Check if we already know a module with the same hash. If we
# do, then there is no need to even compile it.
# Check if we already know a module with the same hash.
# If we do, then there is no need to even compile it.
duplicated_module = False
# The first compilation step is to yield the source code.
src_code = compile_steps.next()
......@@ -828,11 +872,12 @@ class ModuleCache(object):
# Note that we do not pass the `fn` argument, since it
# should not be used considering that the module should
# already be compiled.
module = self.module_from_key(key=None, key_data=key_data)
module = self.module_from_key(key=None,
key_data=key_data)
name = module.__file__
# Add current key to the set of keys associated to the same
# module. We only save the KeyData object of versioned
# modules.
# Add current key to the set of keys associated to the
# same module. We only save the KeyData object of
# versioned modules.
try:
key_data.add_key(key, save_pkl=bool(_version))
key_broken = False
......@@ -840,8 +885,8 @@ class ModuleCache(object):
# This should only happen if we tried to save the
# pickled file.
assert _version
# The key we are trying to add is broken: we will not
# add it after all.
# The key we are trying to add is broken: we will
# not add it after all.
key_data.remove_key(key)
key_broken = True
......@@ -868,12 +913,13 @@ class ModuleCache(object):
# Obtain path to the '.so' module file.
name = module.__file__
_logger.debug("Adding module to cache %s %s", key, name)
_logger.debug("Adding module to cache %s %s",
key, name)
assert name.startswith(location)
assert name not in self.module_from_name
# Changing the hash of the key is not allowed during
# compilation. That is the only cause found that makes the
# following assert fail.
# compilation. That is the only cause found that makes
# the following assert fail.
assert hash(key) == hash_key
assert key not in self.entry_from_key
......@@ -896,10 +942,11 @@ class ModuleCache(object):
key_broken = False
except cPickle.PicklingError:
key_broken = True
# Remove key from the KeyData object, to make sure
# we never try to save it again.
# We still keep the KeyData object and save it so
# that the module can be re-used in the future.
# Remove key from the KeyData object, to make
# sure we never try to save it again.
# We still keep the KeyData object and save it
# so that the module can be re-used in the
# future.
key_data.keys = set()
key_data.save_pkl()
......@@ -910,20 +957,21 @@ class ModuleCache(object):
# versioned module.
self.loaded_key_pkl.add(key_pkl)
# Map the new module to its KeyData object. Note that we
# need to do it regardless of whether the key is versioned
# or not if we want to be able to re-use this module inside
# the same process.
# Map the new module to its KeyData object. Note that
# we need to do it regardless of whether the key is
# versioned or not if we want to be able to re-use this
# module inside the same process.
self.module_hash_to_key_data[module_hash] = key_data
except Exception:
# This may happen e.g. when an Op has no C implementation. In
# any case, we do not want to keep around the temporary work
# directory, as it may cause trouble if we create too many of
# these. The 'ignore_if_missing' flag is set just in case this
# directory would have already been deleted.
# This may happen e.g. when an Op has no C implementation.
# In any case, we do not want to keep around the temporary
# work directory, as it may cause trouble if we create too
# many of these. The 'ignore_if_missing' flag is set just
# in case this directory would have already been deleted.
_rmtree(location, ignore_if_missing=True,
msg='exception -- typically means no C implementation')
msg=('exception -- '
'typically means no C implementation'))
raise
finally:
......@@ -982,8 +1030,9 @@ class ModuleCache(object):
if key_data.keys:
# This is to make debugging in pdb easier, by providing
# the offending keys in the local context.
key_data_keys = list(key_data.keys)
# key_data_keys = list(key_data.keys)
## import pdb; pdb.set_trace()
pass
elif found > 1:
msg = 'Multiple equal keys found in unpickled KeyData file'
if msg:
......@@ -1005,8 +1054,8 @@ class ModuleCache(object):
self.time_spent_in_check_key += time.time() - start_time
age_thresh_del = 60*60*24*31 # 31 days
age_thresh_del_unversioned = 60*60*24*7 # 7 days
age_thresh_del = 60 * 60 * 24 * 31 # 31 days
age_thresh_del_unversioned = 60 * 60 * 24 * 7 # 7 days
"""The default age threshold for `clear_old` (in seconds)
"""
......@@ -1090,7 +1139,8 @@ class ModuleCache(object):
def clear_base_files(self):
"""
Remove base directories 'cuda_ndarray', 'cutils_ext', 'lazylinker_ext' and 'scan_perform' if present.
Remove base directories 'cuda_ndarray', 'cutils_ext', 'lazylinker_ext'
and 'scan_perform' if present.
Note that we do not delete them outright because it may not work on
some systems due to these modules being currently in use. Instead we
......@@ -1099,7 +1149,8 @@ class ModuleCache(object):
"""
compilelock.get_lock()
try:
for base_dir in ('cuda_ndarray', 'cutils_ext', 'lazylinker_ext', 'scan_perform'):
for base_dir in ('cuda_ndarray', 'cutils_ext', 'lazylinker_ext',
'scan_perform'):
to_delete = os.path.join(self.dirname, base_dir + '.delete.me')
if os.path.isdir(to_delete):
try:
......@@ -1174,18 +1225,20 @@ class ModuleCache(object):
for filename in os.listdir(self.dirname):
if filename.startswith('tmp'):
try:
open(os.path.join(self.dirname, filename, 'key.pkl')).close()
open(os.path.join(self.dirname, filename, 'key.pkl')
).close()
has_key = True
except IOError:
has_key = False
if not has_key:
age = time_now - last_access_time(os.path.join(self.dirname, filename))
# In the normal case, the process that created this directory
# will delete it. However, if this process crashes, it
# will not be cleaned up.
# As we don't know if this directory is still used, we wait
# one week and suppose that the process crashed, and we
# take care of the clean-up.
age = time_now - last_access_time(
os.path.join(self.dirname, filename))
# In the normal case, the process that created this
# directory will delete it. However, if this process
# crashes, it will not be cleaned up.
# As we don't know if this directory is still used,
# we wait one week and suppose that the process
# crashed, and we take care of the clean-up.
if age > min_age:
_rmtree(os.path.join(self.dirname, filename),
msg='old unversioned', level=logging.INFO,
......@@ -1204,6 +1257,7 @@ class ModuleCache(object):
_logger.debug('Time spent checking keys: %s',
self.time_spent_in_check_key)
def _rmtree(parent, ignore_nocleanup=False, msg='', level=logging.DEBUG,
ignore_if_missing=False):
# On NFS filesystems, it is impossible to delete a directory with open
......@@ -1226,12 +1280,14 @@ def _rmtree(parent, ignore_nocleanup=False, msg='', level=logging.DEBUG,
if os.path.exists(parent):
try:
_logger.info('placing "delete.me" in %s', parent)
open(os.path.join(parent,'delete.me'), 'w').close()
open(os.path.join(parent, 'delete.me'), 'w').close()
except Exception, ee:
_logger.warning("Failed to remove or mark cache directory %s "
"for removal %s", parent, ee)
_module_cache = None
def get_module_cache(dirname, init_args=None):
"""
:param init_args: If not None, the (k, v) pairs in this dictionary will
......@@ -1252,6 +1308,7 @@ def get_module_cache(dirname, init_args=None):
_module_cache.dirname, dirname)
return _module_cache
def get_lib_extension():
"""Return the platform-dependent extension for compiled modules."""
if sys.platform == 'win32':
......@@ -1259,6 +1316,7 @@ def get_lib_extension():
else:
return 'so'
def get_gcc_shared_library_arg():
"""Return the platform-dependent GCC argument for shared libraries."""
if sys.platform == 'darwin':
......@@ -1266,29 +1324,33 @@ def get_gcc_shared_library_arg():
else:
return '-shared'
def std_include_dirs():
return numpy.distutils.misc_util.get_numpy_include_dirs() + [distutils.sysconfig.get_python_inc()]
return (numpy.distutils.misc_util.get_numpy_include_dirs()
+ [distutils.sysconfig.get_python_inc()])
def std_lib_dirs_and_libs():
python_inc = distutils.sysconfig.get_python_inc()
if sys.platform == 'win32':
# Obtain the library name from the Python version instead of the
# installation directory, in case the user defined a custom installation
# directory.
# installation directory, in case the user defined a custom
# installation directory.
python_version = distutils.sysconfig.get_python_version()
libname = 'python' + python_version.replace('.', '')
# Also add directory containing the Python library to the library
# directories.
python_lib_dir = os.path.join(os.path.dirname(python_inc), 'libs')
lib_dirs = [python_lib_dir]
return [libname], [python_lib_dir]
#DSE Patch 2 for supporting OSX frameworks. Suppress -lpython2.x when frameworks are present
elif sys.platform=='darwin' :
if python_inc.count('Python.framework') :
return [],[]
else :
libname=os.path.basename(python_inc)
return [libname],[]
# DSE Patch 2 for supporting OSX frameworks.
# Suppress -lpython2.x when frameworks are present
elif sys.platform == 'darwin':
if python_inc.count('Python.framework'):
return [], []
else:
libname = os.path.basename(python_inc)
return [libname], []
else:
# Typical include directory: /usr/include/python2.6
libname = os.path.basename(python_inc)
......@@ -1399,14 +1461,10 @@ class GCC_compiler(object):
if python_lib not in lib_dirs:
lib_dirs.append(python_lib)
workdir = location
cppfilename = os.path.join(location, 'mod.cpp')
cppfile = file(cppfilename, 'w')
_logger.debug('Writing module C++ code to %s', cppfilename)
ofiles = []
rval = None
cppfile.write(src_code)
# Avoid gcc warning "no newline at end of file".
......@@ -1433,8 +1491,9 @@ class GCC_compiler(object):
def print_command_line_error():
# Print command line when a problem occurred.
print >> sys.stderr, ("Problem occurred during compilation with the "
"command line below:")
print >> sys.stderr, (
"Problem occurred during compilation with the "
"command line below:")
print >> sys.stderr, ' '.join(cmd)
try:
......@@ -1457,8 +1516,8 @@ class GCC_compiler(object):
# Print errors just below the command line.
print compile_stderr
# We replace '\n' by '. ' in the error message because when Python
# prints the exception, having '\n' in the text makes it more difficult
# to read.
# prints the exception, having '\n' in the text makes it more
# difficult to read.
raise Exception('Compilation failed (return status=%s): %s' %
(status, compile_stderr.replace('\n', '. ')))
......
"""
Helper functions to make gof backwards compatible (tested on python 2.4 and 2.5)
Helper functions to make gof backwards compatible
(tested on python 2.4 and 2.5)
"""
import collections
import sys
if sys.version_info[:2] < (2,5):
if sys.version_info[:2] < (2, 5):
def all(iterable):
for element in iterable:
......@@ -55,16 +57,19 @@ if sys.version_info[:2] < (2,5):
raise TypeError('first argument must be callable')
dict.__init__(self, *a, **kw)
self.default_factory = default_factory
def __getitem__(self, key):
try:
return dict.__getitem__(self, key)
except KeyError:
return self.__missing__(key)
def __missing__(self, key):
if self.default_factory is None:
raise KeyError(key)
self[key] = value = self.default_factory()
return value
def __reduce__(self):
if self.default_factory is None:
args = tuple()
......@@ -72,14 +77,18 @@ if sys.version_info[:2] < (2,5):
args = self.default_factory,
# consider replacing items() with iteritems()
return type(self), args, None, None, self.items()
def copy(self):
return self.__copy__()
def __copy__(self):
return type(self)(self.default_factory, self)
def __deepcopy__(self, memo):
import copy
return type(self)(self.default_factory,
copy.deepcopy(self.items()))
def __repr__(self):
return 'defaultdict(%s, %s)' % (self.default_factory,
dict.__repr__(self))
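# --- Hedged usage sketch (editor's addition, not part of this commit) ---
# The backport behaves like collections.defaultdict on newer Pythons:
#
#     d = defaultdict(list)
#     d['missing'].append(1)    # __missing__ creates the list on first access
#     assert d['missing'] == [1]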
......@@ -90,14 +99,15 @@ else:
import __builtin__
all = __builtin__.all
any = __builtin__.any
import functools, collections
import collections
import functools
partial = functools.partial
defaultdict = collections.defaultdict
deque = collections.deque
__all__ = ['all', 'any']
if sys.version_info[:2] < (2,6):
if sys.version_info[:2] < (2, 6):
# Borrowed from Python docs
def combinations(iterable, r):
# combinations('ABCD', 2) --> AB AC AD BC BD CD
......@@ -115,18 +125,17 @@ if sys.version_info[:2] < (2,6):
else:
return
indices[i] += 1
for j in range(i+1, r):
indices[j] = indices[j-1] + 1
for j in range(i + 1, r):
indices[j] = indices[j - 1] + 1
yield tuple(pool[i] for i in indices)
def product(*args, **kwds):
# product('ABCD', 'xy') --> Ax Ay Bx By Cx Cy Dx Dy
# product(range(2), repeat=3) --> 000 001 010 011 100 101 110 111
pools = map(tuple, args) * kwds.get('repeat', 1)
result = [[]]
for pool in pools:
result = [x+[y] for x in result for y in pool]
result = [x + [y] for x in result for y in pool]
for prod in result:
yield tuple(prod)
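# --- Hedged usage sketch (editor's addition, not part of this commit) ---
# These backports reproduce the itertools behaviour noted in the comments:
#
#     list(combinations('ABCD', 2))
#     # -> [('A', 'B'), ('A', 'C'), ('A', 'D'),
#     #     ('B', 'C'), ('B', 'D'), ('C', 'D')]
#     list(product(range(2), repeat=3))
#     # -> [(0, 0, 0), (0, 0, 1), (0, 1, 0), (0, 1, 1),
#     #     (1, 0, 0), (1, 0, 1), (1, 1, 0), (1, 1, 1)]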
......
import itertools
from unittest import TestCase
from theano.compile.pfunc import pfunc
......@@ -15,7 +14,8 @@ if cuda_ndarray.cuda_available == False:
import theano.sandbox.cuda as tcn
from theano.tensor.signal.downsample import DownsampleFactorMax, DownsampleFactorMaxGrad
from theano.tensor.signal.downsample import (DownsampleFactorMax,
DownsampleFactorMaxGrad)
import theano.compile.mode
from theano.tensor.tests.test_blas import BaseGemv, TestBlasStrides, TestGer
......@@ -23,20 +23,24 @@ from theano.sandbox.cuda.blas import gpu_gemv_no_inplace, gpu_gemv_inplace
from theano.sandbox.cuda.blas import gpu_ger_inplace, gpu_ger_no_inplace
if theano.config.mode=='FAST_COMPILE':
if theano.config.mode == 'FAST_COMPILE':
mode_with_gpu = theano.compile.mode.get_mode('FAST_RUN').including('gpu')
mode_without_gpu = theano.compile.mode.get_mode('FAST_RUN').excluding('gpu')
mode_without_gpu = theano.compile.mode.get_mode(
'FAST_RUN').excluding('gpu')
else:
mode_with_gpu = theano.compile.mode.get_default_mode().including('gpu')
mode_without_gpu = theano.compile.mode.get_default_mode().excluding('gpu')
def my_rand(*shape):
return theano._asarray(numpy.random.rand(*shape),dtype='float32')
return theano._asarray(numpy.random.rand(*shape), dtype='float32')
def transpose(cuda_mat):
# The easiest way to transpose a cuda matrix for now
return tcn.dimshuffle(cuda_mat, [1, 0])
def test_dot22():
def cmp(a_shp, b_shp):
a0 = my_rand(*a_shp)
......@@ -44,7 +48,7 @@ def test_dot22():
b = tensor.fmatrix()
f = pfunc([b], [], updates=[(a, tensor.dot(a,b))], mode=mode_with_gpu)
f = pfunc([b], [], updates=[(a, tensor.dot(a, b))], mode=mode_with_gpu)
bval = my_rand(*b_shp)
f(bval)
......@@ -54,16 +58,18 @@ def test_dot22():
# Try with a matrix equal to a0, but with strides in both dims
a.set_value(a0)
a.set_value(
a.get_value(borrow=True, return_internal_type=True)[::-1, ::-1],
a.get_value(borrow=True,
return_internal_type=True)[::-1, ::-1],
borrow=True)
f(bval)
cmp((3,4),(4,5))
cmp((0,4),(4,5))
cmp((3,4),(4,0))
cmp((3,0),(0,5))
cmp((0,4),(4,0))
cmp((0,0),(0,0))
cmp((3, 4), (4, 5))
cmp((0, 4), (4, 5))
cmp((3, 4), (4, 0))
cmp((3, 0), (0, 5))
cmp((0, 4), (4, 0))
cmp((0, 0), (0, 0))
def test_dot22scalar():
def cmp(a_shp, b_shp):
......@@ -73,32 +79,39 @@ def test_dot22scalar():
av = my_rand(*a_shp)
bv = my_rand(*b_shp)
f = theano.function([a,b], tensor.dot(a,b)*numpy.asarray(4, 'float32'), mode=mode_with_gpu)
f2 = theano.function([a,b], tensor.dot(a,b)*numpy.asarray(4, 'float32'))
t=f.maker.env.toposort()
assert len(t)==4
assert isinstance(t[0].op,tcn.GpuFromHost)
assert isinstance(t[1].op,tcn.GpuFromHost)
assert isinstance(t[2].op,tcn.blas.GpuDot22Scalar)
assert isinstance(t[3].op,tcn.HostFromGpu)
assert numpy.allclose(f(av,bv),f2(av,bv))
f = theano.function([a,b,scalar], tensor.dot(a,b)*scalar, mode=mode_with_gpu)
f2 = theano.function([a,b,scalar], tensor.dot(a,b)*scalar)
t=f.maker.env.toposort()
assert len(t)==4
assert isinstance(t[0].op,tcn.GpuFromHost)
assert isinstance(t[1].op,tcn.GpuFromHost)
assert isinstance(t[2].op,tcn.blas.GpuDot22Scalar)
assert isinstance(t[3].op,tcn.HostFromGpu)
assert numpy.allclose(f(av,bv,0.5),f2(av,bv,0.5))
cmp((3,4),(4,5))
cmp((0,4),(4,5))
cmp((3,4),(4,0))
cmp((3,0),(0,5))
cmp((0,4),(4,0))
cmp((0,0),(0,0))
f = theano.function(
[a, b],
tensor.dot(a, b) * numpy.asarray(4, 'float32'),
mode=mode_with_gpu)
f2 = theano.function(
[a, b],
tensor.dot(a, b) * numpy.asarray(4, 'float32'))
t = f.maker.env.toposort()
assert len(t) == 4
assert isinstance(t[0].op, tcn.GpuFromHost)
assert isinstance(t[1].op, tcn.GpuFromHost)
assert isinstance(t[2].op, tcn.blas.GpuDot22Scalar)
assert isinstance(t[3].op, tcn.HostFromGpu)
assert numpy.allclose(f(av, bv), f2(av, bv))
f = theano.function([a, b, scalar], tensor.dot(a, b) * scalar,
mode=mode_with_gpu)
f2 = theano.function([a, b, scalar], tensor.dot(a, b) * scalar)
t = f.maker.env.toposort()
assert len(t) == 4
assert isinstance(t[0].op, tcn.GpuFromHost)
assert isinstance(t[1].op, tcn.GpuFromHost)
assert isinstance(t[2].op, tcn.blas.GpuDot22Scalar)
assert isinstance(t[3].op, tcn.HostFromGpu)
assert numpy.allclose(f(av, bv, 0.5), f2(av, bv, 0.5))
cmp((3, 4), (4, 5))
cmp((0, 4), (4, 5))
cmp((3, 4), (4, 0))
cmp((3, 0), (0, 5))
cmp((0, 4), (4, 0))
cmp((0, 0), (0, 0))
def test_gemm():
def cmp(a_shp, b_shp):
......@@ -108,28 +121,33 @@ def test_gemm():
b = tensor.fmatrix('b')
c = tensor.fmatrix('c')
f = pfunc([b,c], [], updates=[(a, tensor.dot(a,b) + tensor.exp(c))], mode=mode_with_gpu)
assert any([node.op == tcn.blas.gpu_gemm_inplace for node in f.maker.env.toposort()])
f = pfunc([b, c], [], updates=[(a, tensor.dot(a, b) + tensor.exp(c))],
mode=mode_with_gpu)
assert any([node.op == tcn.blas.gpu_gemm_inplace
for node in f.maker.env.toposort()])
bval = my_rand(*b_shp)
cval = my_rand(a_shp[0],b_shp[1])
f(bval,cval)
cval = my_rand(a_shp[0], b_shp[1])
f(bval, cval)
assert numpy.allclose(numpy.dot(a0, bval)+numpy.exp(cval), a.get_value())
assert numpy.allclose(numpy.dot(a0, bval) + numpy.exp(cval),
a.get_value())
# Try with a matrix equal to a0, but with strides in both dims
a.set_value(a0)
a.set_value(
a.get_value(borrow=True, return_internal_type=True)[::-1, ::-1],
a.get_value(borrow=True,
return_internal_type=True)[::-1, ::-1],
borrow=True)
f(bval, cval)
cmp((3,4),(4,5))
cmp((0,4),(4,5))
cmp((3,4),(4,0))
cmp((3,0),(0,5))
cmp((0,4),(4,0))
cmp((0,0),(0,0))
cmp((3, 4), (4, 5))
cmp((0, 4), (4, 5))
cmp((3, 4), (4, 0))
cmp((3, 0), (0, 5))
cmp((0, 4), (4, 0))
cmp((0, 0), (0, 0))
def test_gemm_no_inplace():
......@@ -142,29 +160,35 @@ def test_gemm_no_inplace():
b = tcn.fmatrix('b')
b2 = tcn.fmatrix('b2')
f = pfunc([b,b2], [tensor.dot(a,b2) + c], updates=[(a, tensor.dot(a,b) + c)], mode=mode_with_gpu)
f = pfunc(
[b, b2],
[tensor.dot(a, b2) + c],
updates=[(a, tensor.dot(a, b) + c)],
mode=mode_with_gpu)
assert any([node.op == tcn.blas.gpu_gemm_no_inplace for node in f.maker.env.toposort()])
assert any([node.op == tcn.blas.gpu_gemm_no_inplace
for node in f.maker.env.toposort()])
bval = my_rand(*b_shp)
bval2 = my_rand(*b_shp)
rval = f(bval,bval2)
rval = f(bval, bval2)
assert numpy.allclose(numpy.dot(a0, bval)+cval, a.get_value())
assert numpy.allclose(numpy.dot(a0, bval2)+cval, rval)
assert numpy.allclose(numpy.dot(a0, bval) + cval, a.get_value())
assert numpy.allclose(numpy.dot(a0, bval2) + cval, rval)
# Try with a matrix equal to a0, but with strides in both dims
a.set_value(a0)
a.set_value(
a.get_value(borrow=True, return_internal_type=True)[::-1, ::-1],
a.get_value(borrow=True,
return_internal_type=True)[::-1, ::-1],
borrow=True)
f(bval, bval2)
cmp((3,4),(4,5))
cmp((0,4),(4,5))
cmp((3,4),(4,0))
cmp((3,0),(0,5))
cmp((0,4),(4,0))
cmp((0,0),(0,0))
cmp((3, 4), (4, 5))
cmp((0, 4), (4, 5))
cmp((3, 4), (4, 0))
cmp((3, 0), (0, 5))
cmp((0, 4), (4, 0))
cmp((0, 0), (0, 0))
class TestBlasStridesGpu(TestBlasStrides):
......@@ -221,15 +245,15 @@ if 0:
print r, r.shape
assert (ret==r).all()
def test_downsample():
import random
shps = [ (1, 1, 1, 12),
shps = [(1, 1, 1, 12),
(1, 1, 2, 2),
(1, 1, 1, 1),
(1,1,4,4),
(1, 1, 4, 4),
(1, 1, 10, 11),
(1, 2, 2, 2),
(3,5,4,4),
(3, 5, 4, 4),
(25, 1, 7, 7),
(1, 1, 12, 12),
(1, 1, 2, 14),
......@@ -245,44 +269,61 @@ def test_downsample():
(30, 2, 24, 24),
(30, 6, 24, 24),
(10, 10, 10, 11),
(1,1,10,1025),
(1,1,10,1023),
(1,1,1025,10),
(1,1,1023,10),
(1, 1, 10, 1025),
(1, 1, 10, 1023),
(1, 1, 1025, 10),
(1, 1, 1023, 10),
]
numpy.random.RandomState(unittest_tools.fetch_seed()).shuffle(shps)
for shp in shps:
for ds in (2, 2), (3,2), (1,1):
if ds[0] > shp[2]: continue
if ds[1] > shp[3]: continue
for ds in (2, 2), (3, 2), (1, 1):
if ds[0] > shp[2]:
continue
if ds[1] > shp[3]:
continue
# GpuDownsampleFactorMax doesn't like having more than 512 columns
# in the output tensor.
if float(shp[3])/ds[1]>512: continue
if float(shp[3]) / ds[1] > 512:
continue
for ignore_border in (True, False):
print 'test_downsample', shp, ds, ignore_border
ds_op = DownsampleFactorMax(ds, ignore_border=ignore_border)
a = tcn.shared_constructor(my_rand(*shp), 'a')
f = pfunc([], ds_op(tensor.as_tensor_variable(a)), mode=mode_with_gpu)
f2 = pfunc([], ds_op(tensor.as_tensor_variable(a)), mode=mode_without_gpu)
assert any([isinstance(node.op, tcn.blas.GpuDownsampleFactorMax) for node in
f.maker.env.toposort()])
assert any([isinstance(node.op, DownsampleFactorMax) for node in
f2.maker.env.toposort()])
assert numpy.allclose(f(),f2())
g = pfunc([], tensor.grad(ds_op(tensor.as_tensor_variable(a)).sum(),a), mode=mode_with_gpu)
g2 = pfunc([], tensor.grad(ds_op(tensor.as_tensor_variable(a)).sum(),a), mode=mode_without_gpu)
assert any([isinstance(node.op, tcn.blas.GpuDownsampleFactorMaxGrad)
f = pfunc([], ds_op(tensor.as_tensor_variable(a)),
mode=mode_with_gpu)
f2 = pfunc([], ds_op(tensor.as_tensor_variable(a)),
mode=mode_without_gpu)
assert any([isinstance(node.op,
tcn.blas.GpuDownsampleFactorMax)
for node in f.maker.env.toposort()])
assert any([isinstance(node.op, DownsampleFactorMax)
for node in f2.maker.env.toposort()])
assert numpy.allclose(f(), f2())
g = pfunc(
[],
tensor.grad(ds_op(tensor.as_tensor_variable(a)).sum(),
a),
mode=mode_with_gpu)
g2 = pfunc(
[],
tensor.grad(ds_op(tensor.as_tensor_variable(a)).sum(),
a),
mode=mode_without_gpu)
assert any([isinstance(node.op,
tcn.blas.GpuDownsampleFactorMaxGrad)
for node in g.maker.env.toposort()])
assert any([isinstance(node.op, DownsampleFactorMaxGrad)
for node in g2.maker.env.toposort()])
assert numpy.allclose(g(),g2())
assert numpy.allclose(g(), g2())
#We already check that the gpu version returns the same value as the cpu version
#for GpuDownsampleFactorMaxGrad. So no need to call verify_grad here.
# We already check that the gpu version returns
# the same value as the cpu version for
# GpuDownsampleFactorMaxGrad. So no need to call
# verify_grad here.
class TestGpuGemv(TestCase, BaseGemv,
......@@ -295,6 +336,7 @@ class TestGpuGemv(TestCase, BaseGemv,
gemv = gpu_gemv_inplace
gemv_inplace = gpu_gemv_inplace
class TestGpuGemvNoTransfer(TestCase, BaseGemv,
unittest_tools.TestOptimizationMixin):
mode = mode_with_gpu
......@@ -320,63 +362,70 @@ class TestVectorMatrixDot(TestCase):
def test_dot_vm(self):
''' Test vector dot matrix '''
v = theano.shared( numpy.array(numpy.random.rand(2), dtype='float32'))
m = theano.shared( numpy.array(numpy.random.rand(2,5),
v = theano.shared(numpy.array(numpy.random.rand(2), dtype='float32'))
m = theano.shared(numpy.array(numpy.random.rand(2, 5),
dtype='float32'))
no_gpu_f = theano.function([], theano.dot(v,m), mode = mode_without_gpu)
gpu_f = theano.function([], theano.dot(v,m), mode = mode_with_gpu)
no_gpu_f = theano.function([], theano.dot(v, m), mode=mode_without_gpu)
gpu_f = theano.function([], theano.dot(v, m), mode=mode_with_gpu)
#gpu_f2 is needed to test the case when the input is not on the gpu
#but the output is moved to the gpu.
gpu_f2 = theano.function([], tcn.gpu_from_host(theano.dot(v,m)), mode = mode_with_gpu)
gpu_f2 = theano.function([], tcn.gpu_from_host(theano.dot(v, m)),
mode=mode_with_gpu)
# Assert they produce the same output
assert numpy.allclose(no_gpu_f(), gpu_f(), atol=self.atol)
assert numpy.allclose(no_gpu_f(), gpu_f2(), atol=self.atol)
# Assert that the gpu version actually uses gpu
assert sum([node.op is gpu_gemv_inplace for node in
gpu_f.maker.env.toposort() ]) == 1
gpu_f.maker.env.toposort()]) == 1
assert sum([node.op is gpu_gemv_inplace for node in
gpu_f2.maker.env.toposort() ]) == 1
gpu_f2.maker.env.toposort()]) == 1
# Check double-strided m
m.set_value(
m.get_value(borrow=True, return_internal_type=True)[::-1, ::-1],
m.get_value(borrow=True,
return_internal_type=True)[::-1, ::-1],
borrow=True)
assert numpy.allclose(no_gpu_f(), gpu_f(), atol=self.atol)
assert numpy.allclose(no_gpu_f(), gpu_f2(), atol=self.atol)
def test_dot_mv(self):
''' Test matrix dot vector '''
v = theano.shared( numpy.array(numpy.random.rand(2), dtype='float32'))
m = theano.shared( numpy.array(numpy.random.rand(5,2),
v = theano.shared(numpy.array(numpy.random.rand(2), dtype='float32'))
m = theano.shared(numpy.array(numpy.random.rand(5, 2),
dtype='float32'))
no_gpu_f = theano.function([], theano.dot(m,v), mode = mode_without_gpu)
gpu_f = theano.function([], theano.dot(m,v), mode = mode_with_gpu)
no_gpu_f = theano.function([], theano.dot(m, v), mode=mode_without_gpu)
gpu_f = theano.function([], theano.dot(m, v), mode=mode_with_gpu)
#gpu_f2 is needed to test the case when the input is not on the gpu
#but the output is moved to the gpu.
gpu_f2 = theano.function([], tcn.gpu_from_host(theano.dot(m,v)), mode = mode_with_gpu)
gpu_f2 = theano.function([], tcn.gpu_from_host(theano.dot(m, v)),
mode=mode_with_gpu)
# Assert they produce the same output
assert numpy.allclose(no_gpu_f(), gpu_f(), atol=self.atol)
assert numpy.allclose(no_gpu_f(), gpu_f2(), atol=self.atol)
# Assert that the gpu version actually uses gpu
assert sum([node.op is gpu_gemv_inplace for node in
gpu_f.maker.env.toposort() ]) == 1
gpu_f.maker.env.toposort()]) == 1
assert sum([node.op is gpu_gemv_inplace for node in
gpu_f2.maker.env.toposort() ]) == 1
gpu_f2.maker.env.toposort()]) == 1
def test_gemv1(self):
''' test vector1+dot(matrix,vector2) '''
v1 = theano.tensor._shared( numpy.array(numpy.random.rand(2) , dtype='float32'))
v2 = theano.tensor._shared( numpy.array(numpy.random.rand(5) , dtype='float32'))
m = theano.tensor._shared( numpy.array(numpy.random.rand(5,2), dtype='float32'))
no_gpu_f = theano.function([], v2+theano.dot(m,v1), mode = mode_without_gpu)
gpu_f = theano.function([], v2+theano.dot(m,v1), mode = mode_with_gpu)
v1 = theano.tensor._shared(numpy.array(numpy.random.rand(2),
dtype='float32'))
v2 = theano.tensor._shared(numpy.array(numpy.random.rand(5),
dtype='float32'))
m = theano.tensor._shared(numpy.array(numpy.random.rand(5, 2),
dtype='float32'))
no_gpu_f = theano.function([], v2 + theano.dot(m, v1),
mode=mode_without_gpu)
gpu_f = theano.function([], v2 + theano.dot(m, v1), mode=mode_with_gpu)
#gpu_f2 is needed to test the case when the input is not on the gpu
#but the output is moved to the gpu.
gpu_f2 = theano.function([], tcn.gpu_from_host(v2+theano.dot(m,v1)), mode = mode_with_gpu)
gpu_f2 = theano.function([], tcn.gpu_from_host(v2 + theano.dot(m, v1)),
mode=mode_with_gpu)
# Assert they produce the same output
assert numpy.allclose(no_gpu_f(), gpu_f(), atol=self.atol)
......@@ -389,15 +438,19 @@ class TestVectorMatrixDot(TestCase):
def test_gemv2(self):
''' test vector1+dot(vector2,matrix) '''
v1 = theano.shared( numpy.array(numpy.random.rand(5) , dtype='float32'))
v2 = theano.shared( numpy.array(numpy.random.rand(2) , dtype='float32'))
m = theano.shared( numpy.array(numpy.random.rand(5,2), dtype='float32'))
no_gpu_f = theano.function([], v2+theano.dot(v1,m), mode = mode_without_gpu)
gpu_f = theano.function([], v2+theano.dot(v1,m), mode = mode_with_gpu)
#gpu_f2 is needed to test the case when the input is not on the gpu
#but the output is moved to the gpu.
gpu_f2 = theano.function([], tcn.gpu_from_host(v2+theano.dot(v1,m)), mode = mode_with_gpu)
v1 = theano.shared(numpy.array(numpy.random.rand(5), dtype='float32'))
v2 = theano.shared(numpy.array(numpy.random.rand(2), dtype='float32'))
m = theano.shared(numpy.array(numpy.random.rand(5, 2),
dtype='float32'))
no_gpu_f = theano.function([], v2 + theano.dot(v1, m),
mode=mode_without_gpu)
gpu_f = theano.function([], v2 + theano.dot(v1, m),
mode=mode_with_gpu)
# gpu_f2 is needed to test the case when the input is not on the gpu
# but the output is moved to the gpu.
gpu_f2 = theano.function([], tcn.gpu_from_host(v2 + theano.dot(v1, m)),
mode=mode_with_gpu)
# Assert they produce the same output
assert numpy.allclose(no_gpu_f(), gpu_f(), atol=self.atol)
......@@ -425,6 +478,7 @@ class TestGpuGer(TestGer):
self.ger = gpu_ger_inplace
self.gemm = tcn.blas.gpu_gemm_inplace
class TestGpuGerNoTransfer(TestGer):
@staticmethod
def shared(val):
......
......@@ -21,7 +21,6 @@ from theano.tensor import opt, get_constant_value
from theano import gof
from theano.gof.python25 import maxsize
from theano.compile import optdb
from theano import config
from theano.compile.function_module import deep_copy_op
import scan_op
......@@ -97,7 +96,6 @@ def remove_constants_and_unused_inputs_scan(node):
try:
# This works if input is a constant that has all entries
# equal
val = tensor.get_constant_value(node.inputs[idx + 1])
givens[op_ins[idx]] = node.inputs[idx + 1].clone()[0]
except TypeError:
pass
......@@ -729,7 +727,6 @@ class ScanSaveMem(gof.Optimizer):
nw_slice = (fslice,) + tuple(old_slices[1:])
nw_pos = inv_compress_map[idx]
nw_out = new_outs[nw_pos]
subtens = tensor.basic.Subtensor(nw_slice)
# slice inputs
......@@ -748,7 +745,6 @@ class ScanSaveMem(gof.Optimizer):
for pos, old_outs in old_outputs:
if len(old_outs) > 0:
nw_pos = compress_map[pos]
nw_out = new_outs[nw_pos]
for k, old in enumerate(old_outs):
# Get the correct slice
cnf_slice, old_slices = slices[pos][k]
......@@ -1066,7 +1062,6 @@ def scan_merge_inouts(node):
else:
a_inner_outs = a.inner_outputs
inner_outputs = scan_utils.clone(a_inner_outs, replace=inp_equiv)
orig_outputs = a.outer_outputs
op = scan_op.Scan(inner_inputs, inner_outputs, info)
outputs = op(*outer_inputs)
......
......@@ -2,9 +2,7 @@
__docformat__ = "restructuredtext en"
import __builtin__
import sys
from theano.configparser import config
import warnings
from itertools import izip
......@@ -12,6 +10,7 @@ import numpy
#from copy import copy as python_copy
import theano
from theano.configparser import config
from theano import gof
from theano.gof import Apply, Constant, Op, Type, Value, Variable
......@@ -185,7 +184,7 @@ def as_tensor_variable(x, name=None, ndim=None):
except TypeError:
try:
str_x = str(x)
except Exception, e:
except Exception:
str_x = repr(x)
raise TypeError("Cannot convert %s to TensorType" % str_x, type(x))
......@@ -727,7 +726,6 @@ class TensorType(Type):
self=self)
)
def value_validity_msg(self, a):
try:
self.filter(a, strict=True)
......@@ -735,33 +733,35 @@ class TensorType(Type):
return str(e)
return "value is valid"
def dtype_specs(self):
"""Return a tuple (python type, c type, numpy typenum) that corresponds to
self.dtype.
"""Return a tuple (python type, c type, numpy typenum) that corresponds
to self.dtype.
This function is used internally as part of C code generation.
"""
#TODO: add more type correspondances for e.g. int32, int64, float32,
#complex64, etc.
try:
return {'float32': (float, 'npy_float32', 'NPY_FLOAT32'),
'float64': (float, 'npy_float64', 'NPY_FLOAT64'),
'uint8': (int, 'npy_uint8', 'NPY_UINT8'),
'int8': (int, 'npy_int8', 'NPY_INT8'),
'uint16': (int, 'npy_uint16', 'NPY_UINT16'),
'int16': (int, 'npy_int16', 'NPY_INT16'),
'uint32': (int, 'npy_uint32', 'NPY_UINT32'),
'int32': (int, 'npy_int32', 'NPY_INT32'),
'uint64': (int, 'npy_uint64', 'NPY_UINT64'),
'int64': (int, 'npy_int64', 'NPY_INT64'),
'complex128': (complex, 'theano_complex128', 'NPY_COMPLEX128'),
'complex64': (complex, 'theano_complex64', 'NPY_COMPLEX64')}[self.dtype]
return {
'float32': (float, 'npy_float32', 'NPY_FLOAT32'),
'float64': (float, 'npy_float64', 'NPY_FLOAT64'),
'uint8': (int, 'npy_uint8', 'NPY_UINT8'),
'int8': (int, 'npy_int8', 'NPY_INT8'),
'uint16': (int, 'npy_uint16', 'NPY_UINT16'),
'int16': (int, 'npy_int16', 'NPY_INT16'),
'uint32': (int, 'npy_uint32', 'NPY_UINT32'),
'int32': (int, 'npy_int32', 'NPY_INT32'),
'uint64': (int, 'npy_uint64', 'NPY_UINT64'),
'int64': (int, 'npy_int64', 'NPY_INT64'),
'complex128': (complex, 'theano_complex128', 'NPY_COMPLEX128'),
'complex64': (complex, 'theano_complex64', 'NPY_COMPLEX64')
}[self.dtype]
except KeyError:
raise TypeError("Unsupported dtype for %s: %s" % (self.__class__.__name__, self.dtype))
raise TypeError("Unsupported dtype for %s: %s"
% (self.__class__.__name__, self.dtype))
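# Illustrative sketch (not from the original file): dtype_specs() returns a
# (python type, C type name, numpy typenum macro) triple taken from the
# mapping above; the instance below is hypothetical.
from theano.tensor import TensorType
t = TensorType('float32', (False, False))
py_type, c_type, npy_enum = t.dtype_specs()
assert py_type is float
assert c_type == 'npy_float32'
assert npy_enum == 'NPY_FLOAT32'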
def to_scalar_type(self):
return scal.Scalar(dtype = self.dtype)
return scal.Scalar(dtype=self.dtype)
def __eq__(self, other):
"""Compare True iff other is the same kind of TensorType"""
......@@ -769,10 +769,10 @@ class TensorType(Type):
and other.broadcastable == self.broadcastable
@staticmethod
def may_share_memory(a,b):
def may_share_memory(a, b):
# This is a method of TensorType, so both a and b should be ndarrays
if isinstance(a, numpy.ndarray) and isinstance(b, numpy.ndarray):
return numpy.may_share_memory(a,b)
return numpy.may_share_memory(a, b)
else:
return False
......@@ -784,9 +784,10 @@ class TensorType(Type):
return False
if force_same_dtype and a.dtype != b.dtype:
return False
a_eq_b = (a==b)
a_eq_b = (a == b)
r = numpy.all(a_eq_b)
if r: return True
if r:
return True
# maybe the trouble is that there are NaNs
a_missing = numpy.isnan(a)
if a_missing.any():
......@@ -794,8 +795,9 @@ class TensorType(Type):
return numpy.all(a_eq_b + (a_missing == b_missing))
else:
return False
@staticmethod
def values_eq_approx(a, b, allow_remove_inf = False, allow_remove_nan = False):
def values_eq_approx(a, b, allow_remove_inf=False, allow_remove_nan=False):
"""
:param allow_remove_inf: If True, when there is an inf in a,
we allow any value in b in that position.
......@@ -810,10 +812,11 @@ class TensorType(Type):
if a.dtype != b.dtype:
return False
if 'int' in str(a.dtype):
return numpy.all(a==b)
return numpy.all(a == b)
else:
#work around a numpy.allclose bug: http://projects.scipy.org/numpy/ticket/1672
if a.ndim==0 and numpy.isinf(a):
# work around a numpy.allclose bug:
# http://projects.scipy.org/numpy/ticket/1672
if a.ndim == 0 and numpy.isinf(a):
a = a.reshape(1)
b = b.reshape(1)
......@@ -835,9 +838,10 @@ class TensorType(Type):
if not (a_missing.any() or (allow_remove_inf and a_inf.any())):
# There are no missing values in a, thus this is not the
# reason why numpy.allclose(a, b) returned False.
_logger.info('numpy allclose failed for abs_err %f and rel_err %f',
numpy.max(abs(a-b)),
numpy.max(abs(a-b) / (abs(a) + abs(b))))
_logger.info(
'numpy allclose failed for abs_err %f and rel_err %f',
numpy.max(abs(a - b)),
numpy.max(abs(a - b) / (abs(a) + abs(b))))
return False
# The following line is what numpy.allclose bases its decision
# upon, according to its documentation.
......@@ -853,11 +857,13 @@ class TensorType(Type):
#cmp_elemwise is weird when we have inf and -inf.
#set it to False
cmp_elemwise = numpy.where(both_inf&cmp_elemwise,
a==b,cmp_elemwise)
cmp_elemwise = numpy.where(
both_inf & cmp_elemwise,
a == b,
cmp_elemwise)
#check the sign of the inf
both_inf = numpy.where(both_inf,a==b,both_inf)
both_inf = numpy.where(both_inf, (a == b), both_inf)
if allow_remove_inf:
both_inf += a_inf
......@@ -871,37 +877,38 @@ class TensorType(Type):
@staticmethod
def values_eq_approx_remove_inf(a, b):
return TensorType.values_eq_approx(a,b,True)
return TensorType.values_eq_approx(a, b, True)
@staticmethod
def values_eq_approx_remove_nan(a, b):
return TensorType.values_eq_approx(a,b,False,True)
return TensorType.values_eq_approx(a, b, False, True)
@staticmethod
def values_eq_approx_remove_inf_nan(a, b):
return TensorType.values_eq_approx(a,b,True,True)
return TensorType.values_eq_approx(a, b, True, True)
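# Illustrative sketch of the semantics documented above (array values are
# hypothetical; the elided body does the detailed NaN/inf bookkeeping).
import numpy
from theano.tensor import TensorType
a = numpy.array([1.0, numpy.inf], dtype='float64')
b = numpy.array([1.0 + 1e-12, 0.0], dtype='float64')
# The plain approximate check rejects the mismatch at the inf position ...
assert not TensorType.values_eq_approx(a, b)
# ... while the *_remove_inf wrapper accepts any value in b wherever a is inf.
assert TensorType.values_eq_approx_remove_inf(a, b)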
def __hash__(self):
"""Hash equal for same kinds of TensorType"""
return hashtype(self) ^ hash(self.dtype) ^ hash(self.broadcastable)
ndim = property(lambda self: len(self.broadcastable), doc = "number of dimensions")
ndim = property(lambda self: len(self.broadcastable),
doc="number of dimensions")
"""Number of dimensions
This read-only property is the preferred way to get the number of dimensions
of a `TensorType`.
This read-only property is the preferred way to get the number of
dimensions of a `TensorType`.
"""
def make_variable(self, name = None):
def make_variable(self, name=None):
"""Return a `TensorVariable` of this type
:Parameters:
- `name`: str
A pretty name to identify this `Variable` when printing and debugging
A pretty name to identify this `Variable` when printing and
debugging
"""
return TensorVariable(self, name = name)
return TensorVariable(self, name=name)
def __str__(self):
if self.name:
......@@ -932,14 +939,14 @@ class TensorType(Type):
PyArrayObject* %(name)s;
int type_num_%(name)s;
typedef %(dtype)s dtype_%(name)s;
""" % dict(sub, name = name, dtype = self.dtype_specs()[1])
""" % dict(sub, name=name, dtype=self.dtype_specs()[1])
def c_init(self, name, sub):
"""Override `CLinkerOp.c_init` """
return """
%(name)s = NULL;
type_num_%(name)s = %(type_num)s;
""" % dict(sub, name = name, type_num = self.dtype_specs()[2])
""" % dict(sub, name=name, type_num=self.dtype_specs()[2])
def c_extract(self, name, sub):
"""Override `CLinkerOp.c_extract` """
......@@ -969,7 +976,7 @@ class TensorType(Type):
}
%(name)s = (PyArrayObject*)(py_%(name)s);
Py_XINCREF(%(name)s);
""" % dict(sub, name = name, type_num = self.dtype_specs()[2])
""" % dict(sub, name=name, type_num=self.dtype_specs()[2])
def c_cleanup(self, name, sub):
"""Override `CLinkerOp.c_cleanup` """
......@@ -1018,12 +1025,14 @@ class TensorType(Type):
# to have OutputGuard generate C code for this type.
theano.compile.mode.register_OutputGuard_c_code(TensorType)
# Easy constructors
def tensor(*args, **kwargs):
name = kwargs.pop('name',None)
name = kwargs.pop('name', None)
return TensorType(*args, **kwargs).make_variable(name=name)
def _multi(*fns):
def f2(f, *names):
if names and isinstance(names[0], int):
......@@ -1051,7 +1060,9 @@ bscalar = TensorType('int8', ())
wscalar = TensorType('int16', ())
iscalar = TensorType('int32', ())
lscalar = TensorType('int64', ())
def scalar(name = None, dtype = None):
def scalar(name=None, dtype=None):
"""Return a symbolic scalar variable.
:param dtype: numeric type (None means to use theano.config.floatX)
:param name: a name to attach to this variable
......@@ -1060,7 +1071,9 @@ def scalar(name = None, dtype = None):
dtype = config.floatX
type = TensorType(dtype, ())
return type(name)
scalars, fscalars, dscalars, iscalars, lscalars = _multi(scalar, fscalar, dscalar, iscalar, lscalar)
scalars, fscalars, dscalars, iscalars, lscalars = _multi(
scalar, fscalar, dscalar, iscalar, lscalar)
int_types = bscalar, wscalar, iscalar, lscalar
float_types = fscalar, dscalar
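# Illustrative usage sketch (standard Theano idiom, names are hypothetical):
# build symbolic scalars with the easy constructors and compile a function.
import theano
import theano.tensor as T
x = T.dscalar('x')   # float64 scalar, i.e. dscalar above
n = T.iscalar('n')   # int32 scalar, i.e. iscalar above
f = theano.function([x, n], x ** n)
print f(2.0, 3)      # -> 8.0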
......@@ -1077,7 +1090,9 @@ bvector = TensorType('int8', (False,))
wvector = TensorType('int16', (False,))
ivector = TensorType('int32', (False, ))
lvector = TensorType('int64', (False, ))
def vector(name = None, dtype = None):
def vector(name=None, dtype=None):
"""Return a symbolic vector variable.
:param dtype: numeric type (None means to use theano.config.floatX)
:param name: a name to attach to this variable
......@@ -1086,7 +1101,9 @@ def vector(name = None, dtype = None):
dtype = config.floatX
type = TensorType(dtype, (False, ))
return type(name)
vectors, fvectors, dvectors, ivectors, lvectors = _multi(vector, fvector, dvector, ivector, lvector)
vectors, fvectors, dvectors, ivectors, lvectors = _multi(
vector, fvector, dvector, ivector, lvector)
int_vector_types = bvector, wvector, ivector, lvector
float_vector_types = fvector, dvector
......@@ -1100,7 +1117,9 @@ bmatrix = TensorType('int8', (False, False))
wmatrix = TensorType('int16', (False, False))
imatrix = TensorType('int32', (False, False))
lmatrix = TensorType('int64', (False, False))
def matrix(name = None, dtype = None):
def matrix(name=None, dtype=None):
"""Return a symbolic matrix variable.
:param dtype: numeric type (None means to use theano.config.floatX)
:param name: a name to attach to this variable
......@@ -1109,7 +1128,9 @@ def matrix(name = None, dtype = None):
dtype = config.floatX
type = TensorType(dtype, (False, False))
return type(name)
matrices, fmatrices, dmatrices, imatrices, lmatrices = _multi(matrix, fmatrix, dmatrix, imatrix, lmatrix)
matrices, fmatrices, dmatrices, imatrices, lmatrices = _multi(
matrix, fmatrix, dmatrix, imatrix, lmatrix)
int_matrix_types = bmatrix, wmatrix, imatrix, lmatrix
float_matrix_types = fmatrix, dmatrix
......@@ -1123,7 +1144,9 @@ brow = TensorType('int8', (True, False))
wrow = TensorType('int16', (True, False))
irow = TensorType('int32', (True, False))
lrow = TensorType('int64', (True, False))
def row(name = None, dtype = None):
def row(name=None, dtype=None):
"""Return a symbolic row variable (ndim=2, broadcastable=[True,False]).
:param dtype: numeric type (None means to use theano.config.floatX)
:param name: a name to attach to this variable
......@@ -1142,7 +1165,9 @@ bcol = TensorType('int8', (False, True))
wcol = TensorType('int16', (False, True))
icol = TensorType('int32', (False, True))
lcol = TensorType('int64', (False, True))
def col(name = None, dtype = None):
def col(name=None, dtype=None):
"""Return a symbolic column variable (ndim=2, broadcastable=[False,True]).
:param dtype: numeric type (None means to use theano.config.floatX)
:param name: a name to attach to this variable
......@@ -1153,14 +1178,16 @@ def col(name = None, dtype = None):
return type(name)
cols, fcols, dcols, icols, lcols = _multi(col, fcol, dcol, icol, lcol)
ctensor3 = TensorType('complex64', (False,)*3)
ztensor3 = TensorType('complex128', (False,)*3)
ftensor3 = TensorType('float32', (False,)*3)
dtensor3 = TensorType('float64', (False,)*3)
btensor3 = TensorType('int8', (False,)*3)
wtensor3 = TensorType('int16', (False,)*3)
itensor3 = TensorType('int32', (False,)*3)
ltensor3 = TensorType('int64', (False,)*3)
ctensor3 = TensorType('complex64', ((False,) * 3))
ztensor3 = TensorType('complex128', ((False,) * 3))
ftensor3 = TensorType('float32', ((False,) * 3))
dtensor3 = TensorType('float64', ((False,) * 3))
btensor3 = TensorType('int8', ((False,) * 3))
wtensor3 = TensorType('int16', ((False,) * 3))
itensor3 = TensorType('int32', ((False,) * 3))
ltensor3 = TensorType('int64', ((False,) * 3))
def tensor3(name=None, dtype=None):
"""Return a symbolic 3-D variable.
:param dtype: numeric type (None means to use theano.config.floatX)
......@@ -1170,17 +1197,20 @@ def tensor3(name=None, dtype=None):
dtype = config.floatX
type = TensorType(dtype, (False, False, False))
return type(name)
tensor3s, ftensor3s, dtensor3s, itensor3s, ltensor3s = _multi(tensor3, ftensor3, dtensor3,
itensor3, ltensor3)
ctensor4 = TensorType('complex64', (False,)*4)
ztensor4 = TensorType('complex128', (False,)*4)
ftensor4 = TensorType('float32', (False,)*4)
dtensor4 = TensorType('float64', (False,)*4)
btensor4 = TensorType('int8', (False,)*4)
wtensor4 = TensorType('int16', (False,)*4)
itensor4 = TensorType('int32', (False,)*4)
ltensor4 = TensorType('int64', (False,)*4)
tensor3s, ftensor3s, dtensor3s, itensor3s, ltensor3s = _multi(
tensor3, ftensor3, dtensor3, itensor3, ltensor3)
ctensor4 = TensorType('complex64', ((False,) * 4))
ztensor4 = TensorType('complex128', ((False,) * 4))
ftensor4 = TensorType('float32', ((False,) * 4))
dtensor4 = TensorType('float64', ((False,) * 4))
btensor4 = TensorType('int8', ((False,) * 4))
wtensor4 = TensorType('int16', ((False,) * 4))
itensor4 = TensorType('int32', ((False,) * 4))
ltensor4 = TensorType('int64', ((False,) * 4))
def tensor4(name=None, dtype=None):
"""Return a symbolic 4-D variable.
:param dtype: numeric type (None means to use theano.config.floatX)
......@@ -1190,114 +1220,147 @@ def tensor4(name=None, dtype=None):
dtype = config.floatX
type = TensorType(dtype, (False, False, False, False))
return type(name)
tensor4s, ftensor4s, dtensor4s, itensor4s, ltensor4s = _multi(tensor4, ftensor4, dtensor4,
itensor4, ltensor4)
tensor4s, ftensor4s, dtensor4s, itensor4s, ltensor4s = _multi(
tensor4, ftensor4, dtensor4, itensor4, ltensor4)
class _tensor_py_operators:
#UNARY
def __abs__(self): return abs_(self)
def __neg__(self): return neg(self)
def __abs__(self):
return abs_(self)
def __neg__(self):
return neg(self)
#CASTS
#### REMOVED THESE BECAUSE PYTHON appears to require __int__ to return an int. -JB 20081112
#### REMOVED THESE BECAUSE PYTHON appears to require __int__ to return
#### an int. -JB 20081112
#def __int__(self): return convert_to_int32(self)
#def __float__(self): return convert_to_float64(self)
#def __complex__(self): return convert_to_complex128(self)
#COMPARISONS
_is_nonzero = True
def __lt__(self,other):
def __lt__(self, other):
rval = lt(self, other)
rval._is_nonzero=False
rval._is_nonzero = False
return rval
def __le__(self,other):
rval = le(self, other)
rval._is_nonzero=False
def __le__(self, other):
rval = le(self, other)
rval._is_nonzero = False
return rval
def __gt__(self,other):
def __gt__(self, other):
rval = gt(self, other)
rval._is_nonzero=False
rval._is_nonzero = False
return rval
def __ge__(self,other):
def __ge__(self, other):
rval = ge(self, other)
rval._is_nonzero=False
rval._is_nonzero = False
return rval
def __nonzero__(self):
# This is meant to prohibit stuff like a < b < c, which is internally implemented as
# (a < b) and (b < c). The trouble with this is the side-effect that checking for a
# non-NULL a by typing "if a: ..." uses the same __nonzero__ method. We want these
# both to work, but it seems impossible. Currently, all vars evaluate to nonzero
# except the return values of comparison operators, which raise this exception. If you
# can think of a better solution, go for it!
# This is meant to prohibit stuff like a < b < c, which is internally
# implemented as (a < b) and (b < c). The trouble with this is the
# side-effect that checking for a non-NULL a by typing "if a: ..."
# uses the same __nonzero__ method. We want these both to work, but
# it seems impossible. Currently, all vars evaluate to nonzero except
# the return values of comparison operators, which raise this
# exception. If you can think of a better solution, go for it!
if self._is_nonzero:
return True
else:
raise TypeError("Variable does not support boolean operations.")
#BITWISE
def __invert__(self): return invert(self)
def __and__(self,other): return and_(self, other)
def __or__(self,other): return or_(self, other)
def __xor__(self,other): return xor(self, other)
def __rand__(self,other): return and_(other,self)
def __ror__(self,other): return or_(other, self)
def __rxor__(self,other): return xor(other, self)
# def __iand__(self, other): return _and_inplace(self, other)
# def __ior__(self, other): return _or_inplace(self, other)
# def __ixor__(self, other): return _xor_inplace(self, other)
def __invert__(self):
return invert(self)
def __and__(self, other):
return and_(self, other)
def __or__(self, other):
return or_(self, other)
def __xor__(self, other):
return xor(self, other)
def __rand__(self, other):
return and_(other, self)
def __ror__(self, other):
return or_(other, self)
def __rxor__(self, other):
return xor(other, self)
#def __iand__(self, other):
# return _and_inplace(self, other)
#
#def __ior__(self, other):
# return _or_inplace(self, other)
#
#def __ixor__(self, other):
# return _xor_inplace(self, other)
#ARITHMETIC - NORMAL
def __add__(self,other):
def __add__(self, other):
try:
return add(self,other)
return add(self, other)
# We should catch the minimum number of exceptions here.
# Otherwise this will convert errors when the Theano flag
# compute_test_value is used.
# Evidently, we need to catch NotImplementedError,
# but we also need to catch TypeError;
# otherwise TensorVariable * SparseVariable won't work!
except (NotImplementedError, TypeError), e:
except (NotImplementedError, TypeError):
# We must return NotImplemented and not a
# NotImplementedError, nor raise a NotImplementedError.
# That way python will give a good error message like this
# `TypeError: unsupported operand type(s) for +:
# 'TensorVariable' and 'TensorVariable'`
return NotImplemented
def __sub__(self,other):
def __sub__(self, other):
# See explanation in __add__ for the error caught
# and the return value in that case
try:
return sub(self,other)
except (NotImplementedError, TypeError), e:
return sub(self, other)
except (NotImplementedError, TypeError):
return NotImplemented
def __mul__(self,other):
def __mul__(self, other):
# See explanation in __add__ for the error caught
# and the return value in that case
try:
return mul(self,other)
except (NotImplementedError, TypeError), e:
return mul(self, other)
except (NotImplementedError, TypeError):
return NotImplemented
def __div__(self,other):
def __div__(self, other):
# See explanation in __add__ for the error caught
# and the return value in that case
try:
return div_proxy(self,other)
return div_proxy(self, other)
except IntegerDivisionError:
# This is to raise the exception that occurs when trying to divide
# two integer arrays (currently forbidden).
raise
except (NotImplementedError, TypeError), e:
except (NotImplementedError, TypeError):
return NotImplemented
def __pow__(self,other):
def __pow__(self, other):
# See explanation in __add__ for the error caught
# and the return value in that case
try:
return pow(self,other)
except (NotImplementedError, TypeError), e:
return pow(self, other)
except (NotImplementedError, TypeError):
return NotImplemented
def __mod__(self,other):
def __mod__(self, other):
# See explanation in __add__ for the error caught
# and the return value in that case
try:
......@@ -1306,29 +1369,56 @@ class _tensor_py_operators:
# This is to raise the exception that occurs when trying to compute
# x % y with either x or y a complex number.
raise
except (NotImplementedError, TypeError), e:
except (NotImplementedError, TypeError):
return NotImplemented
def __truediv__(self,other): return true_div(self, other)
def __floordiv__(self,other): return floor_div(self, other)
def __rtruediv__(self,other): return true_div(other, self)
def __rfloordiv__(self,other): return floor_div(other, self)
# ##### DON"T USE THESE BECAUSE INPLACE OPS SHOULD BE INSERTED BY OPTIMIZATION ONLY
# #ARITHMETIC - INPLACE
# def __iadd__(self,other): return _add_inplace(self,other)
# def __isub__(self,other): return _sub_inplace(self,other)
# def __imul__(self,other): return _mul_inplace(self,other)
# def __idiv__(self,other): return _div_inplace(self,other)
# def __ipow__(self,other): return _pow_inplace(self,other)
#ARITHMETIC - RIGHT-OPERAND
def __radd__(self,other): return add(other,self)
def __rsub__(self,other): return sub(other,self)
def __rmul__(self,other): return mul(other,self)
def __rdiv__(self,other): return div_proxy(other,self)
def __rmod__(self,other): return mod(other,self)
def __rpow__(self,other): return pow(other,self)
def __truediv__(self, other):
return true_div(self, other)
def __floordiv__(self, other):
return floor_div(self, other)
def __rtruediv__(self, other):
return true_div(other, self)
def __rfloordiv__(self, other):
return floor_div(other, self)
##### DO NOT USE THESE BECAUSE INPLACE OPS SHOULD BE INSERTED
##### BY OPTIMIZATIONS ONLY
## ARITHMETIC - INPLACE
#def __iadd__(self, other):
# return _add_inplace(self, other)
#def __isub__(self, other):
# return _sub_inplace(self, other)
#
#def __imul__(self, other):
# return _mul_inplace(self, other)
#
#def __idiv__(self, other):
# return _div_inplace(self, other)
#
#def __ipow__(self, other):
# return _pow_inplace(self, other)
# ARITHMETIC - RIGHT-OPERAND
def __radd__(self, other):
return add(other, self)
def __rsub__(self, other):
return sub(other, self)
def __rmul__(self, other):
return mul(other, self)
def __rdiv__(self, other):
return div_proxy(other, self)
def __rmod__(self, other):
return mod(other, self)
def __rpow__(self, other):
return pow(other, self)
#TRANSPOSE
T = property(lambda self: transpose(self))
......@@ -1360,43 +1450,51 @@ class _tensor_py_operators:
size = property(lambda self: prod(self.shape))
# We can't implement __len__ to provide a better error message.
def any(self, axis = None):
def any(self, axis=None):
return elemwise.Any(axis)(self)
def all(self, axis = None):
def all(self, axis=None):
return elemwise.All(axis)(self)
# Otherwise TensorVariable[:-1] does not work as Python 2.5.1 calls
# __len__ before calling __getitem__. It also does not catch the raised
# Exception!
# def __len__(self):
# # We can't implement __len__ as Python requests that this
# # function returns an integer >=0
# raise Exception("Theano Variables can't work with len(Theano "
# "Variable) due to Python restriction. You can use "
# "TheanoVariable.shape[0] instead.")
# def __len__(self):
# # We can't implement __len__ as Python requests that this
# # function returns an integer >=0
# raise Exception("Theano Variables can't work with len(Theano "
# "Variable) due to Python restriction. You can use "
# "TheanoVariable.shape[0] instead.")
def reshape(self, shape, ndim=None):
"""Return a reshaped view/copy of this variable.
:param shape: something that can be converted to a symbolic vector of integers
:param shape: something that can be converted to a symbolic vector of
integers
:param ndim: the length of the shape. Passing None here means for theano to try and
guess the length of `shape`.
:param ndim: the length of the shape. Passing None here means for
theano to try and guess the length of `shape`.
"""
return reshape(self, shape, ndim=ndim)
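# Illustrative usage sketch (hypothetical shapes, standard Theano idiom):
# flatten a symbolic matrix into a vector with reshape().
import numpy
import theano
import theano.tensor as T
x = T.dmatrix('x')
flat = x.reshape((x.shape[0] * x.shape[1],), ndim=1)
f = theano.function([x], flat)
print f(numpy.arange(6.).reshape(2, 3))   # -> [ 0.  1.  2.  3.  4.  5.]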
def dimshuffle(self, *pattern):
"""Reorder the dimensions of this variable, optionally inserting broadcasted dimensions.
"""
Reorder the dimensions of this variable, optionally inserting
broadcasted dimensions.
:param pattern: list/tuple of int mixed with 'x' for broadcastable dimensions
:param pattern: list/tuple of int mixed with 'x' for broadcastable
dimensions
For example, to create a 3D view of a [2D] matrix, call ``dimshuffle([0,'x',1])``. This
will create a 3D view such that the middle dimension is an implicit broadcasted
dimension. To do the same thing on the transpose of that matrix, call ``dimshuffle([1,
'x', 0])``.
For example, to create a 3D view of a [2D] matrix, call
``dimshuffle([0,'x',1])``. This will create a 3D view such that the
middle dimension is an implicit broadcasted dimension. To do the same
thing on the transpose of that matrix, call
``dimshuffle([1, 'x', 0])``.
This function supports the pattern passed as a tuple, or as a variable-length argument (e.g. ``a.dimshuffle(pattern)`` is equivalent to ``a.dimshuffle(*pattern)`` where ``pattern`` is a list/tuple of ints mixed with 'x' characters).
This function supports the pattern passed as a tuple, or as a
variable-length argument (e.g. ``a.dimshuffle(pattern)`` is equivalent
to ``a.dimshuffle(*pattern)`` where ``pattern`` is a list/tuple of ints
mixed with 'x' characters).
For more information, see `DimShuffle`.
"""
......@@ -1447,7 +1545,8 @@ class _tensor_py_operators:
else:
return AdvancedSubtensor()(self, *args)
else:
return Subtensor(args)(self, *Subtensor.collapse(args, lambda entry: isinstance(entry, Variable)))
return Subtensor(args)(self, *Subtensor.collapse(args,
lambda entry: isinstance(entry, Variable)))
#COPYING
def copy(self):
......@@ -1457,11 +1556,11 @@ class _tensor_py_operators:
try:
for i in xrange(get_vector_length(self)):
yield self[i]
except TypeError, e:
except TypeError:
# This prevents accidental iteration via builtin.sum(self)
raise TypeError('TensorType does not support iteration. '
'Maybe you are using builtin.sum instead of theano.tensor.sum? (Maybe .max?)')
raise TypeError(('TensorType does not support iteration. '
'Maybe you are using builtin.sum instead of '
'theano.tensor.sum? (Maybe .max?)'))
# CONVENIENT ACCESS TO TYPE PROPERTIES
ndim = property(lambda self: self.type.ndim)
......@@ -1471,7 +1570,6 @@ class _tensor_py_operators:
"""The broadcastable signature of this tensor.
See :doc:`broadcasting` for details.
"""
dtype = property(lambda self: self.type.dtype)
......@@ -1493,12 +1591,12 @@ class _tensor_py_operators:
return prod(self, axis=axis, dtype=dtype)
def norm(self, L, axis=None):
if L==0:
if L == 0:
raise NotImplementedError()
if numpy.isinf(L):
raise NotImplementedError()
#optimizations will/should catch cases like L=1, L=2
return pow(pow(abs_(self), L).sum(axis=axis), 1.0/L)
return pow(pow(abs_(self), L).sum(axis=axis), 1.0 / L)
def mean(self, axis=None, dtype=None):
"""See `theano.tensor.mean`"""
......@@ -1521,6 +1619,7 @@ class _tensor_py_operators:
def get_constant_value(self):
return get_constant_value(self)
def zeros_like(model):
return zeros_like(model)
......@@ -1540,17 +1639,19 @@ class TensorConstantSignature(tuple):
if type(self) != type(other):
return False
try:
(t0, d0), (t1,d1) = self, other
except Exception, e:
(t0, d0), (t1, d1) = self, other
except Exception:
return False
#N.B. compare shape to ensure no broadcasting in ==
if t0 != t1 or d0.shape != d1.shape:
return False
no_nan = self.no_nan # Ensure has_nan is computed.
self.no_nan # Ensure has_nan is computed.
# Note that in the comparisons below, the elementwise comparisons
# come last because they are the most expensive checks.
if self.has_nan:
other_no_nan = other.no_nan
other.no_nan # Ensure has_nan is computed.
return (other.has_nan and
self.sum == other.sum and
(self.no_nan.mask == other.no_nan.mask).all() and
......@@ -1620,7 +1721,7 @@ class TensorConstant(_tensor_py_operators, Constant):
To create a TensorConstant, use the `constant` function in this module.
"""
def __init__(self, type, data, name = None):
def __init__(self, type, data, name=None):
Constant.__init__(self, type, data, name)
if (isinstance(data, numpy.ndarray) and
data.ndim > 0 and
......@@ -1631,12 +1732,12 @@ class TensorConstant(_tensor_py_operators, Constant):
def __str__(self):
if self.tag.unique_value is not None:
name = "%s of %s"%(str(self.data.shape),
name = "%s of %s" % (str(self.data.shape),
str(self.tag.unique_value))
else:
name = "%s"%self.data
name = "%s" % self.data
if len(name) > 20:
name = name[:10]+".."+name[-10:]
name = name[:10] + ".." + name[-10:]
return "TensorConstant{%s}" % name
......@@ -1677,15 +1778,19 @@ def _redefine(real_symbol_value, module='tensor'):
This is useful to trick epydoc into doing what we want. It's a hack.
"""
real_symbol_value.__module__ = 'tensor.basic'
def decorator(f):
return real_symbol_value
return decorator
def _redefine_asRoutine(real_symbol_value):
real_symbol_value.__epydoc_asRoutine = True
def decorator(f):
return real_symbol_value
return decorator
......@@ -1707,17 +1812,18 @@ def _scal_elemwise_with_nfunc(nfunc, nin, nout):
msg = "inplace"
else:
msg = "no_inplace"
n="Elemwise{%s,%s}"%(symbolname,msg)
n = "Elemwise{%s,%s}" % (symbolname, msg)
if inplace:
scalar_op = getattr(scal, symbolname[:-len('_inplace')])
inplace_scalar_op = scalar_op.__class__(scal.transfer_type(0))
rval = elemwise.Elemwise(inplace_scalar_op, {0: 0}, name=n,
nfunc_spec = nfunc and (nfunc, nin, nout))
nfunc_spec=(nfunc and (nfunc, nin, nout)))
else:
scalar_op = getattr(scal, symbolname)
rval = elemwise.Elemwise(scalar_op, name=n,
nfunc_spec = nfunc and (nfunc, nin, nout))
nfunc_spec=(nfunc and (nfunc, nin, nout)))
if getattr(symbol, '__doc__', False):
rval.__doc__ = symbol.__doc__ + '\n' + rval.__doc__
......@@ -1744,35 +1850,44 @@ class TensorFromScalar(Op):
assert isinstance(s.type, scal.Scalar)
return Apply(self,
[s],
[tensor(dtype = s.type.dtype,
broadcastable = ())])
[tensor(dtype=s.type.dtype,
broadcastable=())])
def perform(self, node, inp, out_):
s, = inp
out, = out_
out[0] = numpy.asarray(s)
def grad(self, inp, grads):
s, = inp
dt, = grads
return [scalar_from_tensor(dt)]
def __str__(self):
return self.__class__.__name__
tensor_from_scalar = TensorFromScalar()
class ScalarFromTensor(Op):
def __eq__(self, other):
return type(self) == type(other)
def __hash__(self):
return hash(type(self))
def make_node(self, t):
assert isinstance(t.type, TensorType)
assert t.type.broadcastable == ()
return Apply(self,
[t],
[scal.Scalar(dtype = t.type.dtype).make_variable()])
[scal.Scalar(dtype=t.type.dtype).make_variable()])
def perform(self, node, inp, out_):
s, = inp
out, = out_
out[0] = s.flatten()[0]
def grad(self, inp, grads):
s, = inp
dt, = grads
......@@ -1785,66 +1900,81 @@ class ScalarFromTensor(Op):
def __str__(self):
return self.__class__.__name__
def c_code(self, node, name, inputs, outputs, sub):
x, = inputs
z, = outputs
fail = sub['fail']
return """
%(z)s = ((dtype_%(x)s*)(%(x)s->data))[0];
"""%locals()
""" % locals()
def c_code_cache_version(self):
return (1,)
scalar_from_tensor = ScalarFromTensor()
#to be removed as we get the epydoc routine-documenting thing going -JB 20080924
#to be removed as we get the epydoc routine-documenting thing going
#-JB 20080924
def _conversion(real_value, name):
__oplist_tag(real_value, 'casting')
real_value.__module__='tensor.basic'
real_value.__module__ = 'tensor.basic'
pprint.assign(real_value, printing.FunctionPrinter(name))
return real_value
#
# These _conver_to_<type> functions have leading underscores to indicate that they should not
# be called directly. They do not perform sanity checks about what types you are casting to
# what. That logic is implemented by the `cast()` function below.
#
# These _conver_to_<type> functions have leading underscores to indicate that
# they should not be called directly. They do not perform sanity checks about
# what types you are casting to what. That logic is implemented by the
# `cast()` function below.
_convert_to_int8 = _conversion(elemwise.Elemwise(scal.convert_to_int8), 'int8')
_convert_to_int8 = _conversion(
elemwise.Elemwise(scal.convert_to_int8), 'int8')
"""Cast to 8-bit integer"""
_convert_to_int16 = _conversion(elemwise.Elemwise(scal.convert_to_int16), 'int16')
_convert_to_int16 = _conversion(
elemwise.Elemwise(scal.convert_to_int16), 'int16')
"""Cast to 16-bit integer"""
_convert_to_int32 = _conversion(elemwise.Elemwise(scal.convert_to_int32), 'int32')
_convert_to_int32 = _conversion(
elemwise.Elemwise(scal.convert_to_int32), 'int32')
"""Cast to 32-bit integer"""
_convert_to_int64 = _conversion(elemwise.Elemwise(scal.convert_to_int64), 'int64')
_convert_to_int64 = _conversion(
elemwise.Elemwise(scal.convert_to_int64), 'int64')
"""Cast to 64-bit integer"""
_convert_to_uint8 = _conversion(elemwise.Elemwise(scal.convert_to_uint8), 'uint8')
_convert_to_uint8 = _conversion(
elemwise.Elemwise(scal.convert_to_uint8), 'uint8')
"""Cast to unsigned 8-bit integer"""
_convert_to_uint16 = _conversion(elemwise.Elemwise(scal.convert_to_uint16), 'uint16')
_convert_to_uint16 = _conversion(
elemwise.Elemwise(scal.convert_to_uint16), 'uint16')
"""Cast to unsigned 16-bit integer"""
_convert_to_uint32 = _conversion(elemwise.Elemwise(scal.convert_to_uint32), 'uint32')
_convert_to_uint32 = _conversion(
elemwise.Elemwise(scal.convert_to_uint32), 'uint32')
"""Cast to unsigned 32-bit integer"""
_convert_to_uint64 = _conversion(elemwise.Elemwise(scal.convert_to_uint64), 'uint64')
_convert_to_uint64 = _conversion(
elemwise.Elemwise(scal.convert_to_uint64), 'uint64')
"""Cast to unsigned 64-bit integer"""
_convert_to_float32 = _conversion(elemwise.Elemwise(scal.convert_to_float32), 'float32')
_convert_to_float32 = _conversion(
elemwise.Elemwise(scal.convert_to_float32), 'float32')
"""Cast to single-precision floating point"""
_convert_to_float64 = _conversion(elemwise.Elemwise(scal.convert_to_float64), 'float64')
_convert_to_float64 = _conversion(
elemwise.Elemwise(scal.convert_to_float64), 'float64')
"""Cast to double-precision floating point"""
_convert_to_complex64 = _conversion(elemwise.Elemwise(scal.convert_to_complex64), 'complex64')
_convert_to_complex64 = _conversion(
elemwise.Elemwise(scal.convert_to_complex64), 'complex64')
"""Cast to single-precision complex"""
_convert_to_complex128 = _conversion(elemwise.Elemwise(scal.convert_to_complex128), 'complex128')
_convert_to_complex128 = _conversion(
elemwise.Elemwise(scal.convert_to_complex128), 'complex128')
"""Cast to double-precision complex"""
_cast_mapping = {
......@@ -1860,20 +1990,24 @@ _cast_mapping = {
'float64': _convert_to_float64,
'complex64': _convert_to_complex64,
'complex128': _convert_to_complex128}
@constructor
def cast(x, dtype):
"""Symbolically cast `x` to a Tensor of type `dtype`."""
if dtype=='floatX': dtype = config.floatX
if dtype == 'floatX':
dtype = config.floatX
_x = as_tensor_variable(x)
if _x.type.dtype == dtype:
return _x
if _x.type.dtype.startswith('complex') and not dtype.startswith('complex'):
raise TypeError('Casting from complex to real is ambiguous: consider real(), imag(), angle() or abs()')
raise TypeError((
'Casting from complex to real is ambiguous: consider real(), '
'imag(), angle() or abs()'))
return _cast_mapping[dtype](x)
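# Illustrative usage sketch for cast() (hypothetical dtypes):
import theano.tensor as T
i = T.ivector('i')
x = T.cast(i, 'float64')   # int32 -> float64
y = T.cast(x, 'floatX')    # 'floatX' resolves to config.floatX, as above
# Casting complex to real raises the TypeError above; use real(), imag(),
# angle() or abs_() instead.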
##########################
# Unary Operations
##########################
......@@ -1886,10 +2020,13 @@ class Shape(Op):
"""
def __hash__(self):
return hash(type(self))
def __eq__(self, other):
return type(self) == type(other)
def __str__(self):
return self.__class__.__name__
def make_node(self, x):
#Must work for all type that have a shape attribute.
#This will fail at execution time.
......@@ -1899,21 +2036,29 @@ class Shape(Op):
#the type to TensorVariable to have the optimization working
#correctly.
return Apply(self, [x], [lvector()])
def perform(self, node, inp, out_):
x, = inp
out, = out_
out[0] = theano._asarray(x.shape, dtype = 'int64')
out[0] = theano._asarray(x.shape, dtype='int64')
def grad(self, inp, grads):
return [None]
def R_op(self, inputs, eval_points):
return [None]
@constructor
def old_shape(a):
"""Return the shape tuple of a TensorType Variable, it may be either symbolic or nonsymbolic.
"""
Return the shape tuple of a TensorType Variable.
It may be either symbolic or nonsymbolic.
If the shape of the expression is not known at graph-construction time, then a symbolic
lvector will be returned, corresponding to the actual shape at graph-execution time.
If the shape of the expression is not known at graph-construction time,
then a symbolic lvector will be returned, corresponding to the actual
shape at graph-execution time.
"""
va = as_tensor_variable(a)
#print 'HERE', va, va.type
......@@ -1926,7 +2071,7 @@ def old_shape(a):
return va.type.shape
shape = Shape()
_shape = shape #was used in the past, now use shape directly.
_shape = shape # was used in the past, now use shape directly.
pprint.assign(_shape, printing.MemberPrinter('shape'))
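# Illustrative sketch (standard idiom, hypothetical shapes): the shape of a
# TensorType Variable is symbolic and evaluates to an int64 vector at run time.
import numpy
import theano
import theano.tensor as T
x = T.dmatrix('x')
f = theano.function([x], x.shape)
print f(numpy.zeros((2, 3)))     # -> [2 3]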
......@@ -1974,7 +2119,7 @@ class SpecifyShape(Op):
s = get_constant_value(node.inputs[1][dim])
s = as_tensor_variable(s)
new_shape.append(s)
except TypeError, e:
except TypeError:
new_shape.append(node.inputs[1][dim])
assert len(new_shape) == len(xshape)
......@@ -2185,16 +2330,25 @@ def argmin(x, axis=None):
@constructor
def smallest(*args):
"""Return the [elementwise] smallest of a variable number of arguments (like python's min)."""
"""
Return the [elementwise] smallest of a variable number of arguments.
Like python's min.
"""
if len(args) == 2:
a, b = args
return switch(a < b, a, b)
else:
return min(stack(*args), axis=0)
@constructor
def largest(*args):
"""Return the [elementwise] largest of a variable number of arguments (like python's max)."""
"""
Return the [elementwise] largest of a variable number of arguments.
Like python's max.
"""
if len(args) == 2:
a, b = args
return switch(a > b, a, b)
......@@ -2210,30 +2364,37 @@ def largest(*args):
def lt(a, b):
"""a < b"""
@_scal_elemwise_with_nfunc('greater', 2, 1)
def gt(a, b):
"""a > b"""
@_scal_elemwise_with_nfunc('less_equal', 2, 1)
def le(a, b):
"""a <= b"""
@_scal_elemwise_with_nfunc('greater_equal', 2, 1)
def ge(a, b):
"""a >= b"""
@_scal_elemwise_with_nfunc('equal', 2, 1)
def eq(a, b):
"""a == b"""
@_scal_elemwise_with_nfunc('not_equal', 2, 1)
def neq(a, b):
"""a != b"""
@_scal_elemwise_with_nfunc('isnan', 1, 1)
def isnan(a):
"""isnan(a)"""
@_scal_elemwise_with_nfunc('isinf', 1, 1)
def isinf(a):
"""isinf(a)"""
......@@ -2253,24 +2414,27 @@ def switch(cond, ift, iff):
##########################
@_scal_elemwise_with_nfunc('bitwise_and', 2, 1)
def and_(a,b):
def and_(a, b):
"""bitwise a & b"""
bitwise_and = and_ # numpy name for it
bitwise_and = and_ # numpy name for it
@_scal_elemwise_with_nfunc('bitwise_or', 2, 1)
def or_(a,b):
def or_(a, b):
"""bitwise a | b"""
bitwise_or = or_ # numpy name for it
bitwise_or = or_ # numpy name for it
@_scal_elemwise_with_nfunc('bitwise_xor', 2, 1)
def xor(a,b):
def xor(a, b):
"""bitwise a ^ b"""
bitwise_xor = xor # numpy name for it
bitwise_xor = xor # numpy name for it
@_scal_elemwise_with_nfunc('invert', 1, 1)
def invert(a):
"""bitwise ~a"""
bitwise_not = invert # numpy alias for it
bitwise_not = invert # numpy alias for it
##########################
......@@ -2288,50 +2452,64 @@ def abs_(a):
pprint.assign(abs_, printing.PatternPrinter(('|%(0)s|', -1000)))
@_scal_elemwise_with_nfunc('exp', 1, 1)
def exp(a):
"""e^`a`"""
@_scal_elemwise_with_nfunc('negative', 1, 1)
def neg(a):
"""-a"""
@_scal_elemwise # numpy.reciprocal does integer division on integer inputs (which is not very interesting)
# numpy.reciprocal does integer division on integer inputs
# (which is not very interesting)
@_scal_elemwise
def inv(a):
"""1.0/a"""
@_scal_elemwise_with_nfunc('log', 1, 1)
def log(a):
"""base e logarithm of a"""
@_scal_elemwise_with_nfunc('log2', 1, 1)
def log2(a):
"""base 2 logarithm of a"""
@_scal_elemwise_with_nfunc('log10', 1, 1)
def log10(a):
"""base 10 logarithm of a"""
@_scal_elemwise_with_nfunc('log1p', 1, 1)
def log1p(a):
"""log(1+a)"""
@_scal_elemwise_with_nfunc('sign', 1, 1)
def sgn(a):
"""sign of a"""
@_scal_elemwise_with_nfunc('ceil', 1, 1)
def ceil(a):
"""ceiling of a"""
@_scal_elemwise_with_nfunc('floor', 1, 1)
def floor(a):
"""floor of a"""
@constructor
def iround(a, mode="half_away_from_zero"):
"""cast(round(a,mode),'int64')"""
return cast(round(a,mode),'int64')
return cast(round(a, mode), 'int64')
@constructor
def round(a, mode="half_away_from_zero"):
......@@ -2341,80 +2519,99 @@ def round(a, mode="half_away_from_zero"):
elif mode == "half_to_even":
return round_half_to_even(a)
else:
raise Exception("round mode %s is not implemented."%mode)
raise Exception("round mode %s is not implemented." % mode)
@_scal_elemwise_with_nfunc('around', 1, -1)
def round_half_to_even(a):
"""round_half_to_even(a)"""
@_scal_elemwise
def round_half_away_from_zero(a):
"""round_half_away_from_zero(a)"""
@_scal_elemwise_with_nfunc('square', 1, 1)
def sqr(a):
"""square of a"""
@_scal_elemwise_with_nfunc('sqrt', 1, 1)
def sqrt(a):
"""square root of a"""
@_scal_elemwise_with_nfunc('cos', 1, 1)
def cos(a):
"""cosine of a"""
@_scal_elemwise_with_nfunc('arccos',1,1)
@_scal_elemwise_with_nfunc('arccos', 1, 1)
def arccos(a):
"""arccosine of a"""
@_scal_elemwise_with_nfunc('sin', 1, 1)
def sin(a):
"""sine of a"""
@_scal_elemwise_with_nfunc('tan', 1, 1)
def tan(a):
"""tangent of a"""
@_scal_elemwise_with_nfunc('cosh', 1, 1)
def cosh(a):
"""hyperbolic cosine of a"""
@_scal_elemwise_with_nfunc('sinh', 1, 1)
def sinh(a):
"""hyperbolic sine of a"""
@_scal_elemwise_with_nfunc('tanh', 1, 1)
def tanh(a):
"""hyperbolic tangent of a"""
@_scal_elemwise
def erf(a):
"""error function"""
@_scal_elemwise
def erfc(a):
"""complementary error function"""
@_scal_elemwise_with_nfunc('real', 1, -1)
def real(z):
"""Return real component of complex-valued tensor `z`"""
@_scal_elemwise_with_nfunc('imag', 1, -1)
def imag(z):
"""Return imaginary component of complex-valued tensor `z`"""
@_scal_elemwise_with_nfunc('angle', 1, -1)
def angle(z):
"""Return polar-coordinate angle of complex-valued tensor `z`"""
@_scal_elemwise # numpy.complex cannot build tensors
@_scal_elemwise # numpy.complex cannot build tensors
def complex(real, imag):
"""Return complex-valued tensor with `real` and `imag` components"""
@_scal_elemwise
def complex_from_polar(abs, angle):
"""Return complex-valued tensor from polar coordinate specification"""
##########################
# Misc
##########################
......@@ -2434,9 +2631,10 @@ def ones_like(model, dtype=None):
"""equivalent of numpy.ones_like"""
if dtype is None:
dtype = model.type.dtype
ret= fill(model, constant(1.0, dtype=dtype))
ret = fill(model, constant(1.0, dtype=dtype))
return ret
@constructor
def zeros_like(model, dtype=None):
"""equivalent of numpy.zeros_like"""
......@@ -2444,6 +2642,7 @@ def zeros_like(model, dtype=None):
dtype = model.type.dtype
return fill(model, constant(0.0, dtype=dtype))
def zeros(shape, dtype=config.floatX):
"""
Create a Tensor filled with zeros, closer to Numpy's syntax than ``alloc``.
......@@ -2458,39 +2657,41 @@ def ones(shape, dtype=config.floatX):
return alloc(numpy.array(1, dtype=dtype), *shape)
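# Illustrative sketch (hypothetical shapes): zeros()/ones() wrap alloc()
# with a numpy-like call signature.
import theano
import theano.tensor as T
f = theano.function([], [T.zeros((2, 3)), T.ones((2, 3), dtype='int64')])
z, o = f()
# z is a (2, 3) floatX array of 0s; o is a (2, 3) int64 array of 1s.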
class Eye(gof.Op):
def __init__(self, dtype=config.floatX):
self.dtype = dtype
def make_node(self,n,m,k):
def make_node(self, n, m, k):
n = as_tensor_variable(n)
m = as_tensor_variable(m)
k = as_tensor_variable(k)
return gof.Apply(self, [n,m,k], [TensorType(dtype = self.dtype, broadcastable = (False,False))()])
return gof.Apply(self, [n, m, k],
[TensorType(dtype=self.dtype, broadcastable=(False, False))()])
def perform(self, node, inp, out_):
n, m, k = inp
out, = out_
out[0] = numpy.eye(n,m,k,dtype=self.dtype)
out[0] = numpy.eye(n, m, k, dtype=self.dtype)
def grad(self, inp, grads):
return [None, None, None]
def __eq__(self,other):
def __eq__(self, other):
return type(self) == type(other) and self.dtype == other.dtype
def __hash__(self):
return hash(self.dtype) ^ hash(type(self))
def eye(n, m=None, k = 0, dtype = config.floatX):
def eye(n, m=None, k=0, dtype=config.floatX):
if m == None:
m = n
localop = Eye(dtype)
return localop(n,m,k)
return localop(n, m, k)
def identity_like(x):
return eye(x.shape[0], x.shape[1], k=0, dtype = x.dtype)
return eye(x.shape[0], x.shape[1], k=0, dtype=x.dtype)
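# Illustrative usage sketch for eye() and identity_like() (hypothetical sizes):
import theano
import theano.tensor as T
f = theano.function([], T.eye(3, 4, k=1, dtype='float32'))
print f()     # 3x4 float32 matrix with ones on the first superdiagonal
m = T.dmatrix('m')
g = theano.function([m], T.identity_like(m))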
if 0:
## COMMENTED OUT FEB 17 2010
......@@ -2552,20 +2753,22 @@ if 0:
pprint.assign(lambda pstate, r: r.owner and isinstance(r.owner.op, Filler) and r.owner.op.value == 0, printing.FunctionPrinter('zeros'))
pprint.assign(lambda pstate, r: r.owner and isinstance(r.owner.op, Filler) and r.owner.op.value == 1, printing.FunctionPrinter('ones'))
class Alloc(gof.Op):
"""Create a Tensor from an initial value and a desired shape
alloc(value, shape0, shape1, ..., shapeN)
Returns an N-dimensional tensor initialized by `value` using something equivalent to
Returns an N-dimensional tensor initialized by `value` using something
equivalent to
>>> z = numpy.zeros(shape, value.dtype)
>>> z += value
The result has N dimensions, has the dtype of `value` and is obtained by broadcasting value
over the output ndarray.
The result has N dimensions, has the dtype of `value` and is obtained by
broadcasting value over the output ndarray.
This Op is used to replace fill() during optimizations because after shapes are lifted,
the first argument to fill can often be pruned from the graph.
This Op is used to replace fill() during optimizations because after shapes
are lifted, the first argument to fill can often be pruned from the graph.
"""
def __init__(self):
pass
......@@ -2599,7 +2802,7 @@ class Alloc(gof.Op):
const_shp = None
bcast.append(numpy.all(1 == const_shp))
otype = TensorType(dtype=v.dtype, broadcastable=bcast)
return gof.Apply(self, [v]+sh, [otype()])
return gof.Apply(self, ([v] + sh), [otype()])
def perform(self, node, inputs, out_):
out, = out_
......@@ -2610,10 +2813,10 @@ class Alloc(gof.Op):
out[0] = numpy.zeros(sh, dtype=v.dtype)
else:
out[0] = numpy.empty(sh, dtype=v.dtype)
out[0][...] = v # broadcast v to fill us up
out[0][...] = v # broadcast v to fill us up
else:
#reuse the allocated memory.
out[0][...] = v # broadcast v to fill us up
out[0][...] = v # broadcast v to fill us up
def c_code(self, node, name, inp, out, sub):
# TODO: use the elemwise code generator here
......@@ -2647,6 +2850,7 @@ class Alloc(gof.Op):
zz[i] = vv;
}
""" % locals()
# else pretend this never happened
return super(Alloc, self).c_code(node, name, inp, out, sub)
......@@ -2665,10 +2869,11 @@ class Alloc(gof.Op):
If the alloc would be useless, this function returns val.
If you always want an Alloc node, call make_node.
"""
ret = super(Alloc,self).__call__(val, *shapes)
ret = super(Alloc, self).__call__(val, *shapes)
try:
#It makes optimization difficult when useless allocs are thrown into the graph at every
#stage of optimization. This little logic tries to help at least in some cases.
# It makes optimization difficult when useless allocs are thrown
# into the graph at every stage of optimization. This little logic
# tries to help at least in some cases.
if val.type == ret.type:
return val
except AttributeError:
......@@ -2729,9 +2934,11 @@ def prod(input, axis=None, dtype=None):
"""
return elemwise.Prod(axis, dtype=dtype)(input)
class Mean(elemwise.CAReduce):
def __init__(self, axis = None):
def __init__(self, axis=None):
elemwise.CAReduce.__init__(self, scal.add, axis)
def __str__(self):
if self.axis is not None:
return "Mean{%s}" % (", ".join(str(x) for x in self.axis))
......@@ -2745,22 +2952,24 @@ class Mean(elemwise.CAReduce):
def perform(self, node, inp, out):
input, = inp
output, = out
output[0]=numpy.mean(input,axis=self.axis)
output[0] = numpy.mean(input, axis=self.axis)
def c_code(self, node, name, inames, onames, sub):
if self.axis!=None:
if self.axis != None:
return super(Op, self).c_code(node, name, inames, onames, sub)
ret = elemwise.CAReduce.c_code(self, node, name, inames, onames, sub)
#TODO: c_code perform support only axis==None
return ret + """
*((double *)PyArray_DATA(%s)) /= PyArray_SIZE(%s);
"""%(onames[0],inames[0])
""" % (onames[0], inames[0])
#TODO: implement the grad. When done and tested, you can make this the default version.
#TODO: implement the grad. When done and tested, you can make this the default
# version.
# def grad(self, (x,), (gout,)):
# import pdb;pdb.set_trace()
# return grad(mean(x, self.axis, op=False),[x])
@constructor
def mean(input, axis=None, dtype=None, op=False):
"""Compute the mean value along the given axis of a tensor `input`
......@@ -2817,8 +3026,9 @@ def mean(input, axis=None, dtype=None, op=False):
return s
@constructor
def var(input, axis = None):
def var(input, axis=None):
"""Compute the variance along the given axis of a tensor `input`.
:param axis: Compute the variance along this axis of the tensor.
......@@ -2854,7 +3064,8 @@ def var(input, axis = None):
centered_input = input - mean_input
#return the mean sqr
return mean(centered_input**2, axis)
return mean((centered_input ** 2), axis)
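# Quick numpy check of the "mean of squared deviations" formula used above
# (illustrative, not part of this commit):
import numpy
_sample = numpy.array([1., 2., 3., 4.])
assert numpy.allclose(((_sample - _sample.mean()) ** 2).mean(), _sample.var())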
@constructor
def std(input, axis=None):
......@@ -2901,6 +3112,7 @@ if 0:
repeat = Repeat()
class Default(gof.Op):
"""
Takes an input x and a default value. If the input is not None, a
......@@ -2909,39 +3121,45 @@ class Default(gof.Op):
have exactly the same type.
"""
view_map = {0: [0]}
def make_node(self, x, default):
x, default = as_tensor_variable(x), as_tensor_variable(default)
if x.type != default.type:
raise TypeError('Both default() arguments must have same type', x, default)
raise TypeError('Both default() arguments must have same type',
x, default)
return gof.Apply(self, [x, default], [default.type()])
def perform(self, node, inp, out_):
x, default = inp
out, = out_
if x is None:
# why copy? Theano can't yet understand out[0] being a view of either x or y,
# so we can be a view of x, but only a copy of y.
# why copy? Theano can't yet understand out[0] being a view of
# either x or y, so we can be a view of x, but only a copy of y.
out[0] = default.copy()
else:
out[0] = x
default = Default()
setdefault = default # legacy
setdefault = default # legacy
##########################
# Arithmetics
##########################
@_scal_elemwise_with_nfunc('maximum', 2, 1)
def maximum(x,y):
def maximum(x, y):
"""elemwise maximum. See max for the maximum in one tensor
"""
# see decorator for function body
@_scal_elemwise_with_nfunc('minimum', 2, 1)
def minimum(x,y):
def minimum(x, y):
"""elemwise minimum. See min for the minimum in one tensor
"""
# see decorator for function body
def div_proxy(x, y):
"""Proxy for either true_div or int_div, depending on types of x, y."""
f = eval('%s_div' % scal.int_or_true_div(
......@@ -2949,32 +3167,39 @@ def div_proxy(x, y):
as_tensor_variable(y).dtype in discrete_dtypes))
return f(x, y)
@_scal_elemwise_with_nfunc('add', 2, 1)
def add(a, *other_terms):
"""elementwise addition"""
# see decorator for function body
@_scal_elemwise_with_nfunc('subtract', 2, 1)
def sub(a, b):
"""elementwise subtraction"""
# see decorator for function body
@_scal_elemwise_with_nfunc('multiply', 2, 1)
def mul(a, *other_terms):
"""elementwise multiplication"""
# see decorator for function body
@_scal_elemwise_with_nfunc('true_divide', 2, 1)
def true_div(a, b):
"""elementwise [true] division (inverse of multiplication)"""
# see decorator for function body
@_scal_elemwise_with_nfunc('floor_divide', 2, 1)
def floor_div(a, b):
"""elementwise [floor] division (inverse of multiplication)"""
# see decorator for function body
@_scal_elemwise_with_nfunc('floor_divide', 2, 1) # not a c/p error, floor_div and int_div are the same thing
# not a c/p error, floor_div and int_div are the same thing
@_scal_elemwise_with_nfunc('floor_divide', 2, 1)
def int_div(a, b):
"""elementwise integer-division"""
# see decorator for function body
......@@ -3009,19 +3234,22 @@ def mod_check(x, y):
else:
return mod(x, y)
@_scal_elemwise_with_nfunc('mod', 2, 1)
def mod(a, b):
"""elementwise modulo"""
# see decorator for function body
@_scal_elemwise_with_nfunc('power', 2, 1)
def pow(a, b):
"""elementwise power"""
# see decorator for function body
# numpy.clip does not work correctly when
# the min is bigger than the max
@_scal_elemwise #_with_nfunc('clip', 3, 1)
@_scal_elemwise # _with_nfunc('clip', 3, 1)
def clip(x, min, max):
"""clip x to be between min and max"""
# see decorator for function body
......@@ -3036,7 +3264,6 @@ pprint.assign(int_div, printing.OperatorPrinter('//', -1, 'left'))
pprint.assign(pow, printing.OperatorPrinter('**', 1, 'right'))
##########################
# View Operations
##########################
......@@ -3045,9 +3272,6 @@ pprint.assign(pow, printing.OperatorPrinter('**', 1, 'right'))
# Helpful functions to deal with Subtensor and IncSubtensor
##########
def get_idx_list(inputs, idx_list):
'''
Given a list of inputs to the subtensor and its idx_list reorders
......@@ -3105,53 +3329,52 @@ def get_canonical_form_slice(theslice, length):
resulting set of numbers needs to be reversed or not.
'''
if isinstance(theslice,slice):
if isinstance(theslice, slice):
start = extract_constant(theslice.start)
stop = extract_constant(theslice.stop)
step = extract_constant(theslice.step)
stop = extract_constant(theslice.stop)
step = extract_constant(theslice.step)
if step is None:
step = 1
defstart = switch(lt(step,0), length-1, 0)
defstop = switch(lt(step,0), -1, length )
defstart = switch(lt(step, 0), (length - 1), 0)
defstop = switch(lt(step, 0), -1, length)
if start is None:
start = defstart
else:
start = switch(lt(start,0), start + length, start)
start = switch(lt(start,0), switch(lt(step,0), -1, 0), start)
start = switch(ge(start,length)
, switch(lt(step,0),length-1,length)
, start)
start = switch(lt(start, 0), start + length, start)
start = switch(lt(start, 0), switch(lt(step, 0), -1, 0), start)
start = switch(ge(start, length),
switch(lt(step, 0), (length - 1), length),
start)
if stop in [None, maxsize]:
# The special "maxsize" case is probably not needed here,
# as slices containing maxsize are not generated by
# __getslice__ anymore.
stop = defstop
else:
stop = switch(lt(stop,0), stop + length, stop)
stop = switch(lt(stop,0), -1, stop)
stop = switch(ge(stop,length), length,stop)
nw_stop = switch(lt(step,0), start+1, stop )
slice_len = ( start -stop - 1)//abs(step) + 1
slice_len = switch(lt(slice_len,0), 0, slice_len)
neg_start = nw_stop - (slice_len-1)*abs(step)-1
neg_start = switch(lt(neg_start,0), nw_stop-1, neg_start)
nw_start = switch(lt(step,0), neg_start, start)
nw_start = switch(lt(nw_start,0), 0, nw_start)
nw_stop = switch(lt(nw_stop,0) , 0, nw_stop )
nw_step = abs(step)
stop = switch(lt(stop, 0), stop + length, stop)
stop = switch(lt(stop, 0), -1, stop)
stop = switch(ge(stop, length), length, stop)
nw_stop = switch(lt(step, 0), (start + 1), stop)
slice_len = (start - stop - 1) // abs(step) + 1
slice_len = switch(lt(slice_len, 0), 0, slice_len)
neg_start = nw_stop - (slice_len - 1) * abs(step) - 1
neg_start = switch(lt(neg_start, 0), (nw_stop - 1), neg_start)
nw_start = switch(lt(step, 0), neg_start, start)
nw_start = switch(lt(nw_start, 0), 0, nw_start)
nw_stop = switch(lt(nw_stop, 0), 0, nw_stop)
nw_step = abs(step)
if step != 1:
reverse = sgn(step)
reverse = sgn(step)
return slice(nw_start, nw_stop, nw_step), reverse
else:
return slice(nw_start, nw_stop, nw_step), 1
else:
value = extract_constant(theslice)
value = switch(lt(value,0), value+length, value)
value = switch(lt(value, 0), (value + length), value)
return value, 1
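# For constant slices, the clamping above mirrors Python's built-in
# slice.indices (illustrative, not part of this commit); the symbolic version
# additionally rewrites a negative step into a positive-step slice plus a
# `reverse` flag.
assert slice(None, None, -2).indices(10) == (9, -1, -2)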
......@@ -3165,7 +3388,7 @@ def transpose(x, axes=None):
"""
if axes is None:
axes = range(x.ndim-1, -1, -1)
axes = range((x.ndim - 1), -1, -1)
return DimShuffle(x.broadcastable, axes, inplace=False)(x)
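# Illustrative numpy analogue of the default above (reverse all axes):
import numpy
assert numpy.ones((2, 3, 4)).transpose(list(range(2, -1, -1))).shape == (4, 3, 2)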
......@@ -3175,7 +3398,7 @@ class AdvancedIndexingError(TypeError):
"""
def __init__(self, *args):
TypeError.__init__( self, *args)
TypeError.__init__(self, *args)
class Subtensor(Op):
......@@ -3185,8 +3408,8 @@ class Subtensor(Op):
to remember how the input tensor x should be sliced. The instance variable
idx_list is a list whose elements are either integers, or slices. The
integers are indexes into the inputs array, and the start/stop/step members
of each slice are also integer indexes into the inputs array (or None). The
inputs array is the tensor x, followed by scalar integer variables.
of each slice are also integer indexes into the inputs array (or None).
The inputs array is the tensor x, followed by scalar integer variables.
@todo: add support for advanced tensor indexing (in Subtensor_dx too).
......@@ -3197,7 +3420,7 @@ class Subtensor(Op):
additionally be a Scalar instance, and slice components can also be Scalar
instances too.
"""
e_invalid = ( 'The index list is longer (size %d) than the number of '
e_invalid = ('The index list is longer (size %d) than the number of '
'dimensions of the tensor (namely %d). You are asking for '
'a dimension of the tensor that does not exist! You might '
'need to use dimshuffle to add extra dimension to your '
......@@ -3211,33 +3434,42 @@ class Subtensor(Op):
@staticmethod
def collapse(idxs, cond):
ret = []
def helper(entry):
if cond(entry):
ret.append(entry)
elif isinstance(entry, slice):
helper(entry.start)
helper(entry.stop)
helper( entry.step)
helper(entry.step)
for idx in idxs:
helper(idx)
return ret
@staticmethod
def convert(entry, slice_ok=True):
invalid_scal_types = [scal.float64, scal.float32 ]
invalid_scal_types = [scal.float64, scal.float32]
scal_types = [scal.int64, scal.int32, scal.int16, scal.int8]
tensor_types = [lscalar, iscalar, wscalar, bscalar]
invalid_tensor_types = [fscalar, dscalar, cscalar, zscalar ]
if isinstance(entry, gof.Variable) and (entry.type in invalid_scal_types \
or entry.type in invalid_tensor_types):
invalid_tensor_types = [fscalar, dscalar, cscalar, zscalar]
if (isinstance(entry, gof.Variable)
and (entry.type in invalid_scal_types
or entry.type in invalid_tensor_types)):
raise TypeError("Expected an integer")
if isinstance(entry, gof.Variable) and entry.type in scal_types:
return entry.type
elif isinstance(entry, gof.Type) and entry in scal_types:
return entry
if isinstance(entry, gof.Variable) and entry.type in tensor_types and numpy.all(entry.type.broadcastable):
if (isinstance(entry, gof.Variable)
and entry.type in tensor_types
and numpy.all(entry.type.broadcastable)):
return scal.Scalar(entry.type.dtype)
elif isinstance(entry, gof.Type) and entry in tensor_types and numpy.all(entry.broadcastable):
elif (isinstance(entry, gof.Type)
and entry in tensor_types
and numpy.all(entry.broadcastable)):
return scal.Scalar(entry.dtype)
elif slice_ok and isinstance(entry, slice):
a = entry.start
......@@ -3283,15 +3515,14 @@ class Subtensor(Op):
else:
return scal.as_scalar(a)
def make_node(self, x, *inputs):
x = as_tensor_variable(x)
inputs = tuple(self.my_as_scalar(a) for a in inputs)
idx_list = list(self.idx_list)
if len(idx_list) > x.type.ndim:
exception = ValueError(Subtensor.e_invalid%(len(idx_list),
x.type.ndim))
exception = ValueError(Subtensor.e_invalid % (
len(idx_list), x.type.ndim))
exception.subtensor_invalid = True
raise exception
......@@ -3310,13 +3541,13 @@ class Subtensor(Op):
for input, expected_type in zip(inputs, input_types):
if input.type != expected_type:
raise TypeError(
"Wrong type for Subtensor template. Expected %s, got %s."%(
input.type, expected_type))
"Wrong type for Subtensor template. Expected %s, got %s."
% (input.type, expected_type))
return gof.Apply(self,
(x, ) + inputs,
[tensor(dtype = x.type.dtype,
broadcastable = broadcastable)])
[tensor(dtype=x.type.dtype,
broadcastable=broadcastable)])
def perform(self, node, inputs, out_):
out, = out_
......@@ -3342,21 +3573,22 @@ class Subtensor(Op):
assert len(xshp) == node.inputs[0].ndim
outshp = []
actual_idx_list = list(get_idx_list(node.inputs, self.idx_list))
padded = ( actual_idx_list +
[slice(None, None, None)]*(len(xshp)-len(self.idx_list)))
padded = (actual_idx_list +
[slice(None, None, None)] * (len(xshp) - len(self.idx_list)))
i = 0
for idx, xl in izip(padded, xshp):
if isinstance(idx, slice):
# If it is the default (None, None, None) slice, or a variant,
# the shape will be xl
if ( (idx.start in [None, 0])
if ((idx.start in [None, 0])
and (idx.stop in [None, maxsize])
and (idx.step is None or idx.step == 1) ):
and (idx.step is None or idx.step == 1)):
outshp.append(xl)
else:
cnf = get_canonical_form_slice(idx, xl)
length = (cnf[0].stop - cnf[0].start -1) // cnf[0].step + 1
length = switch(lt(length,0), 0, length)
length = ((cnf[0].stop - cnf[0].start - 1) // cnf[0].step
+ 1)
length = switch(lt(length, 0), 0, length)
outshp.append(length)
i += 1
else:
......@@ -3370,7 +3602,8 @@ class Subtensor(Op):
gz, = grads
x = inputs[0]
rest = inputs[1:]
return [IncSubtensor(self.idx_list)(zeros_like(x), gz, *rest)] + [None] * len(rest)
return ([IncSubtensor(self.idx_list)(zeros_like(x), gz, *rest)]
+ [None] * len(rest))
def __eq__(self, other):
return type(self) == type(other) and self.idx_list == other.idx_list
......@@ -3401,6 +3634,7 @@ class Subtensor(Op):
else:
msg.append(str(x))
return ":".join(msg)
def __str__(self):
indices = []
for entry in self.idx_list:
......@@ -3420,44 +3654,53 @@ class Subtensor(Op):
# subtensor_spec: len = n_ints + 3 * n_slices
#
fail = sub['fail']
init_cmds = [] # initialization for subtensor_spec
init_cmds = [] # initialization for subtensor_spec
is_slice = []
#TODO: change that, it might lead to unexpected results,
# see assembla-#767
NONE_CODE = maxsize - 1
pos = [0,1] #annoying version of global variable for init_entry
def inc_spec_pos(amt): pos[0] += amt
def inc_input_pos(amt): pos[1] += amt
def spec_pos(): return pos[0]
def input_pos(): return pos[1]
pos = [0, 1] # annoying version of global variable for init_entry
def inc_spec_pos(amt):
pos[0] += amt
def inc_input_pos(amt):
pos[1] += amt
def spec_pos():
return pos[0]
def input_pos():
return pos[1]
def init_entry(entry, depth=0):
if isinstance(entry, int):
init_cmds.append(
"subtensor_spec[%i] = %i;" %(spec_pos(),
"subtensor_spec[%i] = %i;" % (spec_pos(),
entry))
inc_spec_pos(1)
if depth==0:
if depth == 0:
is_slice.append(0)
elif isinstance(entry, Type):
init_cmds.append(
"subtensor_spec[%i] = %s;" %(spec_pos(),
"subtensor_spec[%i] = %s;" % (spec_pos(),
inputs[input_pos()]))
inc_spec_pos(1)
inc_input_pos(1)
if depth==0:
if depth == 0:
is_slice.append(0)
elif entry is None:
init_cmds.append(
"subtensor_spec[%i] = %i;" %(spec_pos(),
"subtensor_spec[%i] = %i;" % (spec_pos(),
NONE_CODE))
inc_spec_pos(1)
if depth==0:
if depth == 0:
is_slice.append(0)
elif depth==0 and isinstance(entry, slice):
init_entry(entry.start, depth+1)
init_entry(entry.stop, depth+1)
init_entry(entry.step, depth+1)
elif depth == 0 and isinstance(entry, slice):
init_entry(entry.start, depth + 1)
init_entry(entry.stop, depth + 1)
init_entry(entry.step, depth + 1)
is_slice.append(1)
else:
assert 0, entry
......@@ -3469,7 +3712,7 @@ class Subtensor(Op):
assert len(is_slice) <= node.inputs[0].ndim, node.inputs[0].ndim
len_is_slice = len(is_slice)
view_ndim = node.inputs[0].ndim - (numpy.asarray(is_slice)==0).sum()
view_ndim = node.inputs[0].ndim - (numpy.asarray(is_slice) == 0).sum()
len_subtensor_spec = spec_pos()
......@@ -3635,7 +3878,7 @@ class Subtensor(Op):
outer_ii += 1;
}
PyArray_UpdateFlags(xview, NPY_C_CONTIGUOUS|NPY_F_CONTIGUOUS);
"""% locals()
""" % locals()
#print rval
return rval
......@@ -3643,7 +3886,7 @@ class Subtensor(Op):
def helper_c_code_cache_version():
return (4,)
def c_code(self, node, name, inputs, outputs, sub): #DEBUG
def c_code(self, node, name, inputs, outputs, sub): # DEBUG
part0 = self.helper_c_code(node, name, inputs, outputs, sub,
self.idx_list)
......@@ -3655,11 +3898,10 @@ class Subtensor(Op):
xview->base = py_%(x)s;
assert(py_%(x)s == (PyObject*)%(x)s);
%(z)s = xview;
""" %locals()
""" % locals()
return part0 + part1
def c_code_cache_version(self):
hv = self.helper_c_code_cache_version()
# If `helper_c_code_cache_version` is not versioned we do not want to
......@@ -3676,6 +3918,7 @@ class Subtensor(Op):
return [None]
return self.make_node(eval_points[0], *inputs[1:]).outputs
class SubtensorPrinter:
def process(self, r, pstate):
......@@ -3686,34 +3929,39 @@ class SubtensorPrinter:
inputs = list(r.owner.inputs)
input = inputs.pop()
sidxs = []
inbrack_pstate = pstate.clone(precedence = -1000)
inbrack_pstate = pstate.clone(precedence=-1000)
for entry in idxs:
if isinstance(entry, int):
sidxs.append(str(entry))
elif isinstance(entry, scal.Scalar):
sidxs.append(inbrack_pstate.pprinter.process(inputs.pop()))
elif isinstance(entry, slice):
if entry.start is None or entry.start==0:
if entry.start is None or entry.start == 0:
msg1 = ""
else:
msg1 = entry.start
msg1 = entry.start
if entry.stop is None or entry.stop == maxsize:
msg2 = ""
else:
msg2 = entry.stop
msg2 = entry.stop
if entry.step is None:
msg3 = ""
else:
msg3 = ":%s" % entry.step
msg3 = ":%s" % entry.step
sidxs.append("%s:%s%s" % (msg1, msg2, msg3))
return "%s[%s]" % (pstate.pprinter.process(input, pstate.clone(precedence = 1000)), ", ".join(sidxs))
sidxs.append("%s:%s%s" % (msg1, msg2, msg3))
return "%s[%s]" % (pstate.pprinter.process(
input,
pstate.clone(precedence=1000)),
", ".join(sidxs))
else:
raise TypeError("Can only print Subtensor.")
pprint.assign(lambda pstate, r: r.owner and isinstance(r.owner.op, Subtensor), SubtensorPrinter())
pprint.assign(lambda pstate, r: r.owner and isinstance(r.owner.op, Subtensor),
SubtensorPrinter())
def set_subtensor(x, y, inplace=False,
tolerate_inplace_aliasing=False):
......@@ -3730,6 +3978,7 @@ def set_subtensor(x, y, inplace=False,
return inc_subtensor(x, y, inplace, set_instead_of_inc=True,
tolerate_inplace_aliasing=tolerate_inplace_aliasing)
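# A numpy-only sketch (illustrative, not this module's API) of the functional
# semantics: the result is a new array with the selected region overwritten,
# while the original array is left untouched.
import numpy
_x = numpy.zeros(5)
_out = _x.copy()
_out[1:3] = [7., 8.]
assert (_x == 0).all() and (_out == numpy.array([0., 7., 8., 0., 0.])).all()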
def inc_subtensor(x, y, inplace=False, set_instead_of_inc=False,
tolerate_inplace_aliasing=False):
"""Return x with the given subtensor incremented by y.
......@@ -3753,7 +4002,8 @@ def inc_subtensor(x, y, inplace=False, set_instead_of_inc=False,
else:
destroyhandler_tolerate_aliased = []
the_op = IncSubtensor(x.owner.op.idx_list, inplace, set_instead_of_inc,
destroyhandler_tolerate_aliased=destroyhandler_tolerate_aliased)
destroyhandler_tolerate_aliased=destroyhandler_tolerate_aliased
)
real_x = x.owner.inputs[0]
real_idxargs = x.owner.inputs[1:]
return the_op(real_x, y, *real_idxargs)
......@@ -3790,7 +4040,8 @@ class IncSubtensor(Op):
self.inplace = inplace
if inplace:
self.destroy_map = {0: [0]}
self.destroyhandler_tolerate_aliased = list(destroyhandler_tolerate_aliased)
self.destroyhandler_tolerate_aliased = list(
destroyhandler_tolerate_aliased)
self.set_instead_of_inc = set_instead_of_inc
def __eq__(self, other):
......@@ -3843,19 +4094,13 @@ class IncSubtensor(Op):
idx_list = list(self.idx_list)
if len(idx_list) > x.type.ndim:
exception = ValueError(
Subtensor.e_invalid%(
Subtensor.e_invalid % (
len(idx_list),
x.type.ndim))
exception.subtensor_invalid = True
raise exception
#infer the broadcasting pattern
padded = (idx_list
+ [slice(None, None, None)] * (x.type.ndim - len(idx_list)))
broadcastable = [bc for p, bc in zip(padded, x.type.broadcastable)
if isinstance(p, slice)]
input_types = Subtensor.collapse( idx_list,
input_types = Subtensor.collapse(idx_list,
lambda entry: isinstance(entry, gof.Type))
if len(inputs) != len(input_types):
raise IndexError(
......@@ -3864,8 +4109,8 @@ class IncSubtensor(Op):
for input, expected_type in zip(inputs, input_types):
if input.type != expected_type:
raise TypeError(
"Wrong type for Subtensor template. Expected %s, got %s."%(
input.type, expected_type))
"Wrong type for Subtensor template. Expected %s, got %s."
% (input.type, expected_type))
return gof.Apply(self,
(x, y) + inputs,
......@@ -3907,16 +4152,16 @@ class IncSubtensor(Op):
x.__setitem__(cdata, y)
out[0] = x
def c_code(self, node, name, inputs, outputs, sub): #DEBUG
def c_code(self, node, name, inputs, outputs, sub): # DEBUG
if self.inplace: # convert bool to int
if self.inplace: # convert bool to int
inplace = 1
else:
inplace = 0
x = inputs[0]
y = inputs[1]
z, = outputs
if self.set_instead_of_inc: # convert bool to int
if self.set_instead_of_inc: # convert bool to int
op_is_set = 1
else:
op_is_set = 0
......@@ -3941,10 +4186,9 @@ class IncSubtensor(Op):
# make xview actually a view of %(z)s
get_xview = Subtensor.helper_c_code(node, name,
outputs[:1]+inputs[2:],
outputs[:1] + inputs[2:],
outputs, sub, self.idx_list)
make_modification = """
if (%(op_is_set)s)
{
......@@ -3970,7 +4214,7 @@ class IncSubtensor(Op):
%(fail)s;
}
}
""" %locals()
""" % locals()
return (copy_input_if_necessary
+ get_xview
......@@ -4295,7 +4539,6 @@ class Join(Op):
def _make_node_internal(self, axis, tensors,
as_tensor_variable_args, output_maker):
orig = as_tensor_variable_args
if not python_all(targs.type.ndim for targs
in as_tensor_variable_args):
raise TypeError('Join cannot handle arguments of dimension 0.'
......@@ -4340,7 +4583,7 @@ class Join(Op):
bcastable[current_axis] = True
try:
bcastable[axis] = False
except IndexError, e:
except IndexError:
raise ValueError('Join argument "axis" is out of range'
' (given input dimensions)')
as_tensor_variable_args = [unbroadcast(x, axis)
......@@ -4699,7 +4942,6 @@ if 0:
x, y = inp
gz, = grads
xs = shape(x)
ys = shape(y)
return gz[:xs[0]], gz[xs[0]:]
vertical_stack = VerticalStack()
......@@ -4765,7 +5007,7 @@ class Reshape(Op):
', should be %i' % (len(shp), self.ndim), shp)
try:
out[0] = numpy.reshape(x, shp)
except Exception, e:
except Exception:
raise ValueError('Cannot reshape input of shape %s to shape %s' %
(x.shape, shp))
......
......@@ -88,7 +88,7 @@ class DimShuffle(Op):
Adding, subtracting dimensions can be done with reshape.
"""
def __init__(self, input_broadcastable, new_order, inplace = False):
def __init__(self, input_broadcastable, new_order, inplace=False):
"""
Usage: DimShuffle(input_broadcastable, new_order, inplace = False)
......@@ -115,33 +115,41 @@ class DimShuffle(Op):
self.new_order = new_order
self.inplace = inplace
for i in xrange(len(new_order)-1):
for i in xrange(len(new_order) - 1):
j = new_order[i]
if j != 'x' and j in new_order[i+1:]:
raise ValueError("The same input dimension may not appear twice in the list of output dimensions", (new_order))
if j != 'x' and j in new_order[(i + 1):]:
raise ValueError((
"The same input dimension may not appear twice in the "
"list of output dimensions", (new_order)))
# list of dimensions of the input to drop
self.drop = []
i2j = {} # this maps i before dropping dimensions to j after dropping dimensions so self.shuffle can be set properly later on
# this maps i before dropping dimensions to j after dropping dimensions
# so self.shuffle can be set properly later on
i2j = {}
j = 0
for i, b in enumerate(input_broadcastable):
if i not in new_order:
# we want to drop this dimension because it's not a value in new_order
if b == 1: # 1 aka True
# we want to drop this dimension because it's not a value in
# new_order
if b == 1: # 1 aka True
self.drop.append(i)
else:
# we cannot drop non-broadcastable dimensions
raise ValueError("You cannot drop a non-broadcastable dimension.", (input_broadcastable, new_order))
raise ValueError(
"You cannot drop a non-broadcastable dimension.",
(input_broadcastable, new_order))
else:
i2j[i] = j
j += 1
# transposition of non-broadcastable dimensions
# This is how the dimensions will be permuted, without accounting for the extra
# 'x' broadcastable dimensions to insert.
# This is how the dimensions will be permuted, without accounting for
# the extra 'x' broadcastable dimensions to insert.
self.shuffle = [i2j[x] for x in new_order if x != 'x']
# list of dimensions of the output that are broadcastable and were not in the original input
# list of dimensions of the output that are broadcastable and were not
# in the original input
self.augment = [i for i, x in enumerate(new_order) if x == 'x']
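# Worked example (illustrative): with input_broadcastable=(False, True, False)
# and new_order=(2, 'x', 0), dimension 1 is broadcastable and absent from
# new_order, so drop=[1]; after dropping, i2j={0: 0, 2: 1}, hence
# shuffle=[1, 0] (swap the two remaining dimensions) and augment=[1]
# (insert one new broadcastable dimension at output position 1).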
if self.inplace:
......@@ -162,7 +170,10 @@ class DimShuffle(Op):
input = as_tensor_variable(_input)
ib = tuple(input.type.broadcastable)
if not ib == self.input_broadcastable:
raise TypeError("The number of dimensions and/or broadcastable pattern of the input is incorrect for this op. Expected %s, got %s." % (self.input_broadcastable, ib))
raise TypeError((
"The number of dimensions and/or broadcastable pattern of the "
"input is incorrect for this op. Expected %s, got %s."
% (self.input_broadcastable, ib)))
ob = []
for value in self.new_order:
if value == 'x':
......@@ -170,8 +181,8 @@ class DimShuffle(Op):
else:
ob.append(ib[value])
output = TensorType(dtype = input.type.dtype,
broadcastable = ob).make_variable()
output = TensorType(dtype=input.type.dtype,
broadcastable=ob).make_variable()
return Apply(self, [input], [output])
......@@ -183,15 +194,20 @@ class DimShuffle(Op):
and self.input_broadcastable == other.input_broadcastable
def _rehash(self):
self._hashval = hash(type(self).__name__) ^ hash(type(self).__module__) ^ hash(self.inplace) \
^ hash(self.new_order) ^ hash(self.input_broadcastable)
self._hashval = (
hash(type(self).__name__)
^ hash(type(self).__module__)
^ hash(self.inplace)
^ hash(self.new_order)
^ hash(self.input_broadcastable))
def __hash__(self):
return self._hashval
def __str__(self):
if self.inplace:
return "InplaceDimShuffle{%s}" % ",".join(str(x) for x in self.new_order)
return "InplaceDimShuffle{%s}" % ",".join(str(x)
for x in self.new_order)
else:
return "DimShuffle{%s}" % ",".join(str(x) for x in self.new_order)
......@@ -220,7 +236,7 @@ class DimShuffle(Op):
if not self.inplace:
res = numpy.copy(res)
storage[0] = numpy.asarray(res) #asarray puts scalars back into array
storage[0] = numpy.asarray(res) # asarray puts scalars back into array
def infer_shape(self, node, shapes):
ishp, = shapes
......@@ -256,32 +272,33 @@ class DimShuffle(Op):
clear_output = ['if (%(res)s) {Py_XDECREF(%(res)s);}']
#get the copy / view of the input depending on whether we're doing things inplace or not.
# get the copy / view of the input depending on whether we're doing
# things inplace or not.
if self.inplace:
get_base = ['{ PyArrayObject * %(basename)s = %(input)s', 'Py_INCREF((PyObject*)%(basename)s)']
else:
get_base = [('{ PyArrayObject * %(basename)s = (PyArrayObject*)PyArray_FromAny((PyObject*)%(input)s, NULL,'
'0, 0, NPY_ALIGNED|NPY_ENSURECOPY, NULL)')]
shape_statements = ['npy_intp dimensions[%i]'%nd_out]
shape_statements = ['npy_intp dimensions[%i]' % nd_out]
for i, o in enumerate(self.new_order):
if o != 'x':
shape_statements += [('dimensions['+str(i)+'] = %(basename)s->dimensions['+str(o)+']')]
shape_statements += [('dimensions[' + str(i) + '] = %(basename)s->dimensions[' + str(o) + ']')]
else:
shape_statements += [('dimensions['+str(i)+'] = 1')]
shape_statements += [('dimensions[' + str(i) + '] = 1')]
strides_statements = ['npy_intp strides[%i]'%nd_out]
strides_statements = ['npy_intp strides[%i]' % nd_out]
#set the strides of the non-broadcasted dimensions
for i, o in enumerate(self.new_order):
if o != 'x':
strides_statements += [('strides['+str(i)+'] = %(basename)s->strides['+str(o)+']')]
strides_statements += [('strides[' + str(i) + '] = %(basename)s->strides[' + str(o) + ']')]
else:
strides_statements += [('strides['+str(i)+'] = 0')]
strides_statements += [('strides[' + str(i) + '] = 0')]
# set the strides of the broadcasted dimensions
# this algorithm is from numpy: PyArray_Newshape() in cvs/numpy/numpy/core/src/multiarraymodule.c
# this algorithm is from numpy: PyArray_Newshape() in
# cvs/numpy/numpy/core/src/multiarraymodule.c
if nd_out > 0:
strides_statements.append(
'if (strides[' +
......@@ -290,8 +307,8 @@ class DimShuffle(Op):
str(nd_out) +
'-1] = %(basename)s->descr->elsize'
)
for i in xrange(nd_out-2,-1, -1):
strides_statements.append("if (strides[%(i)s] == 0) strides[%(i)s] = strides[%(i)s+1] * dimensions[%(i)s+1]"%dict(i=str(i)))
for i in xrange(nd_out - 2, -1, -1):
strides_statements.append("if (strides[%(i)s] == 0) strides[%(i)s] = strides[%(i)s+1] * dimensions[%(i)s+1]" % dict(i=str(i)))
#
# PyObject* PyArray_New(PyTypeObject* subtype, int nd, npy_intp* dims, int type_num,
......@@ -332,7 +349,6 @@ class DimShuffle(Op):
print full_code
if 0:
import sys
sys.exit()
return full_code % dict(locals(), **sub)
......@@ -351,8 +367,8 @@ class DimShuffle(Op):
# Do not make the DimShuffle inplace, as an optimization at the
# canonicalization phase will remove the inplace.
# The inplace will be reintroduced automatically later in the graph.
return [DimShuffle(gz.type.broadcastable, grad_order)(Elemwise(scalar.identity)(gz))]
return [DimShuffle(gz.type.broadcastable, grad_order)(
Elemwise(scalar.identity)(gz))]
class DimShufflePrinter:
......@@ -365,7 +381,8 @@ class DimShufflePrinter:
return pstate.pprinter.process(r)
if list(new_order) == list(reversed(range(r.type.ndim))):
return "%s.T" % pstate.pprinter.process(r)
return "DimShuffle{%s}(%s)" % (", ".join(map(str, new_order)), pstate.pprinter.process(r))
return "DimShuffle{%s}(%s)" % (", ".join(map(str, new_order)),
pstate.pprinter.process(r))
def process(self, r, pstate):
if r.owner is None:
......@@ -376,8 +393,8 @@ class DimShufflePrinter:
else:
raise TypeError("Can only print DimShuffle.")
pprint.assign(lambda pstate, r: r.owner and isinstance(r.owner.op, DimShuffle), DimShufflePrinter())
pprint.assign(lambda pstate, r: r.owner and isinstance(r.owner.op, DimShuffle),
DimShufflePrinter())
################
......@@ -405,30 +422,34 @@ class Elemwise(Op):
Elemwise(add) # represents + on tensors (x + y)
Elemwise(add, {0 : 0}) # represents the += operation (x += y)
Elemwise(add, {0 : 1}) # represents += on the second argument (y += x)
Elemwise(mul)(rand(10, 5), rand(1, 5)) # the second input is completed along the first dimension to match the first input
Elemwise(true_div)(rand(10, 5), rand(10, 1)) # same but along the second dimension
Elemwise(mul)(rand(10, 5), rand(1, 5)) # the second input is completed
# along the first dimension to match the first input
Elemwise(true_div)(rand(10, 5), rand(10, 1)) # same but along the
# second dimension
Elemwise(int_div)(rand(1, 5), rand(10, 1)) # the output has size (10, 5)
Elemwise(log)(rand(3, 4, 5))
"""
def __init__(self, scalar_op, inplace_pattern = {}, name = None, nfunc_spec = None):
def __init__(self, scalar_op, inplace_pattern={}, name=None,
nfunc_spec=None):
"""
Usage: Elemwise(scalar_op, inplace_pattern = {})
* scalar_op: an instance of a subclass of scalar.ScalarOp which works uniquely on
scalars
* scalar_op: an instance of a subclass of scalar.ScalarOp which works
uniquely on scalars
* inplace_pattern: a dictionary that maps the index of an output to the
index of an input so the output is calculated inplace using
the input's storage. (Just like destroymap, but without the lists.)
* nfunc_spec: either None or a tuple of three elements, (nfunc_name, nin, nout) such
that getattr(numpy, nfunc_name) implements this operation, takes nin
inputs and abs(nout) outputs (nout < 0 if the numpy function
does not provide the option of providing a numpy array to store the
results in). Note that nin cannot always be inferred from the scalar op's
own nin field because that value is sometimes 0 (meaning a variable number
of inputs), whereas the numpy function may not have varargs. NOTE: as of
now, the sign of the nout field is ignored (some work needs to be done
to resize the destinations when needed).
index of an input so the output is calculated inplace using
the input's storage. (Just like destroymap, but without the lists.)
* nfunc_spec: either None or a tuple of three elements,
(nfunc_name, nin, nout) such that getattr(numpy, nfunc_name)
implements this operation, takes nin inputs and abs(nout) outputs
(nout < 0 if the numpy function does not provide the option of
providing a numpy array to store the results in). Note that nin
cannot always be inferred from the scalar op's own nin field
because that value is sometimes 0 (meaning a variable number of
inputs), whereas the numpy function may not have varargs.
NOTE: as of now, the sign of the nout field is ignored (some work
needs to be done to resize the destinations when needed).
"""
self.name = name
self.scalar_op = scalar_op
......@@ -441,7 +462,8 @@ class Elemwise(Op):
if nfunc_spec:
self.nfunc = getattr(numpy, nfunc_spec[0])
elif scalar_op.nin > 0:
self.ufunc = numpy.frompyfunc(scalar_op.impl, scalar_op.nin, scalar_op.nout)
self.ufunc = numpy.frompyfunc(scalar_op.impl, scalar_op.nin,
scalar_op.nout)
#precompute the hash of this node
self._rehash()
......@@ -461,7 +483,8 @@ class Elemwise(Op):
if getattr(self, 'nfunc_spec', None):
self.nfunc = getattr(numpy, self.nfunc_spec[0])
elif self.scalar_op.nin > 0:
self.ufunc = numpy.frompyfunc(self.scalar_op.impl, self.scalar_op.nin, self.scalar_op.nout)
self.ufunc = numpy.frompyfunc(self.scalar_op.impl,
self.scalar_op.nin, self.scalar_op.nout)
self._rehash()
def make_node(self, *inputs):
......@@ -472,7 +495,8 @@ class Elemwise(Op):
"""
inputs = map(as_tensor_variable, inputs)
shadow = self.scalar_op.make_node(*[Scalar(dtype=i.type.dtype)() for i in inputs])
shadow = self.scalar_op.make_node(
*[Scalar(dtype=i.type.dtype)() for i in inputs])
target_length = max([input.type.ndim for input in inputs])
......@@ -486,30 +510,43 @@ class Elemwise(Op):
# TODO: use LComplete instead
args.append(DimShuffle(
input.type.broadcastable,
['x']*difference + range(length),
inplace = True)(input))
['x'] * difference + range(length),
inplace=True)(input))
inputs = args
#HERE: all the broadcast dims have the same length now
#cleverness: we iterate over the first, second, third broadcast flag of all inputs in
#parallel... the all() gives us each output broadcastable bit in turn.
# cleverness: we iterate over the first, second, third broadcast flag
# of all inputs in parallel... the all() gives us each output
# broadcastable bit in turn.
#it is multiplied by nout because Elemwise supports multiple outputs (nout of them)
out_broadcastables = [[all(bcast) for bcast in zip(*[input.type.broadcastable for input in inputs])]] * shadow.nout
# it is multiplied by nout because Elemwise supports multiple outputs
# (nout of them)
out_broadcastables = [[all(bcast)
for bcast in zip(*[input.type.broadcastable
for input in inputs])]] * shadow.nout
#inplace_pattern maps output idx -> input idx
inplace_pattern = self.inplace_pattern
if inplace_pattern:
for overwriter, overwritten in inplace_pattern.items():
for ob, ib in zip(out_broadcastables[overwriter], inputs[overwritten].type.broadcastable):
for ob, ib in zip(out_broadcastables[overwriter],
inputs[overwritten].type.broadcastable):
if ib and not ob:
raise ValueError("Operation cannot be done inplace on an input with broadcasted dimensions.")
raise ValueError((
"Operation cannot be done inplace on an input "
"with broadcasted dimensions."))
out_dtypes = [o.type.dtype for o in shadow.outputs]
if any(inputs[i].type.dtype != out_dtypes[o] for o, i in inplace_pattern.items()):
raise TypeError("Cannot do an inplace operation on incompatible data types.",
([i.type.dtype for i in inputs], out_dtypes, inplace_pattern))
outputs = [TensorType(dtype = dtype, broadcastable = broadcastable)() for dtype, broadcastable in zip(out_dtypes, out_broadcastables)]
if any(inputs[i].type.dtype != out_dtypes[o]
for o, i in inplace_pattern.items()):
raise TypeError((
"Cannot do an inplace operation on incompatible data types.",
([i.type.dtype for i in inputs], out_dtypes, inplace_pattern)))
outputs = [TensorType(dtype=dtype, broadcastable=broadcastable)()
for dtype, broadcastable in zip(out_dtypes, out_broadcastables)
]
return Apply(self, inputs, outputs)
def __eq__(self, other):
......@@ -518,25 +555,24 @@ class Elemwise(Op):
other_items = other.inplace_pattern.items()
items.sort()
other_items.sort()
rval = (self.scalar_op == other.scalar_op) and (items == other_items)
rval = ((self.scalar_op == other.scalar_op)
and (items == other_items))
return rval
return False
def _rehash(self):
items = self.inplace_pattern.items()
items.sort()
first_part = [k for k,v in items]
first_part = [k for k, v in items]
second_part = []
for k,v in items:
for k, v in items:
if isinstance(v, (tuple, list)):
second_part += [tuple(v)]
else:
second_part += [v]
tuple_items = tuple(first_part + second_part)
#backport
#tuple_items = tuple([k for k,v in items] + [(tuple(v) if isinstance(v, (tuple, list)) else v) for k,v in items])
h = hash('Elemwise') ^ hash(self.scalar_op) ^ hash(tuple_items)
assert h == getattr(self,'_hashval', h)
assert h == getattr(self, '_hashval', h)
self._hashval = h
def __hash__(self):
......@@ -560,7 +596,7 @@ class Elemwise(Op):
for idx, out in enumerate(outs):
# make such that _bgrads computes only the gradients of the
# current output on the inputs ( and not all outputs)
ograds = [ theano.tensor.zeros_like(x) for x in outs]
ograds = [theano.tensor.zeros_like(x) for x in outs]
ograds[idx] = theano.tensor.ones_like(out)
bgrads = self._bgrad(inputs, ograds)
......@@ -578,9 +614,9 @@ class Elemwise(Op):
pass
elif eval_point is not None:
if rop_out is None:
rop_out = bgrads[jdx]*eval_point
rop_out = bgrads[jdx] * eval_point
else:
rop_out = rop_out + bgrads[jdx]*eval_point
rop_out = rop_out + bgrads[jdx] * eval_point
rval[idx] = rop_out
......@@ -589,17 +625,18 @@ class Elemwise(Op):
def grad(self, inputs, ograds):
#compute grad with respect to broadcasted input
rval = self._bgrad(inputs,ograds)
rval = self._bgrad(inputs, ograds)
#sum out the broadcasted dimensions
for i, ipt in enumerate(inputs):
if rval[i] is None:
continue
# list of all the dimensions that are broadcastable for input[i] so we
# can sum over them
# list of all the dimensions that are broadcastable for input[i] so
# we can sum over them
# todo: only count dimensions that were effectively broadcasted
to_sum = [j for j, bcast in enumerate(ipt.type.broadcastable) if bcast]
to_sum = [j for j, bcast in enumerate(ipt.type.broadcastable)
if bcast]
if to_sum:
shuffle = []
......@@ -612,7 +649,7 @@ class Elemwise(Op):
j += 1
#close if
#close for
sr = Sum(axis = to_sum)(rval[i])
sr = Sum(axis=to_sum)(rval[i])
sr = sr.dimshuffle(shuffle)
#sr = DimShuffle(sr.type.broadcastable, shuffle)(sr)
rval[i] = sr
......@@ -621,7 +658,6 @@ class Elemwise(Op):
return rval
def _bgrad(self, inputs, ograds):
# returns grad, with respect to broadcasted versions of inputs
......@@ -636,15 +672,17 @@ class Elemwise(Op):
theano.config.compute_test_value = 'off'
scalar_inputs = [Scalar(dtype = t.type.dtype)() for t in inputs]
scalar_ograds = [Scalar(dtype = ograd.type.dtype)() for ograd in ograds]
scalar_inputs = [Scalar(dtype=t.type.dtype)() for t in inputs]
scalar_ograds = [Scalar(dtype=ograd.type.dtype)()
for ograd in ograds]
scalar_igrads = self.scalar_op.grad(scalar_inputs, scalar_ograds)
finally:
theano.config.compute_test_value = prev_setting
nd = len(inputs[0].type.broadcastable) # this is the same for everyone
nd = len(inputs[0].type.broadcastable) # this is the same for everyone
def transform(r):
# From a graph of ScalarOps, make a graph of Broadcast ops.
if r in scalar_inputs:
......@@ -654,12 +692,14 @@ class Elemwise(Op):
node = r.owner
if node is None:
# the gradient contains a constant, translate it as
# an equivalent TensorType of size 1 and proper number of dimensions
res = TensorConstant(TensorType(dtype = r.type.dtype,
broadcastable = ()),
numpy.asarray(r.data)) # .reshape(b)
return DimShuffle((), ['x']*nd, inplace = True)(res)
new_r = Elemwise(node.op, {})(*[transform(ipt) for ipt in node.inputs])
# an equivalent TensorType of size 1 and proper number of
# dimensions
res = TensorConstant(TensorType(dtype=r.type.dtype,
broadcastable=()),
numpy.asarray(r.data)) # .reshape(b)
return DimShuffle((), ['x'] * nd, inplace=True)(res)
new_r = Elemwise(node.op, {})(
*[transform(ipt) for ipt in node.inputs])
return new_r
ret = []
for scalar_igrad, ipt in zip(scalar_igrads, inputs):
......@@ -667,18 +707,19 @@ class Elemwise(Op):
# undefined gradient
ret.append(None)
continue
ret.append( transform(scalar_igrad))
ret.append(transform(scalar_igrad))
return ret
def perform(self, node, inputs, output_storage):
maxsize = max(len(input.shape) for input in inputs)
for dims in zip(*[[(1, True)]*(maxsize - len(input.shape)) + zip(input.shape, sinput.type.broadcastable)
for dims in zip(*[([(1, True)] * (maxsize - len(input.shape))
+ zip(input.shape, sinput.type.broadcastable))
for input, sinput in zip(inputs, node.inputs)]):
if max(d for d,b in dims) != 1 and (1, False) in dims:
if max(d for d, b in dims) != 1 and (1, False) in dims:
# yes there may be more compact ways to write this code,
# but please maintain python 2.4 compatibility (no "x if c else y")
# but please maintain python 2.4 compatibility
# (no "x if c else y")
msg = []
assert len(inputs) == len(node.inputs)
for input, sinput in zip(inputs, node.inputs):
......@@ -701,33 +742,32 @@ class Elemwise(Op):
raise ValueError('\n'.join(msg_chunks))
else:
raise ValueError(base_exc_str)
#backport
#raise ValueError('Dimension mismatch; shapes are %s' %
# ', '.join('(%s)' % ', '.join('*' if b else str(d)
# for d, b in zip(input.shape, sinput.type.broadcastable))
# for input, sinput in zip(inputs, node.inputs)))
# Other mismatches will be caught by the ufunc
if not self.inplace_pattern:
for output, storage in zip(node.outputs, output_storage):
odat = storage[0]
shape = [max(values) for values in zip(*[input.shape for input in inputs])]
shape = [max(values)
for values in zip(*[input.shape for input in inputs])]
if odat is not None:
# reuse storage if we can
odat.resize(shape, refcheck = 0)
odat.resize(shape, refcheck=0)
else:
odat = numpy.ndarray(shape, dtype = output.type.dtype)
odat = numpy.ndarray(shape, dtype=output.type.dtype)
storage[0] = odat
else:
for i, (output, storage) in enumerate(zip(node.outputs, output_storage)):
for i, (output, storage) in enumerate(zip(node.outputs,
output_storage)):
#i is an output idx
if i in self.inplace_pattern:
odat = inputs[self.inplace_pattern[i]]
else:
odat = storage[0]
shape = [max(values) for values in zip(*[input.shape for input in inputs])]
shape = [max(values)
for values in zip(*[input.shape
for input in inputs])]
if odat is not None:
odat.resize(shape, refcheck = 0)
odat.resize(shape, refcheck=0)
else:
odat = numpy.ndarray(shape, dtype=output.type.dtype)
storage[0] = odat
......@@ -784,10 +824,13 @@ class Elemwise(Op):
# Since numpy 1.6, functions created with numpy.frompyfunc
# always return an ndarray with dtype object
variable = numpy.asarray(variable, dtype=nout.dtype)
if hasattr(variable, 'shape') and storage[0].shape != variable.shape:
if (hasattr(variable, 'shape')
and storage[0].shape != variable.shape):
if numpy.prod(variable.shape) == 0:
# numpy does not resize from a shape (1,5) to (0,5)
# This bypass the inplace... But I it is important in this case.
# This bypasses the inplace...
# But it is important in this case.
storage[0] = variable
continue
storage[0].resize(variable.shape)
......@@ -797,7 +840,8 @@ class Elemwise(Op):
else:
storage[0].itemset(variable)
assert str(storage[0].dtype) != 'object'
# the following should be used instead of the previous loop, unfortunately it tends to segfault
# the following should be used instead of the previous loop,
# unfortunately it tends to segfault
# self.ufunc(*(ufunc_args+[s[0] for s in output_storage]))
def infer_shape(self, node, i_shapes):
......@@ -806,12 +850,15 @@ class Elemwise(Op):
oshp = []
for dim, b in enumerate(o.type.broadcastable):
b_dim = None
if b: # this is broadcastable
if b:
# this is broadcastable
b_dim = 1
else: # there must be some input that is not broadcastable in dimension 'dim'
for ishp, i in zip(i_shapes,node.inputs):
if isinstance(i.type,theano.scalar.Scalar):
continue #we skip scalar
else:
# there must be some input that is not broadcastable in
# dimension 'dim'
for ishp, i in zip(i_shapes, node.inputs):
if isinstance(i.type, theano.scalar.Scalar):
continue # we skip scalar
if not i.type.broadcastable[dim]:
# input i is not broadcastable in position dim
# therefore if its shape is known, we can use it
......@@ -819,12 +866,14 @@ class Elemwise(Op):
if ishp[dim]:
b_dim = ishp[dim]
break
# b_dim might still be None, if every input's shape was unknown in dimension 'dim'
# b_dim might still be None, if every input's shape was unknown
# in dimension 'dim'
oshp.append(b_dim)
# TODO: it would be interesting to return the constraining information that if
# one of the inputs shape[dim] is known and another input's shape[dim] is not,
# that we can now assume that the other input's shape[dim] is the same as the
# first.
# TODO: it would be interesting to return the constraining
# information that if one of the inputs shape[dim] is known
# and another input's shape[dim] is not, that we can now assume
# that the other input's shape[dim] is the same as the first.
rval.append(tuple(oshp))
return rval
......@@ -888,16 +937,17 @@ class Elemwise(Op):
# We loop over the "real" outputs, i.e., those that are not
# inplace (must be allocated) and we declare/allocate/check
# them
for output, oname, odtype in zip(real_outputs, real_onames, real_odtypes):
i += 1 # before this loop, i = number of inputs
for output, oname, odtype in zip(
real_outputs, real_onames, real_odtypes):
i += 1 # before this loop, i = number of inputs
sub['lv%i' % i] = oname
sub['olv'] = oname
alloc += cgen.make_declare([range(nnested)], [odtype],
dict(sub, lv0 = oname))
dict(sub, lv0=oname))
alloc += cgen.make_alloc(orders, odtype, sub)
alloc += cgen.make_checks([range(nnested)], [odtype],
dict(sub, lv0 = oname))
olv_index = i # index of the last output
dict(sub, lv0=oname))
olv_index = i # index of the last output
# We loop over the "aliased" outputs, i.e., those that are
# inplace (overwrite the contents of one of the inputs) and
......@@ -927,15 +977,18 @@ class Elemwise(Op):
# We declare the scalar variables used in the inner loop to do
# the element-wise computation. Aliased scalar variables need
# not be declared, as they are #defined in defines
task_decl = "".join(["%(dtype)s& %(name)s_i = *%(name)s_iter;\n" % locals()
for name, dtype in zip(inames + list(real_onames),
idtypes + list(real_odtypes))])
task_decl = "".join([
"%(dtype)s& %(name)s_i = *%(name)s_iter;\n" % locals()
for name, dtype in zip(inames + list(real_onames),
idtypes + list(real_odtypes))])
# We generate the C code of the inner loop using the scalar op
task_code = self.scalar_op.c_code(
Apply(self.scalar_op,
[Scalar(dtype = input.type.dtype)() for input in node.inputs],
[Scalar(dtype = output.type.dtype)() for output in node.outputs]),
[Scalar(dtype=input.type.dtype)()
for input in node.inputs],
[Scalar(dtype=output.type.dtype)()
for output in node.outputs]),
nodename + '_scalar_',
["%s_i" % s for s in _inames],
["%s_i" % s for s in onames],
......@@ -950,11 +1003,11 @@ class Elemwise(Op):
""" % locals()
loop = cgen.make_reordered_loop(
init_loop_orders = orders + [range(nnested)] * len(real_onames),
olv_index = olv_index,
dtypes = idtypes + list(real_odtypes),
inner_task = code,
sub = sub)
init_loop_orders=orders + [range(nnested)] * len(real_onames),
olv_index=olv_index,
dtypes=(idtypes + list(real_odtypes)),
inner_task=code,
sub=sub)
return decl, checks, alloc, loop
def c_code(self, node, nodename, inames, onames, sub):
......@@ -973,12 +1026,12 @@ class Elemwise(Op):
return support_code
def c_code_cache_version_apply(self, node):
version = [6] # the version corresponding to the c code in this Op
version = [6] # the version corresponding to the c code in this Op
# now we insert versions for the ops on which we depend...
scalar_node = Apply(self.scalar_op,
[Scalar(dtype = input.type.dtype)() for input in node.inputs],
[Scalar(dtype = output.type.dtype)() for output in node.outputs])
[Scalar(dtype=input.type.dtype)() for input in node.inputs],
[Scalar(dtype=output.type.dtype)() for output in node.outputs])
version.extend(self.scalar_op.c_code_cache_version_apply(scalar_node))
for i in node.inputs + node.outputs:
version.extend(Scalar(dtype=i.type.dtype).c_code_cache_version())
......@@ -996,7 +1049,6 @@ class Elemwise(Op):
# raise TypeError('All ops in the graph must be Elemwise.')
################
### CAReduce ###
################
......@@ -1040,7 +1092,9 @@ class CAReduce(Op):
- if None, all dimensions are reduced
"""
if scalar_op.nin not in [-1, 2] or scalar_op.nout != 1:
raise NotImplementedError("CAReduce only supports binary functions with a single output.")
raise NotImplementedError((
"CAReduce only supports binary functions with a single "
"output."))
self.scalar_op = scalar_op
if axis is None:
......@@ -1081,20 +1135,23 @@ class CAReduce(Op):
if self.axis is not None:
for axis in self.axis:
if axis >= input.type.ndim or (axis<0 and abs(axis)>input.type.ndim):
raise ValueError('Not enough dimensions on %s to reduce on axis %s' % (input, axis))
if (axis >= input.type.ndim
or (axis < 0 and abs(axis) > input.type.ndim)):
raise ValueError((
'Not enough dimensions on %s to reduce on axis %s'
% (input, axis)))
input = as_tensor_variable(input)
axis = self.axis
if axis is None:
axis = range(len(input.type.broadcastable))
if any([a<0 for a in axis]):
axis2=[]
if any([a < 0 for a in axis]):
axis2 = []
for a in self.axis:
if a<0:
axis2.append(a+input.type.ndim)
if a < 0:
axis2.append(a + input.type.ndim)
else:
axis2.append(a)
assert len(axis)==len(axis2)
assert len(axis) == len(axis2)
axis = tuple(axis2)
op = self.__class__(self.scalar_op, axis)
else:
......@@ -1115,7 +1172,9 @@ class CAReduce(Op):
self.set_ufunc(self.scalar_op)
def __eq__(self, other):
return type(self) == type(other) and self.scalar_op == other.scalar_op and self.axis == other.axis
return (type(self) == type(other)
and self.scalar_op == other.scalar_op
and self.axis == other.axis)
def __hash__(self):
if self.axis is None:
......@@ -1125,7 +1184,8 @@ class CAReduce(Op):
def __str__(self):
if self.axis is not None:
return "Reduce{%s}{%s}" % (self.scalar_op, ", ".join(str(x) for x in self.axis))
return "Reduce{%s}{%s}" % (
self.scalar_op, ", ".join(str(x) for x in self.axis))
else:
return "Reduce{%s}" % self.scalar_op
......@@ -1139,13 +1199,17 @@ class CAReduce(Op):
to_reduce = reversed(sorted(axis))
if to_reduce:
for dimension in to_reduce:
# If it's a zero-size array, use scalar_op.identity if available
# If it's a zero-size array, use scalar_op.identity
# if available
if variable.shape[dimension] == 0:
if hasattr(self.scalar_op, 'identity'):
variable = numpy.array(self.scalar_op.identity)
break
else:
raise ValueError("Input (%s) has zero-size on axis %s, but self.scalar_op (%s) has no attribute 'identity'" % (variable, dimension, self.scalar_op))
raise ValueError((
"Input (%s) has zero-size on axis %s, but "
"self.scalar_op (%s) has no attribute 'identity'"
% (variable, dimension, self.scalar_op)))
else:
# Numpy 1.6 has a bug where you sometimes have to specify
# "dtype='object'" in reduce for it to work, if the ufunc
......@@ -1161,9 +1225,11 @@ class CAReduce(Op):
variable = numpy.asarray(variable)
if numpy.may_share_memory(variable, input):
# perhaps numpy is clever for reductions of size 1? We don't want this.
# perhaps numpy is clever for reductions of size 1?
# We don't want this.
variable = variable.copy()
output[0] = theano._asarray(variable, dtype = node.outputs[0].type.dtype)
output[0] = theano._asarray(variable,
dtype=node.outputs[0].type.dtype)
else:
output[0] = numpy.copy(variable)
......@@ -1172,8 +1238,9 @@ class CAReduce(Op):
axis = self.axis
if axis is None:
return (),
return [ishape[i] for (i,b) in enumerate(node.inputs[0].type.broadcastable) if i not in axis],
return [ishape[i]
for (i, b) in enumerate(node.inputs[0].type.broadcastable)
if i not in axis],
def _c_all(self, node, name, inames, onames, sub):
......@@ -1210,36 +1277,41 @@ class CAReduce(Op):
i += 1
sub['lv%i' % i] = oname
sub['olv'] = oname
alloc += cgen.make_declare([range(nnested) + ['x'] * len(axis)], [odtype], dict(sub, lv0 = oname))
alloc += cgen.make_declare(
[range(nnested) + ['x'] * len(axis)],
[odtype], dict(sub, lv0=oname))
alloc += cgen.make_alloc([order1], odtype, sub)
alloc += cgen.make_checks([range(nnested) + ['x'] * len(axis)], [odtype], dict(sub, lv0 = oname))
alloc += cgen.make_checks(
[range(nnested) + ['x'] * len(axis)],
[odtype], dict(sub, lv0=oname))
if hasattr(self.scalar_op,'identity'):
if hasattr(self.scalar_op, 'identity'):
identity = self.scalar_op.identity
elif self.scalar_op in [scalar.maximum, scalar.minimum]:
if self.scalar_op == scalar.maximum:
scal_name = 'maximum'
if input.type.dtype in ["float32","float64"]:
if input.type.dtype in ["float32", "float64"]:
identity = "-__builtin_inf()"
elif input.type.dtype.startswith("uint"):
# numpy1.5.1 don't define NPY_MIN_UINT*
identity = "0"
else:
identity = "NPY_MIN_"+str(input.type.dtype).upper()
identity = "NPY_MIN_" + str(input.type.dtype).upper()
if self.scalar_op == scalar.minimum:
scal_name = 'minimum'
if input.type.dtype in ["float32","float64"]:
if input.type.dtype in ["float32", "float64"]:
identity = "__builtin_inf()"
else:
identity = "NPY_MAX_"+str(input.type.dtype).upper()
identity = "NPY_MAX_" + str(input.type.dtype).upper()
fail = sub["fail"]
pattern=[0]*len(node.inputs[0].broadcastable)
pattern = [0] * len(node.inputs[0].broadcastable)
axis = self.axis
if axis == None: axis = range(len(pattern))
if axis == None:
axis = range(len(pattern))
for i in axis:
pattern[i]=1
pattern[i] = 1
pattern_ = str(pattern)[1:-1]
decl +="""int tosum[]={%(pattern_)s};"""%locals()
decl += """int tosum[]={%(pattern_)s};""" % locals()
alloc += """
for(int i=0;i<%(iname)s->nd;i++){
if(PyArray_DIMS(%(iname)s)[i]==0 && tosum[i]){
......@@ -1247,23 +1319,30 @@ for(int i=0;i<%(iname)s->nd;i++){
%(fail)s;
}
}
"""%locals()
""" % locals()
else:
raise TypeError("The CAReduce.scalar_op must have an identity field.")
task0_decl = "%(dtype)s& %(name)s_i = *%(name)s_iter;\n%(name)s_i = %(identity)s;" % dict(dtype = odtype,
name = onames[0],
identity = identity)
task1_decl = "%(dtype)s& %(name)s_i = *%(name)s_iter;\n" % dict(dtype = idtype, name = inames[0])
task1_code = self.scalar_op.c_code(Apply(self.scalar_op,
[Scalar(dtype = input.type.dtype)() for input in node.inputs*2],
[Scalar(dtype = output.type.dtype)() for input in node.outputs]),
None,
["%s_i" % onames[0], "%s_i" % inames[0]],
["%s_i" % onames[0]],
sub)
raise TypeError(
"The CAReduce.scalar_op must have an identity field.")
task0_decl = (
"%(dtype)s& %(name)s_i = *%(name)s_iter;\n"
"%(name)s_i = %(identity)s;"
% dict(dtype=odtype, name=onames[0], identity=identity))
task1_decl = ("%(dtype)s& %(name)s_i = *%(name)s_iter;\n"
% dict(dtype=idtype, name=inames[0]))
task1_code = self.scalar_op.c_code(
Apply(
self.scalar_op,
[Scalar(dtype=input.type.dtype)()
for input in (node.inputs * 2)],
[Scalar(dtype=output.type.dtype)()
for input in node.outputs]),
None,
["%s_i" % onames[0], "%s_i" % inames[0]],
["%s_i" % onames[0]],
sub)
code1 = """
{
%(task1_decl)s
......@@ -1275,10 +1354,16 @@ for(int i=0;i<%(iname)s->nd;i++){
if len(axis) == 1:
all_code = [("", "")] * nnested + [(task0_decl, code1), ""]
else:
all_code = [("", "")] * nnested + [(task0_decl, "")] + [("", "")] * (len(axis) - 2) + [("", code1), ""]
all_code = (
[("", "")] * nnested
+ [(task0_decl, "")]
+ [("", "")] * (len(axis) - 2)
+ [("", code1), ""])
else:
all_code = [task0_decl + code1]
loop = cgen.make_loop([order, range(nnested) + ['x'] * len(axis)], [idtype, odtype], all_code, sub)
loop = cgen.make_loop(
[order, range(nnested) + ['x'] * len(axis)],
[idtype, odtype], all_code, sub)
return decl, checks, alloc, loop
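# A minimal sketch, in plain Python/numpy, of the identity initialisation the
# generated C code above relies on: the output buffer starts at the scalar
# op's identity (e.g. -inf or NPY_MIN_* for maximum, +inf or NPY_MAX_* for
# minimum), then every input element is folded in.
import numpy

def reduce_with_identity(x, binop, identity):
    acc = identity
    for v in x.ravel():
        acc = binop(acc, v)
    return acc

assert reduce_with_identity(numpy.array([3., -7., 2.]), max, -numpy.inf) == 3.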
def c_code(self, node, name, inames, onames, sub):
......@@ -1290,12 +1375,12 @@ for(int i=0;i<%(iname)s->nd;i++){
return ['<vector>', '<algorithm>']
def c_code_cache_version_apply(self, node):
version = [4] # the version corresponding to the c code in this Op
version = [4] # the version corresponding to the c code in this Op
# now we insert versions for the ops on which we depend...
scalar_node = Apply(self.scalar_op,
[Scalar(dtype = input.type.dtype)() for input in node.inputs],
[Scalar(dtype = output.type.dtype)() for output in node.outputs])
[Scalar(dtype=input.type.dtype)() for input in node.inputs],
[Scalar(dtype=output.type.dtype)() for output in node.outputs])
version.extend(self.scalar_op.c_code_cache_version_apply(scalar_node))
for i in node.inputs + node.outputs:
version.extend(Scalar(dtype=i.type.dtype).c_code_cache_version())
......@@ -1553,8 +1638,9 @@ class Prod(CAReduceDtype):
of the other terms). This is easy to do by broadcasting the original
product.
(Note that we also need to broadcast-multiply by the "incoming gradient",
ie. the gradient of the cost relative to the output/product).
(Note that we also need to broadcast-multiply by the
"incoming gradient", ie. the gradient of the cost relative to the
output/product).
-----
......@@ -1565,8 +1651,8 @@ class Prod(CAReduceDtype):
non-zero, but is zero for all others.
* If more than one zero is present, then all the derivatives are zero.
For the last two cases (with 1 or more zeros), we can't use the division
trick, as this gives divisions by 0.
For the last two cases (with 1 or more zeros), we can't use the
division trick, as this gives divisions by 0.
Implementing that case-by-case logic is not as trivial, so a bunch of
hacks are piled down here to do it. Notably, for the "only one zero"
......@@ -1583,10 +1669,9 @@ class Prod(CAReduceDtype):
'''
prod_in, = inp
gz, = grads
if prod_in.dtype[0:3] in ('int','uin'):
if prod_in.dtype[0:3] in ('int', 'uin'):
return [None]
# Prepare the broadcasting that is used everywhere to broadcast
# over the original groups (ie. broadcast over the elements of a given
# product)
......@@ -1622,7 +1707,8 @@ class Prod(CAReduceDtype):
where_zeros = T.eq(prod_in, 0.0)
sum_where_zeros = T.sum(where_zeros, axis=self.axis)
groups_with_single_zero = T.eq(sum_where_zeros, 1).dimshuffle(new_dims)
groups_with_single_zero = T.eq(sum_where_zeros, 1).dimshuffle(
new_dims)
# tensor with 0 everywhere except for those places where
# a 0 part of a group with a single zero was to be found
where_single_zero = groups_with_single_zero * where_zeros
......@@ -1631,8 +1717,8 @@ class Prod(CAReduceDtype):
where_gz_not_zero = T.neq(gz, 0.0)
# only take ProdWithoutZeros for the groups with single zeros
# with non-null incoming gradient
where_to_take_prod_without_zeros = \
groups_with_single_zero * where_gz_not_zero
where_to_take_prod_without_zeros = (
groups_with_single_zero * where_gz_not_zero)
# preprocess the original input so that we set 0 everywhere
# except for groups that contain a single zero, to avoid computing
# multiplications on other groups
......@@ -1640,13 +1726,17 @@ class Prod(CAReduceDtype):
# TODO: put lazy switch here, if it'd work
# this is pretty efficient already (no multiplication if 0), but
# it'd be even better if we had a lazy if per element
prod_without_zeros = ProdWithoutZeros(axis=self.axis)(prod_without_zeros_in)
prod_without_zeros = ProdWithoutZeros(axis=self.axis)(
prod_without_zeros_in)
prod_without_zeros = prod_without_zeros.dimshuffle(new_dims)
groups_without_zeros = T.eq(sum_where_zeros, 0).dimshuffle(new_dims)
groups_without_zeros = T.eq(sum_where_zeros, 0).dimshuffle(
new_dims)
final_grad = T.switch(groups_without_zeros, grad_case_without_zeros,
T.switch(where_single_zero, prod_without_zeros, 0.0) * gz)
final_grad = T.switch(
groups_without_zeros,
grad_case_without_zeros,
T.switch(where_single_zero, prod_without_zeros, 0.0) * gz)
return [final_grad]
......@@ -1659,6 +1749,7 @@ class Prod(CAReduceDtype):
def c_code_cache_version(self):
return ()
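# A rough numpy sketch (not the Op's actual implementation) of the strategy
# described in Prod.grad above: the "division trick" when no zeros are
# present, a ProdWithoutZeros-like product when exactly one zero is present,
# and an all-zero gradient otherwise.
import numpy

def prod_grad_1d(x, gz):
    zeros = (x == 0)
    n_zeros = zeros.sum()
    if n_zeros == 0:
        return gz * numpy.prod(x) / x        # division trick
    if n_zeros == 1:
        prod_others = numpy.prod(x[~zeros])  # product of the non-zero terms
        return numpy.where(zeros, gz * prod_others, 0.0)
    return numpy.zeros_like(x)               # >= 2 zeros: every derivative is 0

# prod_grad_1d(numpy.array([2., 3., 4.]), 1.0) -> [12., 8., 6.]
# prod_grad_1d(numpy.array([2., 0., 4.]), 1.0) -> [0., 8., 0.]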
class MulWithoutZeros(scalar.BinaryScalarOp):
# "identity" here is zero, as in Reduce we don't want to start
# with reducing (1, something_else): this leads to the erroneous
......@@ -1669,22 +1760,27 @@ class MulWithoutZeros(scalar.BinaryScalarOp):
identity = 0.
commutative = True
associative = True
def impl(self, x, y):
if x == 0:
return y
if y == 0:
return x
return x*y
return x * y
def c_code(self, node, name, inp, out, sub):
x, y = inp
z, = out
return ("%(z)s = ((%(x)s == 0) ? (%(y)s) : " + \
"((%(y)s == 0) ? (%(x)s) : ((%(y)s)*(%(x)s))) );") % locals()
return (("%(z)s = ((%(x)s == 0) ? (%(y)s) : "
+ "((%(y)s == 0) ? (%(x)s) : ((%(y)s)*(%(x)s))) );")
% locals())
def c_code_cache_version(self):
return (1,)
mul_without_zeros = MulWithoutZeros(scalar.upcast_out, name = 'mul_without_zeros')
mul_without_zeros = MulWithoutZeros(scalar.upcast_out,
name='mul_without_zeros')
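# A small illustration of why MulWithoutZeros can use 0 as its reduction
# identity (a pure-Python analogue of impl above): starting from 0 just hands
# back the first real value, and later zeros are skipped instead of wiping
# out the product.
def mul_without_zeros_py(x, y):
    if x == 0:
        return y
    if y == 0:
        return x
    return x * y

assert reduce(mul_without_zeros_py, [2., 0., 5.], 0.) == 10.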
class ProdWithoutZeros(CAReduceDtype):
def __init__(self, axis=None, dtype=None):
......
......@@ -721,14 +721,14 @@ class ShapeFeature(object):
def shape_ir(self, i, r):
"""Return symbolic r.shape[i] for tensor variable r, int i"""
if hasattr(r.type,"broadcastable") and r.type.broadcastable[i]:
if hasattr(r.type, "broadcastable") and r.type.broadcastable[i]:
return self.lscalar_one
else:
return Shape_i(i).make_node(r).outputs[0]
def shape_tuple(self, r):
"""Return a tuple of symbolic shape vars for tensor variable r"""
return tuple([self.shape_ir(i,r) for i in xrange(r.ndim)])
return tuple([self.shape_ir(i, r) for i in xrange(r.ndim)])
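# A hedged sketch of what shape_ir/shape_tuple above provide: broadcastable
# axes have a statically known length of 1 (the cached lscalar_one), every
# other axis becomes a symbolic per-dimension shape. The constant below
# stands in for self.lscalar_one.
import numpy
import theano.tensor as T

def shape_tuple_sketch(r):
    one = T.constant(numpy.asarray(1, dtype='int64'))
    return tuple([one if r.broadcastable[i] else T.shape(r)[i]
                  for i in xrange(r.ndim)])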
def default_infer_shape(self, node, i_shapes):
"""Return a list of shape tuple or None for the outputs of node.
......@@ -861,7 +861,7 @@ class ShapeFeature(object):
if r not in self.shape_of:
try:
self.set_shape(r, self.shape_tuple(r))
except AttributeError: #XXX: where would this come from?
except AttributeError: # XXX: where would this come from?
self.set_shape(r, None)
def make_vector_shape(self, r):
......@@ -949,17 +949,18 @@ class ShapeFeature(object):
if sh is None:
continue
for i, d in enumerate(sh):
# Note: we ignore any shape element that is not typed (i.e. does
# not have a 'dtype' attribute). This means there may still
# remain int elements that are int32 on 32-bit platforms, but
# this works with `local_useless_subtensor`, so for now we
# Note: we ignore any shape element that is not typed (i.e.,
# does not have a 'dtype' attribute). This means there may
# still remain int elements that are int32 on 32-bit platforms,
# but this works with `local_useless_subtensor`, so for now we
# keep it this way. See #266 for a better long-term fix.
if getattr(d, 'dtype', 'int64') != 'int64':
assert d.dtype in theano.tensor.int_dtypes
new_shape += sh[len(new_shape):i + 1]
new_shape[i] = theano.tensor.cast(d, 'int64')
if new_shape:
# We replace the shape with wrong dtype by the one with 'int64'.
# We replace the shape with wrong dtype by the one with
# 'int64'.
new_shape += sh[len(new_shape):]
o_shapes[sh_idx] = tuple(new_shape)
new_shape = []
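# A hedged sketch of the dtype normalisation above: typed shape elements that
# are not int64 (for instance int32 on 32-bit platforms) are cast, while
# plain Python ints are left untouched.
import theano.tensor as T

def normalise_shape(sh):
    return tuple([T.cast(d, 'int64')
                  if getattr(d, 'dtype', 'int64') != 'int64' else d
                  for d in sh])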
......@@ -990,8 +991,8 @@ class ShapeFeature(object):
for (shpnode, idx) in (r.clients + [(node, i)]):
if isinstance(getattr(shpnode, 'op', None), Shape_i):
self.scheduled[shpnode] = new_r
# In case 2, if r is a variable that we've scheduled for shape update, then we
# should cancel it.
# In case 2, if r is a variable that we've scheduled for shape update,
# then we should cancel it.
unscheduled = [k for k, v in self.scheduled.items() if v == r]
for k in unscheduled:
del self.scheduled[k]
......@@ -1212,9 +1213,10 @@ def local_alloc_unary(node):
class Assert(T.Op):
"""
Implements assertion in a computational graph.
Notes:
This Op can be removed from the graph because of optimizations, and can hide
some possible optimizations to the optimizer.
This Op can be removed from the graph because of optimizations, and can
hide some possible optimizations to the optimizer.
Also, the output of the Op must be returned by the function computing the
graph, otherwise it will not be used.
"""
......@@ -2773,7 +2775,6 @@ class Canonizer(gof.LocalOptimizer):
if op not in [self.main, self.inverse, self.reciprocal]:
return False
inputs = node.inputs
out = node.outputs[0]
assert len(node.outputs) == 1
......@@ -2934,7 +2935,6 @@ def local_sum_div_dimshuffle(node):
axis = range(node.inputs[0].ndim)
#print 'axis =', axis
thing_summed = node.inputs[0]
dimshuffled = None
if thing_summed.owner and thing_summed.owner.op == T.true_div:
numerator, denominator = thing_summed.owner.inputs
......@@ -3035,11 +3035,13 @@ def local_sum_sum(node):
if summed.owner.op.axis is None:
# special case of local_cut_useless_reduce
return [T.Sum(None, dtype=out_dtype)(summed.owner.inputs[0])]
return [T.Sum(None, dtype=out_dtype)(
summed.owner.inputs[0])]
if node.op.axis is None:
# we're summing up everything anyway so let's
# do it all at once
return [T.Sum(None, dtype=out_dtype)(summed.owner.inputs[0])]
return [T.Sum(None, dtype=out_dtype)(
summed.owner.inputs[0])]
newaxis = list(tuple(summed.owner.op.axis))
# figure out which dimensions of the original input
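# A quick numeric check of the rewrite local_sum_sum applies when the outer
# sum reduces over everything: sum(sum(x, axis=a)) == sum(x), so the nested
# reductions collapse into a single Sum over all axes.
import numpy

x = numpy.arange(12).reshape(3, 4)
assert numpy.sum(numpy.sum(x, axis=0)) == numpy.sum(x)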
......@@ -3113,7 +3115,7 @@ def local_sum_alloc(node):
assert val.size == 1
val = val.reshape(1)[0] * T.mul(*shapes)
return [T.cast(val, dtype=node.outputs[0].dtype)]
except TypeError, e:
except TypeError:
pass
else:
try:
......@@ -3127,7 +3129,7 @@ def local_sum_alloc(node):
return [T.alloc(T.cast(val, dtype=node.outputs[0].dtype),
*[shapes[i] for i in xrange(len(shapes))
if i not in node.op.axis])]
except TypeError, e:
except TypeError:
pass
......@@ -4433,7 +4435,6 @@ def local_elemwise_fusion_op(OP, max_input_fct=lambda node: 1024):
fusion optimization. We skip this optimization. You can ignore this message,
your code will run correctly, but may be slower.""")
otype = node.outputs[0].type
s_new_out = node.op.scalar_op(*s_g)
try:
s_new_out.owner.op.c_code(s_new_out.owner,
......@@ -4509,7 +4510,7 @@ class FusionOptimizer(Optimizer):
zip(node.outputs, new_outputs),
reason=self.__class__.__name__)
did_something = True
except InconsistencyError, e:
except InconsistencyError:
pass
if config.tensor.local_elemwise_fusion:
......