merged

9c4c58ad · Ian Goodfellow · e731582c · 4befd3b9 · 9c4c58ad · 9c4c58ad
--- a/theano/scalar/basic.py
+++ b/theano/scalar/basic.py
@@ -821,9 +821,9 @@ class BinaryBitOp(BinaryScalarOp):
        return [None, None]
 class OR(BinaryBitOp):
-    identity = False
+    identity = 0
    commutative = True
-    associative = False
+    associative = True
    def impl(self, x, y):
        return x | y
    def c_code(self, node, name, (x, y), (z, ), sub):
@@ -831,9 +831,9 @@ class OR(BinaryBitOp):
 or_ = OR()
 class XOR(BinaryBitOp):
-    identity = False
+    identity = 0
    commutative = True
-    associative = False
+    associative = True
    def impl(self, x, y):
        return x ^ y
    def c_code(self, node, name, (x, y), (z, ), sub):
@@ -841,9 +841,9 @@ class XOR(BinaryBitOp):
 xor = XOR()
 class AND(BinaryBitOp):
-    identity = False
+    identity = 1
    commutative = True
-    associative = False
+    associative = True
    def impl(self, x, y):
        return x & y
    def c_code(self, node, name, (x, y), (z, ), sub):
@@ -851,7 +851,6 @@ class AND(BinaryBitOp):
 and_ = AND()
 class Invert(UnaryBitOp):
-    identity = False
    def impl(self, x):
        return ~x
    def c_code(self, node, name, (x,), (z, ), sub):

--- a/theano/scan_module/scan_op.py
+++ b/theano/scan_module/scan_op.py
@@ -1063,13 +1063,16 @@ def profile_printer(fct_name, compile_time, fct_call_time, fct_call,
        total_scan_op_time = 0
        for (_,node),v in apply_time.items():
            if isinstance(node.op, Scan):
-                scan_fct_time = node.op.mode_instance.fn_time
+                if v> 0:
-                scan_op_time = sum(node.op.mode_instance.local_time)
+                    scan_fct_time = node.op.mode_instance.fn_time
-                total_super_scan_time += v
+                    scan_op_time = sum(node.op.mode_instance.local_time)
-                total_scan_fct_time += scan_fct_time
+                    total_super_scan_time += v
-                total_scan_op_time += scan_op_time
+                    total_scan_fct_time += scan_fct_time
-                print '    %5.1fs  %5.1fs  %5.1fs  %5.1f%%  %5.1f%%'%(
+                    total_scan_op_time += scan_op_time
-                    v, scan_fct_time, scan_op_time, scan_fct_time/v*100,
+                    print '    %5.1fs  %5.1fs  %5.1fs  %5.1f%%  %5.1f%%'%(
-                    scan_op_time/v*100), node
+                        v, scan_fct_time, scan_op_time, scan_fct_time/v*100,
+                        scan_op_time/v*100), node
+                else:
+                    print ' The node took 0s, so we can not compute the overhead'
        print '    total %5.1fs  %5.1fs  %5.1fs  %5.1f%%  %5.1f%%'%(
            total_super_scan_time, total_scan_fct_time, total_scan_op_time, total_scan_fct_time/total_super_scan_time*100, total_scan_op_time/total_super_scan_time*100)
--- a/theano/tensor/basic.py
+++ b/theano/tensor/basic.py
@@ -1299,7 +1299,11 @@ class TensorConstant(_tensor_py_operators, Constant):
    To create a TensorConstant, use the `constant` function in this module.
    """
    def __str__(self):
-        return "TensorConstant{%s}" % self.data
+        name = "%s"%self.data
+        if len(name) > 20:
+            name = name[:10]+".."+name[-10:]
+        return "TensorConstant{%s}" % name
    def signature(self):
        return TensorConstantSignature((self.type, self.data))

--- a/theano/tensor/tests/test_elemwise.py
+++ b/theano/tensor/tests/test_elemwise.py
@@ -172,7 +172,7 @@ class test_CAReduce(unittest.TestCase):
    def setUp(self):
        unittest_tools.seed_rng()
-    def with_linker(self, linker, scalar_op = add):
+    def with_linker(self, linker, scalar_op = add, dtype="floatX"):
        for xsh, tosum in [((5, 6), None),
                           ((5, 6), (0, 1)),
                           ((5, 6), (0, )),
@@ -188,11 +188,17 @@ class test_CAReduce(unittest.TestCase):
                           ((5, 0), ()),
                           ((), None),
                           ((), ())]:
-            x = TensorType('float64', [(entry == 1) for entry in xsh])('x')
+            if dtype == "floatX":
+                dtype = theano.config.floatX
+            x = TensorType(dtype, [(entry == 1) for entry in xsh])('x')
            e = CAReduce(scalar_op, axis = tosum)(x)
            if tosum is None: tosum = range(len(xsh))
            f = copy(linker).accept(Env([x], [e])).make_function()
            xv = numpy.asarray(numpy.random.rand(*xsh))
+            if dtype.startswith('float'):
+                xv = numpy.asarray(xv,dtype=dtype)
+            else:
+                xv = numpy.asarray(xv<0.5,dtype=dtype)
            zv = xv
            numpy_raised = False
            if len(tosum)>1 and any([a<0 for a in tosum]):
@@ -224,10 +230,17 @@ class test_CAReduce(unittest.TestCase):
                    numpy_raised=True
            elif scalar_op == or_:
                for axis in reversed(sorted(tosum)):
-                    zv = numpy.any(zv, axis)
+                    zv = numpy.bitwise_or.reduce(zv, axis)
            elif scalar_op == and_:
                for axis in reversed(sorted(tosum)):
-                    zv = numpy.all(zv, axis)
+                    zv = numpy.bitwise_and.reduce(zv, axis)
+            elif scalar_op == xor:
+                # There is no identity value for the xor function
+                # So we can't support shape of dimensions 0.
+                if numpy.prod(zv.shape)==0:
+                    continue
+                for axis in reversed(sorted(tosum)):
+                    zv = numpy.bitwise_xor.reduce(zv, axis)
            else:
                raise Exception("Test for CAReduce with scalar_op %s not implemented"%str(scalar_op))
            if scalar_op in [maximum,minimum] and numpy_raised:
@@ -238,13 +251,16 @@ class test_CAReduce(unittest.TestCase):
                else:
                    self.fail()
            else:
+                #numpy.{all,any} return bool type.
+                if scalar_op in [and_, or_]:
+                    zv = numpy.asarray(zv, dtype=dtype)
                self.assertTrue((numpy.abs(f(xv) - zv) < 1e-10).all())
            #test CAReduce.infer_shape
            #the Shape op don't implement c_code!
            if isinstance(linker,gof.PerformLinker):
-                x = TensorType('float64', [(entry == 1) for entry in xsh])('x')
+                x = TensorType(dtype, [(entry == 1) for entry in xsh])('x')
                e = CAReduce(scalar_op, axis = tosum)(x)
                if tosum is None: tosum = range(len(xsh))
                f = copy(linker).accept(Env([x], [e.shape])).make_function()
@@ -256,20 +272,18 @@ class test_CAReduce(unittest.TestCase):
        self.with_linker(gof.PerformLinker(), mul)
        self.with_linker(gof.PerformLinker(), maximum)
        self.with_linker(gof.PerformLinker(), minimum)
-        #need other dtype then real
+        self.with_linker(gof.PerformLinker(), or_, dtype='int8')
-        #self.with_linker(gof.PerformLinker(), or_)
+        self.with_linker(gof.PerformLinker(), and_, dtype='int8')
-        #self.with_linker(gof.PerformLinker(), and_)
+        self.with_linker(gof.PerformLinker(), xor, dtype='int8')
    def test_c(self):
        self.with_linker(gof.CLinker(), add)
        self.with_linker(gof.CLinker(), mul)
        self.with_linker(gof.CLinker(), maximum)
        self.with_linker(gof.CLinker(), minimum)
+        self.with_linker(gof.CLinker(), or_, dtype='int8')
-        #need other dtype then real
+        self.with_linker(gof.CLinker(), and_, dtype='int8')
-        #no c_code for or_, and_
+        self.with_linker(gof.CLinker(), xor, dtype='int8')
-        #self.with_linker(gof.CLinker(), or_)
-        #self.with_linker(gof.CLinker(), and_)
 class test_Prod(unittest.TestCase):