merge

ed9143d0 · James Bergstra · b0cfc18d · 2125a099 · ed9143d0 · ed9143d0
--- a/theano/compile/debugmode.py
+++ b/theano/compile/debugmode.py
@@ -219,17 +219,17 @@ class BadDestroyMap(DebugModeError):
        self.new_val = new_val
    def __str__(self):
-        npy_old_val = numpy.asarray(self.old_val)
+        sio = StringIO()
-        npy_new_val = numpy.asarray(self.new_val)
+        print >> sio, "  node:", self.node
+        print >> sio, "  node.inputs:", [(str(i), id(i)) for i in self.node.inputs]
+        print >> sio, "  destroy_map:", getattr(self.node.op, 'destroy_map', {})
+        print >> sio, "  changed input idx:", self.idx
+        print >> sio, "  changed input type:", self.node.inputs[self.idx].type
+        print >> sio, "  repr (old val):", repr(self.old_val)
+        print >> sio, "  repr (new val):", repr(self.new_val)
        try:
-            sio = StringIO()
+            npy_old_val = numpy.asarray(self.old_val)
-            print >> sio, "  node:", self.node
+            npy_new_val = numpy.asarray(self.new_val)
-            print >> sio, "  node.inputs:", [(str(i), id(i)) for i in self.node.inputs]
-            print >> sio, "  destroy_map:", getattr(self.node.op, 'destroy_map', {})
-            print >> sio, "  changed input idx:", self.idx
-            print >> sio, "  changed input type:", self.node.inputs[self.idx].type
-            print >> sio, "  repr (old val):", repr(self.old_val)
-            print >> sio, "  repr (new val):", repr(self.new_val)
            print >> sio, "  value dtype (new <space> old):", npy_new_val.dtype, npy_old_val.dtype
            print >> sio, "  value shape (new <space> old):", npy_new_val.shape, npy_old_val.shape
            print >> sio, "  value min (new <space> old):", npy_new_val.min(), npy_old_val.min()
@@ -237,10 +237,10 @@ class BadDestroyMap(DebugModeError):
            print >> sio, "  value min (new-old):", (npy_new_val-npy_old_val).min()
            print >> sio, "  value max (new-old):", (npy_new_val-npy_old_val).max()
            print >> sio, ""
-            print >> sio, "  Hint: this can also be caused by a deficient values_eq_approx() or __eq__() implementation [which compared input values]"
-            return sio.getvalue()
        except Exception, e:
-            return str(e)
+            print >> sio, "(Numpy-hints failed with: %s)" %str(e)
+        print >> sio, "  Hint: this can also be caused by a deficient values_eq_approx() or __eq__() implementation [which compared input values]"
+        return sio.getvalue()
 class BadViewMap(DebugModeError):
    """Exception: Some perform() or c_code() created a memory alias that wasn't in the view_map"""
@@ -868,6 +868,11 @@ class _Linker(gof.link.LocalLinker):
        return self
    def make_all(self, profiler = None, input_storage = None, output_storage = None):
+        if 1:
+            #can't import at toplevel because of circular import
+            # TODO: don't do this ugly hacky way of setting the filter_checks_isfinite
+            from theano.tensor import TensorType #to set filter_check_isfinite
        env = self.env
        input_storage_ = input_storage
        output_storage_ = output_storage
@@ -932,7 +937,7 @@ class _Linker(gof.link.LocalLinker):
        # This is the function that runs when you evaluate the graph
        #####
        def f():
-            debug("starting f")
+            debug("starting a DebugMode call")
            for x in no_recycling:
                x[0] = None
@@ -1027,7 +1032,10 @@ class _Linker(gof.link.LocalLinker):
                            storage_map[r][0] = _lessbroken_deepcopy(r_vals[r])
                        debug(i, "DEBUGMODE running thunk_c")
-                        thunk_c()
+                        try:
+                            thunk_c()
+                        except:
+                            raise_with_op(node)
                        for r in node.outputs:
                            # check output values for type-correctness
@@ -1075,9 +1083,6 @@ class _Linker(gof.link.LocalLinker):
                    if True: 
                        gc.collect()
-                #except:
-                #    raise_with_op(node)
                _find_bad_optimizations(order, env.equivalence_tracker.reasons, r_vals)
                #####
@@ -1132,10 +1137,27 @@ class _Linker(gof.link.LocalLinker):
                if (r.owner is None):
                    assert storage_map[r][0] is not None
            ###############
-            # Done f
+            # Done debugmode function call 'f'
            ##############
+        def run_with_tensortype_filter_check(f):
+            def deco():
+                # WARNING: this is a global mechanism... 
+                # so it will screw up if we are trying to use
+                # multiple modes at once.
+                old_filter_checks_isfinite = TensorType.filter_checks_isfinite
+                TensorType.filter_checks_isfinite = self.maker.mode.check_isfinite
+                try:
+                    return f()
+                finally:
+                    # put back the filter_checks_isfinite
+                    TensorType.filter_checks_isfinite = old_filter_checks_isfinite
+            return deco
+        f = run_with_tensortype_filter_check(f)
        f.allow_gc = True
        assert len(env.inputs) == len(input_storage)
        assert len(env.outputs) == len(output_storage)
@@ -1170,11 +1192,6 @@ class _Maker(FunctionMaker): #inheritance buys a few helper functions
        """
-        # WARNING: this is a global mechanism... so it will screw up if we are trying to use
-        # multiple modes at once.
-        from theano.tensor import TensorType #to set filter_check_isfinite
-        TensorType.filter_checks_isfinite = mode.check_isfinite
        # Handle the case where inputs and/or outputs is a single Variable (not in a list)
        unpack_single = False
        return_none = False

--- a/theano/sparse/basic.py
+++ b/theano/sparse/basic.py
@@ -8,7 +8,6 @@ To read about different sparse formats, see U{http://www-users.cs.umn.edu/~saad/
 import sys, operator
 import numpy, theano
-from scipy import sparse
 import scipy.sparse
 from theano.printing import Print
@@ -16,6 +15,7 @@ from theano import gof
 from theano import tensor
 from theano import compile
 from theano import scalar
+from theano import config
 #TODO: move this decorator to the compile submodule
 def register_specialize(lopt, *tags, **kwargs):
@@ -23,11 +23,11 @@ def register_specialize(lopt, *tags, **kwargs):
 """ Types of sparse matrices to use for testing """
-_mtypes = [sparse.csc_matrix, sparse.csr_matrix]
+_mtypes = [scipy.sparse.csc_matrix, scipy.sparse.csr_matrix]
 #_mtypes = [sparse.csc_matrix, sparse.csr_matrix, sparse.dok_matrix, sparse.lil_matrix, sparse.coo_matrix]
 #* new class ``dia_matrix`` : the sparse DIAgonal format
 #* new class ``bsr_matrix`` : the Block CSR format
-_mtype_to_str = {sparse.csc_matrix: "csc", sparse.csr_matrix: "csr"}
+_mtype_to_str = {scipy.sparse.csc_matrix: "csc", scipy.sparse.csr_matrix: "csr"}
 def _is_sparse_variable(x):
    """
@@ -51,15 +51,15 @@ def _is_sparse(x):
    @rtype: boolean
    @return: True iff x is a L{scipy.sparse.spmatrix} (and not a L{numpy.ndarray})
    """
-    if not isinstance(x, sparse.spmatrix) and not isinstance(x, numpy.ndarray):
+    if not isinstance(x, scipy.sparse.spmatrix) and not isinstance(x, numpy.ndarray):
        raise NotImplementedError("this function should only be called on sparse.scipy.sparse.spmatrix or numpy.ndarray, not,", x)
-    return isinstance(x, sparse.spmatrix)
+    return isinstance(x, scipy.sparse.spmatrix)
 def _is_dense(x):
    """
    @rtype: boolean
    @return: True unless x is a L{scipy.sparse.spmatrix} (and not a L{numpy.ndarray})
    """
-    if not isinstance(x, sparse.spmatrix) and not isinstance(x, numpy.ndarray):
+    if not isinstance(x, scipy.sparse.spmatrix) and not isinstance(x, numpy.ndarray):
        raise NotImplementedError("this function should only be called on sparse.scipy.sparse.spmatrix or numpy.ndarray, not,", x)
    return isinstance(x, numpy.ndarray)
@@ -101,22 +101,23 @@ def as_sparse_variable(x):
 as_sparse = as_sparse_variable
 def constant(x):
-    if not isinstance(x, sparse.spmatrix):
+    if not isinstance(x, scipy.sparse.spmatrix):
        raise TypeError("sparse.constant must be called on a scipy.sparse.spmatrix")
    try:
        return SparseConstant(SparseType(format = x.format,
-                                     dtype = x.dtype), x)
+                                     dtype = x.dtype), x.copy())
    except TypeError:
        raise TypeError("Could not convert %s to SparseType" % x, type(x))
-def value(x):
+if 0:
-    if not isinstance(x, sparse.spmatrix):
+    def value(x):
-        raise TypeError("sparse.value must be called on a scipy.sparse.spmatrix")
+        if not isinstance(x, scipy.sparse.spmatrix):
-    try:
+            raise TypeError("sparse.value must be called on a scipy.sparse.spmatrix")
-        return SparseValue(SparseType(format = x.format,
+        try:
-                                  dtype = x.dtype), x)
+            return SparseValue(SparseType(format = x.format,
-    except TypeError:
+                                      dtype = x.dtype), x)
-        raise TypeError("Could not convert %s to SparseType" % x, type(x))
+        except TypeError:
+            raise TypeError("Could not convert %s to SparseType" % x, type(x))
 def sp_ones_like(x):
    data, indices, indptr, shape = csm_properties(x) #TODO: don't restrict to CSM formats
@@ -132,13 +133,13 @@ class SparseType(gof.Type):
    @note As far as I can tell, L{scipy.sparse} objects must be matrices, i.e. have dimension 2.
    """
    format_cls = {
-            'csr' : sparse.csr_matrix,
+            'csr' : scipy.sparse.csr_matrix,
-            'csc' : sparse.csc_matrix
+            'csc' : scipy.sparse.csc_matrix
            }
    dtype_set = set(['int', 'int8', 'int16','int32', 'int64', 'float32', 'float64', 'complex64','complex128'])
    ndim = 2
-    def __init__(self, format, dtype = 'float64'):
+    def __init__(self, format, dtype):
        """
        Fundamental way to create a sparse node.
        @param dtype:   Type of numbers in the matrix.
@@ -187,16 +188,31 @@ class SparseType(gof.Type):
        return "Sparse[%s, %s]" % (str(self.dtype), str(self.format))
    def values_eq_approx(self, a, b, eps=1e-6):
-#        print "VEA", a, b, scipy.sparse.issparse(a), scipy.sparse.issparse(b), abs(a-b).sum(), abs(a-b).sum() < (1e-6 * a.nnz)
+        #WARNING: equality comparison of sparse matrices is not fast or easy
+        # we definitely do not want to be doing this un-necessarily during
+        # a FAST_RUN computation..
        return scipy.sparse.issparse(a) \
                and scipy.sparse.issparse(b) \
                and abs(a-b).sum() < (1e-6 * a.nnz)
+    def values_eq(self, a, b):
+        #WARNING: equality comparison of sparse matrices is not fast or easy
+        # we definitely do not want to be doing this un-necessarily during
+        # a FAST_RUN computation..
+        return scipy.sparse.issparse(a) \
+                and scipy.sparse.issparse(b) \
+                and abs(a-b).sum() == 0.0
    def is_valid_value(self, a):
        return scipy.sparse.issparse(a) and (a.format == self.format)
-csc_matrix = SparseType(format='csc')
+# for more dtypes, call SparseType(format, dtype)
-csr_matrix = SparseType(format='csr')
+csc_matrix = SparseType(format='csc', dtype=config.floatX)
+csr_matrix = SparseType(format='csr', dtype=config.floatX)
+csc_dmatrix = SparseType(format='csc', dtype='float64')
+csr_dmatrix = SparseType(format='csr', dtype='float64')
+csc_fmatrix = SparseType(format='csc', dtype='float32')
+csr_fmatrix = SparseType(format='csr', dtype='float32')
 class _sparse_py_operators:
    T = property(lambda self: transpose(self), doc = "Return aliased transpose of self (read-only)")
@@ -270,9 +286,11 @@ class CSMProperties(gof.Op):
    def perform(self, node, (csm,), out):
        if self.kmap is None:
-          out[0][0] = csm.data
+            out[0][0] = csm.data
        else:
-          out[0][0] = csm.data[self.kmap]
+            out[0][0] = csm.data[self.kmap]
+        if str(csm.data.dtype) == 'int32':
+            out[0][0] = theano._asarray(out[0][0], dtype='int32')
        #backport
        #out[0][0] = csm.data if self.kmap is None else csm.data[self.kmap]
        out[1][0] = theano._asarray(csm.indices, dtype='int32')
@@ -377,13 +395,13 @@ class CSM(gof.Op):
                     'as indices (shape'+`indices.shape`+') or elements as kmap ('+`numpy.size(self.kmap)`+')'
            raise ValueError(errmsg)
        if self.format == 'csc':
-            out[0] = sparse.csc_matrix((data, indices.copy(), indptr.copy()), 
+            out[0] = scipy.sparse.csc_matrix((data, indices.copy(), indptr.copy()), 
                    numpy.asarray(shape),
                    copy = False #1000*len(data.flatten())
                    )
        else:
            assert self.format == 'csr'
-            out[0] = sparse.csr_matrix((data, indices.copy(), indptr.copy()), 
+            out[0] = scipy.sparse.csr_matrix((data, indices.copy(), indptr.copy()), 
                    shape.copy(),
                    copy = False #1000*len(data.flatten())
                    )
@@ -546,7 +564,6 @@ class AddSS(gof.op.Op):
        if x.type.dtype != y.type.dtype:
            raise NotImplementedError()
        if x.type.format != y.type.format:
-            print x.type.format, y.type.format
            raise NotImplementedError()
        return gof.Apply(self,
                         [x, y],
@@ -795,11 +812,11 @@ class StructuredDotCSC(gof.Op):
        return r
    def perform(self, node, (a_val, a_ind, a_ptr, a_nrows, b), (out,)):
-        a = sparse.csc_matrix((a_val, a_ind, a_ptr), 
+        a = scipy.sparse.csc_matrix((a_val, a_ind, a_ptr), 
                (a_nrows, b.shape[0]),
                copy = False)
        #out[0] = a.dot(b)
-        out[0] = a * b
+        out[0] = theano._asarray(a * b, dtype=node.outputs[0].type.dtype)
        assert _is_dense(out[0]) # scipy 0.7 automatically converts to dense
    def c_code(self, node, name, (a_val, a_ind, a_ptr, a_nrows, b), (z,), sub):
@@ -952,7 +969,7 @@ class StructuredDotCSR(gof.Op):
        return r
    def perform(self, node, (a_val, a_ind, a_ptr, b), (out,)):
-        a = sparse.csr_matrix((a_val, a_ind, a_ptr), 
+        a = scipy.sparse.csr_matrix((a_val, a_ind, a_ptr), 
                (len(a_ptr)-1, b.shape[0]),
                copy = True) #use view_map before setting this to False
        #out[0] = a.dot(b)

--- a/theano/sparse/tests/test_basic.py
+++ b/theano/sparse/tests/test_basic.py
--- a/theano/tensor/basic.py
+++ b/theano/tensor/basic.py
@@ -237,7 +237,7 @@ def constant_or_value(x, rtype, name=None, ndim=None, dtype=None):
                x_shape = None
            return rtype(
                    TensorType(dtype = x_.dtype, broadcastable = bcastable, shape=x_shape),
-                    x_, name=name)
+                    x_.copy(), name=name)
        else:
            # leave the shape out of the type
            return rtype(TensorType(dtype = x_.dtype, broadcastable = bcastable), x_, name=name)