Commit ded60972, authored by nouiz

Merge pull request #712 from bouchnic/sparse_opt

fix gh-363 Move optimization from basic.py to opt.py.
...@@ -912,17 +912,11 @@ class CSMGradC(gof.Op): ...@@ -912,17 +912,11 @@ class CSMGradC(gof.Op):
return (3,) return (3,)
csm_grad_c = CSMGradC() csm_grad_c = CSMGradC()
@gof.local_optimizer([csm_grad(None)])
def local_csm_grad_c(node):
    """Replace the python CSMGrad op with its C implementation.

    csm_grad(None) -> csm_grad_c
    """
    if node.op != csm_grad(None):
        return False
    return [csm_grad_c(*node.inputs)]
register_specialize(local_csm_grad_c)
# #
# Conversion # Conversion
# #
class DenseFromSparse(gof.op.Op): class DenseFromSparse(gof.op.Op):
""" """
Convert a sparse matrix to an `ndarray`. Convert a sparse matrix to an `ndarray`.
...@@ -1960,28 +1954,6 @@ class StructuredDotCSR(gof.Op): ...@@ -1960,28 +1954,6 @@ class StructuredDotCSR(gof.Op):
sd_csr = StructuredDotCSR() sd_csr = StructuredDotCSR()
# Specialization rewriting StructuredDot into the format-specific
# StructuredDotCSC / StructuredDotCSR ops.
@gof.local_optimizer([_structured_dot])
def local_structured_dot(node):
    if node.op != _structured_dot:
        return False
    a, b = node.inputs
    fmt = a.type.format
    if fmt == 'csc':
        a_val, a_ind, a_ptr, a_shape = csm_properties(a)
        # sd_csc additionally needs the number of sparse rows.
        return [sd_csc(a_val, a_ind, a_ptr, a_shape[0], b)]
    if fmt == 'csr':
        a_val, a_ind, a_ptr, a_shape = csm_properties(a)
        return [sd_csr(a_val, a_ind, a_ptr, b)]
    return False
# Commented out because
# a) it is only slightly faster than scipy these days, and sometimes a little
# slower, and
# b) the resulting graphs make it very difficult for an op to do size checking
# on the matrices involved. dimension mismatches are hard to detect sensibly.
#register_specialize(local_structured_dot)
def structured_dot_grad(sparse_A, dense_B, ga): def structured_dot_grad(sparse_A, dense_B, ga):
if sparse_A.type.format in ('csc', 'csr'): if sparse_A.type.format in ('csc', 'csr'):
...@@ -2648,49 +2620,3 @@ class UsmmCscDense(gof.Op): ...@@ -2648,49 +2620,3 @@ class UsmmCscDense(gof.Op):
usmm_csc_dense = UsmmCscDense(inplace=False) usmm_csc_dense = UsmmCscDense(inplace=False)
usmm_csc_dense_inplace = UsmmCscDense(inplace=True) usmm_csc_dense_inplace = UsmmCscDense(inplace=True)
# Fuse ``z - alpha * dot(x, y)`` into a single usmm node; alpha is
# constrained to a fully-broadcastable (scalar-like) tensor.
_usmm_in_pattern = (tensor.sub, 'z',
                    (tensor.mul,
                     {'pattern': 'alpha',
                      'constraint':
                          lambda expr: numpy.all(expr.type.broadcastable)},
                     (_dot, 'x', 'y')))
_usmm_out_pattern = (usmm, (tensor.neg, 'alpha'), 'x', 'y', 'z')
local_usmm = gof.opt.PatternSub(_usmm_in_pattern, _usmm_out_pattern)
register_specialize(local_usmm, name="local_usmm")
@gof.local_optimizer([usmm])
def local_usmm_csx(node):
    """ usmm -> usmm_csc_dense

    Applies only when x is a csc sparse variable and y is dense, and
    the upcast dtype is float32/float64 with y already at that dtype
    (sparse cast is not implemented).
    """
    if node.op != usmm:
        return False
    alpha, x, y, z = node.inputs
    if not _is_sparse_variable(x) or _is_sparse_variable(y):
        return False
    if x.type.format == 'csc':
        x_val, x_ind, x_ptr, x_shape = csm_properties(x)
        dtype_out = scalar.upcast(alpha.type.dtype, x.type.dtype,
                                  y.type.dtype, z.type.dtype)
        if dtype_out not in ('float32', 'float64'):
            return False
        # Sparse cast is not implemented.
        if y.type.dtype != dtype_out:
            return False
        return [usmm_csc_dense(alpha, x_val, x_ind, x_ptr,
                               x_shape[0], y, z)]
    return False
register_specialize(local_usmm_csx)
@gof.local_optimizer([usmm_csc_dense])
def local_usmm_csc_dense_inplace(node):
    """Swap usmm_csc_dense for its destructive (inplace) variant."""
    if node.op != usmm_csc_dense:
        return
    return [usmm_csc_dense_inplace(*node.inputs)]
register_specialize(local_usmm_csc_dense_inplace, 'inplace')
from itertools import izip from itertools import izip
import theano import theano
from theano import gof import numpy
from theano import gof, scalar
from theano.sparse import (CSC, CSR, csm_properties, Remove0, from theano.sparse import (CSC, CSR, csm_properties, Remove0,
register_specialize) register_specialize,
csm_grad, csm_grad_c,
usmm_csc_dense, usmm)
from basic import (_structured_dot, _dot,
_is_sparse_variable, usmm_csc_dense_inplace)
@gof.local_optimizer([None])
def local_inplace_remove0(node): # This is tested in tests/test_basic.py:UsmmTests
""" local_usmm = gof.opt.PatternSub(
Optimization to insert inplace versions of Remove0. (theano.tensor.sub, 'z',
""" (theano.tensor.mul,
if isinstance(node.op, Remove0) and not node.op.inplace: {'pattern': 'alpha',
new_op = node.op.__class__(inplace=True) 'constraint': lambda expr: numpy.all(expr.type.broadcastable)},
new_node = new_op(*node.inputs) (_dot, 'x', 'y'))),
return [new_node] (usmm, (theano.tensor.neg, 'alpha'), 'x', 'y', 'z'))
register_specialize(local_usmm, name="local_usmm")
# This is tested in tests/test_opt.py:test_local_csm_grad_c
@gof.local_optimizer([csm_grad(None)])
def local_csm_grad_c(node):
""" csm_grad(None) -> csm_grad_c """
if node.op == csm_grad(None):
return [csm_grad_c(*node.inputs)]
return False return False
theano.compile.optdb.register('local_inplace_remove0', register_specialize(local_csm_grad_c)
gof.TopoOptimizer(local_inplace_remove0,
failure_callback=gof.TopoOptimizer.warn_inplace),
60, 'fast_run', 'inplace')
# This is tested in tests/test_opt.py:test_local_csm_properties_csm
@gof.local_optimizer([csm_properties]) @gof.local_optimizer([csm_properties])
def local_csm_properties_csm(node): def local_csm_properties_csm(node):
"""if we find csm_properties(CSM(*args)), then we can replace that with the """if we find csm_properties(CSM(*args)), then we can replace that with the
...@@ -37,3 +49,79 @@ def local_csm_properties_csm(node): ...@@ -37,3 +49,79 @@ def local_csm_properties_csm(node):
return False return False
register_specialize(local_csm_properties_csm) register_specialize(local_csm_properties_csm)
# This is tested in tests/test_basic.py:test_remove0
@gof.local_optimizer([None])
def local_inplace_remove0(node):
    """
    Optimization to insert inplace versions of Remove0.
    """
    op = node.op
    if not isinstance(op, Remove0) or op.inplace:
        return False
    inplace_op = op.__class__(inplace=True)
    return [inplace_op(*node.inputs)]
theano.compile.optdb.register(
    'local_inplace_remove0',
    gof.TopoOptimizer(local_inplace_remove0,
                      failure_callback=gof.TopoOptimizer.warn_inplace),
    60, 'fast_run', 'inplace')
# register a specialization to replace StructuredDot -> StructuredDotCSx
# This is tested in tests/test_basic.py:792
@gof.local_optimizer([_structured_dot])
def local_structured_dot(node):
    if node.op != _structured_dot:
        return False
    a, b = node.inputs
    fmt = a.type.format
    if fmt == 'csc':
        a_val, a_ind, a_ptr, a_shape = csm_properties(a)
        # sd_csc additionally needs the number of sparse rows.
        return [sd_csc(a_val, a_ind, a_ptr, a_shape[0], b)]
    if fmt == 'csr':
        a_val, a_ind, a_ptr, a_shape = csm_properties(a)
        return [sd_csr(a_val, a_ind, a_ptr, b)]
    return False
# Commented out because
# a) it is only slightly faster than scipy these days, and sometimes a little
# slower, and
# b) the resulting graphs make it very difficult for an op to do size checking
# on the matrices involved. dimension mismatches are hard to detect sensibly.
#register_specialize(local_structured_dot)
# This is tested in tests/test_basic.py:UsmmTests
@gof.local_optimizer([usmm_csc_dense])
def local_usmm_csc_dense_inplace(node):
    """Swap usmm_csc_dense for its destructive (inplace) variant."""
    if node.op != usmm_csc_dense:
        return
    return [usmm_csc_dense_inplace(*node.inputs)]
register_specialize(local_usmm_csc_dense_inplace, 'inplace')
# This is tested in tests/test_basic.py:UsmmTests
@gof.local_optimizer([usmm])
def local_usmm_csx(node):
    """ usmm -> usmm_csc_dense

    Applies only when x is a csc sparse variable and y is dense, and
    the upcast dtype is float32/float64 with y already at that dtype
    (sparse cast is not implemented).
    """
    if node.op != usmm:
        return False
    alpha, x, y, z = node.inputs
    if not _is_sparse_variable(x) or _is_sparse_variable(y):
        return False
    if x.type.format == 'csc':
        x_val, x_ind, x_ptr, x_shape = csm_properties(x)
        dtype_out = scalar.upcast(alpha.type.dtype, x.type.dtype,
                                  y.type.dtype, z.type.dtype)
        if dtype_out not in ('float32', 'float64'):
            return False
        # Sparse cast is not implemented.
        if y.type.dtype != dtype_out:
            return False
        return [usmm_csc_dense(alpha, x_val, x_ind, x_ptr,
                               x_shape[0], y, z)]
    return False
register_specialize(local_usmm_csx)
...@@ -13,7 +13,14 @@ from theano.sparse.basic import ( ...@@ -13,7 +13,14 @@ from theano.sparse.basic import (
_is_sparse) _is_sparse)
from theano.sparse.sandbox.sp import sp_sum from theano.sparse.sandbox.sp import sp_sum
class Cast(gof.op.Op): class Cast(gof.op.Op):
"""Cast sparse variable to the desired dtype.
    This wraps the ``astype`` method from scipy.
"""
# It returns a new matrix, not a view.
def __init__(self, out_type): def __init__(self, out_type):
self.out_type = out_type self.out_type = out_type
......
...@@ -12,7 +12,8 @@ from theano.gof.python25 import any ...@@ -12,7 +12,8 @@ from theano.gof.python25 import any
if not enable_sparse: if not enable_sparse:
raise SkipTest('Optional package sparse disabled') raise SkipTest('Optional package sparse disabled')
from theano.sparse import CSM, CSMProperties, csm_properties, CSC, CSR from theano.sparse import (CSM, CSMProperties, csm_properties, CSC, CSR,
DenseFromSparse, CSMGrad)
from theano.sparse.tests.test_basic import random_lil from theano.sparse.tests.test_basic import random_lil
...@@ -32,3 +33,22 @@ def test_local_csm_properties_csm(): ...@@ -32,3 +33,22 @@ def test_local_csm_properties_csm():
v = cast(random_lil((10, 40), v = cast(random_lil((10, 40),
config.floatX, 3)) config.floatX, 3))
f(v.data, v.indices, v.indptr, v.shape) f(v.data, v.indices, v.indptr, v.shape)
def test_local_csm_grad_c():
    """Check that specialize replaces CSMGrad by its C implementation."""
    data = tensor.vector()
    indices = tensor.ivector()
    indptr = tensor.ivector()
    shape = tensor.ivector()
    mode = theano.compile.mode.get_default_mode().including(
        "specialize", "local_csm_grad_c")
    for CS, cast in [(CSC, sp.csc_matrix), (CSR, sp.csr_matrix)]:
        cost = tensor.sum(DenseFromSparse()(CS(data, indices, indptr, shape)))
        f = theano.function([data, indices, indptr, shape],
                            tensor.grad(cost, data),
                            mode=mode)
        # No python CSMGrad node may remain in the optimized graph.
        assert not any(isinstance(node.op, CSMGrad)
                       for node in f.maker.env.toposort())
        v = cast(random_lil((10, 40), config.floatX, 3))
        f(v.data, v.indices, v.indptr, v.shape)
Markdown 格式
0%
您添加了 0 到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 后发表评论