提交 91f08497 authored 作者: Pascal Lamblin's avatar Pascal Lamblin

Merge pull request #3731 from nouiz/gpualloc_empty

Lift GpuAllocEmpty in the new GPU back-end.
...@@ -779,6 +779,17 @@ class Op(utils.object2, PureOp, CLinkerOp): ...@@ -779,6 +779,17 @@ class Op(utils.object2, PureOp, CLinkerOp):
def _props(self): def _props(self):
return tuple(getattr(self, a) for a in self.__props__) return tuple(getattr(self, a) for a in self.__props__)
def _props_dict(self):
"""This return a dict of all ``__props__`` key-> value.
This is useful in optimization to swap op that should have the
same props. This help detect error that the new op have at
least all the original props.
"""
return dict([(a, getattr(self, a))
for a in self.__props__])
def __hash__(self): def __hash__(self):
if hasattr(self, '__props__'): if hasattr(self, '__props__'):
return hash((type(self), self._props())) return hash((type(self), self._props()))
......
from __future__ import print_function from __future__ import print_function
from itertools import count
import pickle import pickle
import unittest import unittest
import numpy
from itertools import count
from nose.plugins.skip import SkipTest
import numpy
from theano import ( from theano import (
sparse, sparse,
...@@ -361,6 +362,8 @@ class TestAutoName: ...@@ -361,6 +362,8 @@ class TestAutoName:
def test_sparsevariable(self): def test_sparsevariable(self):
# Get counter value # Get counter value
if not sparse.enable_sparse:
raise SkipTest('Optional package SciPy not installed')
autoname_id = next(Variable.__count__) autoname_id = next(Variable.__count__)
Variable.__count__ = count(autoname_id) Variable.__count__ = count(autoname_id)
r1 = sparse.csc_matrix(name='x', dtype='float32') r1 = sparse.csc_matrix(name='x', dtype='float32')
......
...@@ -323,7 +323,7 @@ def test_opt_gpujoin_joinvectors_elemwise_then_minusone(): ...@@ -323,7 +323,7 @@ def test_opt_gpujoin_joinvectors_elemwise_then_minusone():
assert isinstance(graph_nodes[-2].op, cuda.GpuSubtensor) assert isinstance(graph_nodes[-2].op, cuda.GpuSubtensor)
assert isinstance(graph_nodes[-3].op, cuda.GpuJoin) assert isinstance(graph_nodes[-3].op, cuda.GpuJoin)
concat = numpy.concatenate([numpy.cos(_a), numpy.sin(_b)], axis=1) concat = numpy.concatenate([numpy.cos(_a), numpy.sin(_b)], axis=0)
concat = concat[:-1] concat = concat[:-1]
assert numpy.allclose(numpy.asarray(f()), concat) assert numpy.allclose(numpy.asarray(f()), concat)
......
...@@ -273,6 +273,15 @@ def local_gpuaalloc(node, context_name): ...@@ -273,6 +273,15 @@ def local_gpuaalloc(node, context_name):
return GpuAlloc(context_name)(*node.inputs) return GpuAlloc(context_name)(*node.inputs)
@register_opt('fast_compile')
@op_lifter([tensor.AllocEmpty])
def local_gpuaallocempty(node, context_name):
    """Lift a CPU AllocEmpty node to GpuAllocEmpty on the target context."""
    # Forward every CPU-op prop to the GPU op via _props_dict() so the
    # lifted op is guaranteed to know all props of the original op.
    cpu_props = node.op._props_dict()
    gpu_op = GpuAllocEmpty(context_name=context_name, **cpu_props)
    return gpu_op(*node.inputs)
@register_opt() @register_opt()
@local_optimizer([GpuAlloc]) @local_optimizer([GpuAlloc])
def local_gpualloc_memset_0(node): def local_gpualloc_memset_0(node):
......
...@@ -9,7 +9,8 @@ from theano.tensor.tests import test_basic ...@@ -9,7 +9,8 @@ from theano.tensor.tests import test_basic
import theano.sandbox.gpuarray import theano.sandbox.gpuarray
from .. import basic_ops from .. import basic_ops
from ..type import GpuArrayType, gpuarray_shared_constructor, get_context from ..type import GpuArrayType, gpuarray_shared_constructor, get_context
from ..basic_ops import GpuAlloc, GpuReshape, GpuFromHost, host_from_gpu from ..basic_ops import (
GpuAlloc, GpuAllocEmpty, GpuReshape, GpuFromHost, host_from_gpu)
from ..elemwise import GpuCAReduceCuda, GpuCAReduceCPY, GpuElemwise from ..elemwise import GpuCAReduceCuda, GpuCAReduceCPY, GpuElemwise
from ..subtensor import GpuSubtensor from ..subtensor import GpuSubtensor
...@@ -151,6 +152,29 @@ def test_local_gpualloc_memset_0(): ...@@ -151,6 +152,29 @@ def test_local_gpualloc_memset_0():
assert (numpy.asarray(f(2)) == 1).all() assert (numpy.asarray(f(2)) == 1).all()
def test_local_gpualloc_empty():
    """Check that CPU AllocEmpty nodes are lifted to GpuAllocEmpty.

    Compiles a vector and a matrix AllocEmpty graph in GPU mode and
    verifies the optimized graph contains a GpuAllocEmpty node.
    """
    i = theano.tensor.iscalar()
    ii = theano.tensor.iscalar()
    # Test with vector
    a = tensor.AllocEmpty('float32')(i)
    f = theano.function([i], a, mode=mode_with_gpu)
    topo = f.maker.fgraph.toposort()
    # Expect exactly GpuAllocEmpty followed by a host transfer.
    assert len(topo) == 2
    assert isinstance(topo[0].op, GpuAllocEmpty)
    # AllocEmpty returns uninitialized data, so we can only check the shape.
    assert f(3).shape == (3,)
    # Test with matrix
    a = tensor.AllocEmpty('float32')(i, ii)
    f = theano.function([i, ii], a, mode=mode_with_gpu)
    topo = f.maker.fgraph.toposort()
    assert len(topo) == 2
    assert isinstance(topo[0].op, GpuAllocEmpty)
    # AllocEmpty returns uninitialized data, so we can only check the shape.
    assert f(3, 4).shape == (3, 4)
def test_rebroadcast(): def test_rebroadcast():
d = numpy.random.rand(10, 10).astype('float32') d = numpy.random.rand(10, 10).astype('float32')
v = theano.tensor.fmatrix() v = theano.tensor.fmatrix()
......
import unittest
import numpy import numpy
import numpy.linalg import numpy.linalg
from numpy.testing import assert_array_almost_equal
from numpy.testing import dec, assert_array_equal, assert_allclose
from numpy import inf
import theano import theano
from theano import tensor, function from theano import tensor, function
...@@ -16,35 +11,17 @@ from theano.tensor.nlinalg import MatrixInverse ...@@ -16,35 +11,17 @@ from theano.tensor.nlinalg import MatrixInverse
from theano.tensor import DimShuffle from theano.tensor import DimShuffle
# The one in comment are not tested... # The one in comment are not tested...
from theano.sandbox.linalg.ops import (cholesky, from theano.sandbox.linalg.ops import (Cholesky, # op class
Cholesky, # op class
CholeskyGrad,
matrix_inverse, matrix_inverse,
pinv,
Solve, Solve,
solve, solve,
diag,
ExtractDiag,
extract_diag,
AllocDiag,
alloc_diag,
det,
svd,
qr,
# PSD_hint, # PSD_hint,
trace,
matrix_dot,
spectral_radius_bound, spectral_radius_bound,
imported_scipy, imported_scipy,
Eig,
inv_as_solve, inv_as_solve,
norm
) )
from theano.sandbox.linalg import eig, eigh, eigvalsh
from theano.tests.unittest_tools import attr
from nose.plugins.skip import SkipTest from nose.plugins.skip import SkipTest
from nose.tools import assert_raises
def test_rop_lop(): def test_rop_lop():
...@@ -156,6 +133,8 @@ def test_transinv_to_invtrans(): ...@@ -156,6 +133,8 @@ def test_transinv_to_invtrans():
def test_tag_solve_triangular(): def test_tag_solve_triangular():
if not imported_scipy:
raise SkipTest("Scipy needed for the Cholesky op.")
cholesky_lower = Cholesky(lower=True) cholesky_lower = Cholesky(lower=True)
cholesky_upper = Cholesky(lower=False) cholesky_upper = Cholesky(lower=False)
A = tensor.matrix('A') A = tensor.matrix('A')
......
...@@ -24,6 +24,8 @@ class TestCorr2D(utt.InferShapeTester): ...@@ -24,6 +24,8 @@ class TestCorr2D(utt.InferShapeTester):
self.filters.name = 'default_filters' self.filters.name = 'default_filters'
if not conv.imported_scipy_signal and theano.config.cxx == "": if not conv.imported_scipy_signal and theano.config.cxx == "":
raise SkipTest("CorrMM tests need SciPy or a c++ compiler") raise SkipTest("CorrMM tests need SciPy or a c++ compiler")
if not theano.config.blas.ldflags:
raise SkipTest("CorrMM tests need a BLAS")
def validate(self, image_shape, filter_shape, def validate(self, image_shape, filter_shape,
border_mode='valid', subsample=(1, 1), border_mode='valid', subsample=(1, 1),
......
...@@ -67,7 +67,10 @@ class test_ifelse(unittest.TestCase, utt.TestOptimizationMixin): ...@@ -67,7 +67,10 @@ class test_ifelse(unittest.TestCase, utt.TestOptimizationMixin):
y2 = reduce(lambda x, y: x + y, [y] + list(range(200))) y2 = reduce(lambda x, y: x + y, [y] + list(range(200)))
f = theano.function([c, x, y], ifelse(c, x, y2), mode=mode) f = theano.function([c, x, y], ifelse(c, x, y2), mode=mode)
# For not inplace ifelse # For not inplace ifelse
self.assertFunctionContains1(f, IfElse(1)) ifnode = [n for n in f.maker.fgraph.toposort()
if isinstance(n.op, IfElse)]
assert len(ifnode) == 1
assert not ifnode[0].op.as_view
rng = numpy.random.RandomState(utt.fetch_seed()) rng = numpy.random.RandomState(utt.fetch_seed())
xlen = rng.randint(200) xlen = rng.randint(200)
......
Markdown 格式
0%
您添加了 0 到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 后发表评论