first commit to remove Flatten Op

eced0049 · Sina Honari · 33bda7ca · eced0049 · eced0049 · eced0049
--- a/theano/sandbox/cuda/__init__.py
+++ b/theano/sandbox/cuda/__init__.py
@@ -318,7 +318,7 @@ if cuda_available:
            GpuDimShuffle, GpuCAReduce, GpuReshape, GpuContiguous,
            GpuSubtensor, GpuIncSubtensor,
            GpuAdvancedSubtensor1, GpuAdvancedIncSubtensor1,
-            GpuFlatten, GpuShape, GpuAlloc, GpuAllocEmpty, GpuSplit,
+            gpu_flatten, GpuShape, GpuAlloc, GpuAllocEmpty, GpuSplit,
            GpuJoin, fscalar, fvector, fmatrix, frow, fcol,
            ftensor3, ftensor4,
            scalar, vector, matrix, row, col,

--- a/theano/sandbox/cuda/basic_ops.py
+++ b/theano/sandbox/cuda/basic_ops.py
@@ -3322,18 +3322,33 @@ class GpuIncSubtensor(tensor.IncSubtensor, GpuOp):
        return ()


-class GpuFlatten(gof.HideC, tensor.Flatten, GpuOp):
-    """
-    Implement Flatten on the gpu.
-
-    """
-
-    def make_node(self, x):
-        assert isinstance(x.type, CudaNdarrayType)
-        rval = tensor.Flatten.make_node(self, x)
-        host_out_broadcastable = rval.outputs[0].type.broadcastable
-        out_type = CudaNdarrayType(broadcastable=host_out_broadcastable)
-        return Apply(self, [x], [out_type()])
+#class GpuFlatten(gof.HideC, tensor.Reshape, GpuOp):
+#    """
+#    Implement Flatten on the gpu.
+#
+#    """
+#
+#    def make_node(self, x):
+#        warnings.warn(
+#            "GpuFlatten class is deprecated, "
+#            "please use gpu_flatten method instead.",
+#            DeprecationWarning,
+#            stacklevel=4)
+#        assert isinstance(x.type, CudaNdarrayType)
+#        rval = tensor.Reshape.make_node(self, x, [tensor.prod(x.shape)])
+#        host_out_broadcastable = rval.outputs[0].type.broadcastable
+#        out_type = CudaNdarrayType(broadcastable=host_out_broadcastable)
+#        return Apply(self, [x], [out_type()])
+
+
+def gpu_flatten(x, outdim=1):
+    """Reshape `x` on the GPU to `outdim` dims, merging the trailing ones."""
+    x = as_cuda_ndarray_variable(x)
+    dims = (-1,)
+    if outdim > 1:
+        dims = tuple(x.shape[:outdim - 1]) + (
+            tensor.prod(x.shape[outdim - 1:]),)
+    return GpuReshape(outdim)(x, dims)


 class GpuShape(tensor.Shape, GpuOp):

--- a/theano/sandbox/cuda/extra_ops.py
+++ b/theano/sandbox/cuda/extra_ops.py
@@ -3,7 +3,7 @@ import copy
 from theano import Op
 from theano.gof import local_optimizer
 from theano.sandbox.cuda import cuda_available, GpuOp
-from theano.sandbox.cuda.basic_ops import GpuFlatten
+from theano.sandbox.cuda.basic_ops import gpu_flatten
 from theano.tensor.extra_ops import CumsumOp

 if cuda_available:
@@ -453,7 +453,7 @@ def use_gpu_cumsum(node):
        x = gpu_from_host(x)

        if axis is None and x.ndim > 1:
-            x = GpuFlatten()(x)
+            x = gpu_flatten(x)

        # ``gpu_cumsum`` assume array has been flattened if needed.
        if axis is None:

--- a/theano/sandbox/cuda/opt.py
+++ b/theano/sandbox/cuda/opt.py
@@ -24,7 +24,9 @@ from theano.sandbox.cuda.basic_ops import (
    gpu_eye, gpu_contiguous,
    gpu_from_host, host_from_gpu, GpuFromHost, HostFromGpu,
    GpuContiguous,
-    GpuElemwise, GpuDimShuffle, GpuReshape, GpuCAReduce, GpuFlatten,
+    GpuElemwise, GpuDimShuffle, GpuReshape, GpuCAReduce,
+    # GpuFlatten,
+    gpu_flatten,
    GpuSubtensor, GpuAdvancedSubtensor1,
    GpuAdvancedIncSubtensor1, GpuAdvancedIncSubtensor1_dev20,
    GpuIncSubtensor, gpu_alloc, GpuAlloc, gpu_shape, GpuSplit, GpuAllocEmpty)
@@ -152,7 +154,7 @@ cpu_ops_moved_to_gpu = [
    tensor.elemwise.All, tensor.elemwise.Any,
    tensor.elemwise.CAReduceDtype, tensor.elemwise.Sum,
    tensor.elemwise.Prod, tensor.elemwise.ProdWithoutZeros,
-    tensor.Reshape, tensor.Flatten, tensor.Subtensor,
+    tensor.Reshape, tensor.Subtensor,
    tensor.AdvancedSubtensor1, tensor.AdvancedIncSubtensor1,
    tensor.IncSubtensor, tensor.Shape, tensor.Join,
    tensor.Alloc, tensor.Eye]
@@ -972,23 +974,23 @@ def local_gpu_reshape(node):
    return False


-@register_opt()
-@local_optimizer([gpu_from_host, tensor.Flatten])
-def local_gpu_flatten(node):
-    if isinstance(node.op, GpuFromHost):
-        host_input = node.inputs[0]
-        if host_input.owner and \
-           isinstance(host_input.owner.op, tensor.Flatten):
-            outdim = host_input.owner.op.outdim
-            return [GpuFlatten(outdim)(
-                as_cuda_ndarray_variable(host_input.owner.inputs[0]))]
-    if isinstance(node.op, tensor.Flatten):
-        x, = node.inputs
-        outdim = node.op.outdim
-        if x.owner and isinstance(x.owner.op, HostFromGpu):
-            gpu_x, = x.owner.inputs
-            return [host_from_gpu(GpuFlatten(outdim)(gpu_x))]
-    return False
+#@register_opt()
+#@local_optimizer([gpu_from_host, tensor.Reshape])
+#def local_gpu_flatten(node):
+#    if isinstance(node.op, GpuFromHost):
+#        host_input = node.inputs[0]
+#        if host_input.owner and \
+#           isinstance(host_input.owner.op, tensor.Reshape):
+#            outdim = host_input.owner.op.outdim
+#            return [GpuFlatten(outdim)(
+#                as_cuda_ndarray_variable(host_input.owner.inputs[0]))]
+#    if isinstance(node.op, tensor.Reshape):
+#        x, shp= node.inputs
+#        outdim = node.op.outdim
+#        if x.owner and isinstance(x.owner.op, HostFromGpu):
+#            gpu_x, = x.owner.inputs
+#            return [host_from_gpu(GpuFlatten(outdim)(gpu_x))]
+#    return False


 @register_opt()

--- a/theano/sandbox/cuda/tests/test_basic_ops.py
+++ b/theano/sandbox/cuda/tests/test_basic_ops.py
@@ -307,7 +307,7 @@ def test_flatten():
    x = cuda.fmatrix('x')
    f = theano.function([x], x.flatten(), mode=mode_with_gpu)
    assert any([node for node in f.maker.fgraph.toposort()
-                if isinstance(node.op, B.GpuFlatten)])
+                if isinstance(node.op, B.GpuReshape)])
    assert len(f([[0., 0.], [0., 0.]]).shape) == 1



--- a/theano/tensor/basic.py
+++ b/theano/tensor/basic.py
--- a/theano/tensor/nnet/tests/test_sigm.py
+++ b/theano/tensor/nnet/tests/test_sigm.py
@@ -377,7 +377,7 @@ class T_softplus_opts(unittest.TestCase):
        f = theano.function([x], out, mode=self.m)
        topo = f.maker.fgraph.toposort()
        assert len(topo) == 3
-        assert isinstance(topo[0].op, T.Flatten)
+        assert T.is_flatten(topo[0])
        assert isinstance(topo[1].op.scalar_op,
                          theano.tensor.nnet.sigm.ScalarSoftplus)
        assert isinstance(topo[2].op.scalar_op, theano.scalar.Neg)

--- a/theano/tensor/opt.py
+++ b/theano/tensor/opt.py
@@ -3877,24 +3877,24 @@ def local_useless_split(node):
 ################
 # Flatten Opts #
 ################
-@register_canonicalize
-@register_stabilize
-@gof.local_optimizer([T.Flatten])
-def local_flatten_lift(node):
-    """
-    Flatten(UnaryElemwise(x)) -> UnaryElemwise(Flatten(x))
-
-    This optimization is needed by optimization
-    nnet/sigm.py:log1msigm_to_softplus to get applied when there is a flatten.
-
-    """
-    if (isinstance(node.op, T.Flatten) and
-            node.inputs[0].owner and
-            isinstance(node.inputs[0].owner.op, T.Elemwise) and
-            len(node.inputs[0].owner.inputs) == 1):
-        f = node.op(node.inputs[0].owner.inputs[0])
-        e = node.inputs[0].owner.op(f)
-        return [e]
+#@register_canonicalize
+#@register_stabilize
+#@gof.local_optimizer([T.Flatten])
+#def local_flatten_lift(node):
+#    ""
+#    Flatten(UnaryElemwise(x)) -> UnaryElemwise(Flatten(x))
+#
+#    This optimization is needed by optimization
+#    nnet/sigm.py:log1msigm_to_softplus to get applied when there is a flatten.
+#
+#    ""
+#    if (isinstance(node.op, T.Flatten) and
+#            node.inputs[0].owner and
+#            isinstance(node.inputs[0].owner.op, T.Elemwise) and
+#            len(node.inputs[0].owner.inputs) == 1):
+#        f = node.op(node.inputs[0].owner.inputs[0])
+#        e = node.inputs[0].owner.op(f)
+#        return [e]

 ##################
 # Reshape opts   #

--- a/theano/tensor/tests/test_basic.py
+++ b/theano/tensor/tests/test_basic.py
@@ -32,7 +32,7 @@ from theano.tensor import (_shared, wvector, bvector, autocast_float_as,
        alloc, as_tensor_variable, tensor_from_scalar, ARange, autocast_float,
        clip, constant, default, dot,
        dmatrix, dscalar, dvector, eq, eye, fill, flatten, inverse_permutation,
-        tensor4, permute_row_elements, Flatten, fmatrix, fscalars, grad,
+        tensor4, permute_row_elements, fmatrix, fscalars, grad,
        inplace, iscalar, matrix, minimum, matrices, maximum, mul, neq,
        Reshape, row, scalar, scalars, second, smallest, stack, sub, Tensor,
        tensor_copy, tensordot, TensorType, Tri, tri, tril, triu, unbroadcast,
@@ -5147,11 +5147,6 @@ def test_make_column_matrix_broadcastable():


 def test_flatten_outdimNone():
-    """Flatten always returns a copy of the array. There is no danger
-    with in-place operations and thus no need to test it.
-
-    """
-
    a = dmatrix()
    c = flatten(a)
    f = inplace_func([a], c)
@@ -5161,7 +5156,7 @@ def test_flatten_outdimNone():
    f = inplace_func([a], c)
    assert numpy.all(f(a_val) == c_val)

-    utt.verify_grad(Flatten(), [a_val])
+    utt.verify_grad(flatten, [a_val])


 def test_flatten_scalar():
@@ -5174,7 +5169,7 @@ def test_flatten_scalar():
    f = inplace_func([a], c)
    assert numpy.all(f(a_val) == c_val)

-    # utt.verify_grad(Flatten(), [a_val]) #TODO: fix verify_grd to work on scalars
+    # utt.verify_grad(flatten, [a_val]) #TODO: fix verify_grd to work on scalars


 def test_flatten_outdim1():
@@ -5187,7 +5182,7 @@ def test_flatten_outdim1():
    f = inplace_func([a], c)
    assert numpy.all(f(a_val) == c_val)

-    utt.verify_grad(Flatten(1), [a_val])
+    utt.verify_grad(flatten, [a_val])


 def test_flatten_outdim2():
@@ -5199,7 +5194,7 @@ def test_flatten_outdim2():
    f = inplace_func([a], c)
    assert numpy.all(f(a_val) == a_val)

-    utt.verify_grad(Flatten(2), [a_val])
+    utt.verify_grad(lambda x: flatten(x, 2), [a_val])


 def test_flatten_outdim2_of_3():
@@ -5213,7 +5208,7 @@ def test_flatten_outdim2_of_3():
    f = inplace_func([a], c)
    assert numpy.all(f(a_val) == c_val)

-    utt.verify_grad(Flatten(2), [a_val])
+    utt.verify_grad(lambda x: flatten(x, 2), [a_val])


 def test_flatten_broadcastable():
@@ -7128,24 +7123,27 @@ class TestInferShape(utt.InferShapeTester):
        # Flatten
        atens3 = tensor3()
        atens3_val = rand(4, 5, 3)
-        for outdim in (3, 2, 1):
-            self._compile_and_check([atens3],
-                                    [Flatten(outdim)(atens3)],
-                                    [atens3_val], Flatten)
-
-        amat = matrix()
-        amat_val = rand(4, 5)
-        for outdim in (2, 1):
-            self._compile_and_check([amat],
-                                    [Flatten(outdim)(amat)],
-                                    [amat_val], Flatten)
-
-        avec = vector()
-        avec_val = rand(4)
-        outdim = 1
-        self._compile_and_check([avec],
-                                [Flatten(outdim)(avec)],
-                                [avec_val], Flatten)
+        self._compile_and_check([atens3],
+                                [flatten(atens3, 1)],
+                                [atens3_val], Reshape)
+        #for outdim in (3, 2, 1):
+        #    self._compile_and_check([atens3],
+        #                            [flatten(atens3, outdim)],
+        #                            [atens3_val], Reshape)
+
+        #amat = matrix()
+        #amat_val = rand(4, 5)
+        #for outdim in (2, 1):
+        #    self._compile_and_check([amat],
+        #                            [flatten(amat, outdim)],
+        #                            [amat_val], Reshape)
+
+        #avec = vector()
+        #avec_val = rand(4)
+        #outdim = 1
+        #self._compile_and_check([avec],
+        #                        [flatten(avec, outdim)],
+        #                        [avec_val], Reshape)

        # Eye
        aiscal = iscalar()

--- a/theano/tensor/tests/test_opt.py
+++ b/theano/tensor/tests/test_opt.py
@@ -60,6 +60,7 @@ from theano.tests import unittest_tools as utt
 from theano.compile.mode import optdb
 from theano.compile import Mode
 from nose.plugins.attrib import attr
+from theano.tensor.basic import flatten, is_flatten

 mode_opt = theano.config.mode
 if mode_opt == 'FAST_COMPILE':
@@ -5879,18 +5880,19 @@ def test_local_useless_split():

 def test_local_flatten_lift():
    for i in xrange(1, 4):
-        op = tensor.Flatten(i)
        x = tensor.tensor4()
-        out = op(T.exp(x))
+        out = tensor.flatten(T.exp(x), i)
        assert out.ndim == i
        mode = compile.mode.get_default_mode()
        mode = mode.including('local_flatten_lift')
        f = theano.function([x], out, mode=mode)
-        f(numpy.random.rand(5, 4, 3, 2).astype(config.floatX))
+        x_np = numpy.random.rand(5, 4, 3, 2).astype(config.floatX)
+        out_np = f(x_np)
        topo = f.maker.fgraph.toposort()
-        assert len(topo) == 2
-        assert isinstance(topo[0].op, tensor.Flatten)
-        assert isinstance(topo[1].op, tensor.Elemwise)
+        shape_out_np = tuple(x_np.shape[:i-1])+(numpy.prod(x_np.shape[i-1:]),)
+        assert shape_out_np == out_np.shape
+        assert tensor.is_flatten(topo[0], outdim=i)
+        assert isinstance(topo[-1].op, tensor.Elemwise)


 class Test_Reshape(unittest.TestCase):