提交 fd7e6d59 authored 作者: Pascal Lamblin's avatar Pascal Lamblin

merge

......@@ -7,6 +7,19 @@ Graph optimization
In this section we will define a couple optimizations on doubles.
.. todo::
This tutorial goes way too far under the hood, for someone who just wants
to add yet another pattern to the libraries in tensor.opt for example.
We need another tutorial that covers the decorator syntax, and explains how
to register your optimization right away. That's what you need to get
going.
Later, the rest is more useful for when that decorator syntax type thing
doesn't work. (There are optimizations that don't fit that model).
Global and local optimizations
==============================
......@@ -119,6 +132,11 @@ simplification described above:
simplify = Simplify()
.. todo::
What is add_requirements? Why would we know to do this? Are there other
requirements we might want to know about?
Here's how it works: first, in ``add_requirements``, we add the
``ReplaceValidate`` :ref:`envfeature` located in
:api:`theano.gof.toolbox`. This feature adds the ``replace_validate``
......@@ -150,6 +168,7 @@ and :ref:`apply` to get a better understanding of the
pointer-following game you need to get ahold of the nodes of interest
for the simplification (``x``, ``y``, ``z``, ``a``, ``b``, etc.).
Test time:
>>> x = double('x')
......@@ -238,6 +257,10 @@ The local version of the above code would be the following:
local_simplify = LocalSimplify()
.. todo::
Fix up previous example... it's bad and incomplete.
The definition of transform is the inner loop of the global optimizer,
where the node is given as argument. If no changes are to be made,
``False`` must be returned. Else, a list of what to replace the node's
......@@ -310,6 +333,9 @@ Theano defines some shortcuts to make LocalOptimizers:
means that everything we said previously about local optimizers
apply: they need to be wrapped in a Navigator, etc.
.. todo::
    Define what a Navigator is (or link to its documentation) before it is
    first mentioned here.
When an optimization can be naturally expressed using ``OpSub``, ``OpRemove``
or ``PatternSub``, it is highly recommended to use them.
......@@ -319,6 +345,7 @@ use constraints, etc. - there's some decent doc at
:api:`theano.gof.opt.PatternSub` for those interested)
.. _optdb:
The optimization database (optdb)
......
......@@ -1781,36 +1781,44 @@ def div_proxy(x, y):
return true_div(x, y)
@_scal_elemwise
def add(a, b):
def add(a, *other_terms):
"""elementwise addition"""
# see decorator for function body
@_scal_elemwise
def sub(a, b):
"""elementwise subtraction"""
# see decorator for function body
@_scal_elemwise
def mul(a, b):
def mul(a, *other_terms):
"""elementwise multiplication"""
# see decorator for function body
@_scal_elemwise
def true_div(a, b):
"""elementwise [true] division (inverse of multiplication)"""
# see decorator for function body
@_scal_elemwise
def int_div(a, b):
"""elementwise integer-division"""
# see decorator for function body
@_scal_elemwise
def mod(a, b):
"""elementwise modulo"""
# see decorator for function body
@_scal_elemwise
def pow(a, b):
"""elementwise power"""
# see decorator for function body
@_scal_elemwise
def clip(x, min, max):
"""clip x to be between min and max"""
# see decorator for function body
pprint.assign(add, printing.OperatorPrinter('+', -2, 'either'))
pprint.assign(mul, printing.OperatorPrinter('*', -1, 'either'))
......@@ -3007,6 +3015,8 @@ class AdvancedSubtensor(Op):
#TODO: see what's the best solution
self.args = args #?
#FIXME: do not store variables in the class instance
#FIXME
#if len(args) != 2:
# print >>sys.stderr, 'WARNING: Advanced indexing with %i arguments not supported yet' % len(args)
......@@ -3018,6 +3028,11 @@ class AdvancedSubtensor(Op):
if x.ndim == 2 and len(inputs) == 2:
ind1 = as_tensor_variable(inputs[0])
ind2 = as_tensor_variable(inputs[1])
if not (ind1.type.dtype.startswith('int') or ind1.type.dtype.startswith('uint')):
raise TypeError()
if not (ind2.type.dtype.startswith('int') or ind2.type.dtype.startswith('uint')):
raise TypeError()
if ind1.ndim == 1 and ind2.ndim == 1:
return gof.Apply(self,
(x,) + inputs,
......@@ -3029,7 +3044,11 @@ class AdvancedSubtensor(Op):
% ','.join(str(input) for input in inputs))
def perform(self, node, inputs, (out,)):
    # Perform advanced (fancy) indexing.
    # inputs[0] is the variable being indexed; inputs[1:] are the
    # index arrays, passed as a tuple to __getitem__.
    pass  # NOTE(review): leftover no-op from an earlier stub; harmless
    # TODO: in general, we need to re-pack the inputs into a valid index, just like
    # subtensor
    out[0] = inputs[0].__getitem__(inputs[1:])
    #return
    #raise NotImplementedError()
def grad(self, inputs, (gz,)):
x = inputs[0]
......@@ -3061,9 +3080,14 @@ class AdvancedIncSubtensor(Op):
% ','.join(str(input) for input in inputs))
def perform(self, node, inputs, (out,)):
    # Increment counterpart of AdvancedSubtensor.perform:
    # inputs are (x, y, *indices). Copy x, then add y in-place at the
    # advanced-indexed positions given by the remaining inputs.
    pass  # NOTE(review): leftover no-op from an earlier stub; harmless
    # TODO: same thing as in AdvancedSubtensor's perform TODO
    out[0] = inputs[0].copy()
    out[0][inputs[2:]] += inputs[1]
    #def grad?
    # grad on x is grad on output
    # grad on y is grad_output[idx_list]
    # grad on rest is None
......
差异被折叠。
......@@ -14,7 +14,8 @@ from elemwise import Elemwise, DimShuffle
from theano import scalar
import basic as T
import inplace as I
import numpy as N
import numpy
import numpy as N  # FIXME: avoid the "N" alias in library code; prefer "import numpy"
import operator
import itertools
import sys, os
......@@ -62,7 +63,6 @@ def get_constant_value(v):
return get_constant_value(v.owner.inputs[0])
raise TypeError(v)
@gof.optimizer
def insert_inplace_optimizer(env):
"""
......@@ -108,10 +108,12 @@ compile.optdb.register('inplace_opt', insert_inplace_optimizer, 75, 'fast_run',
def register_canonicalize(lopt, *tags, **kwargs):
    """Register `lopt` in the 'canonicalize' stage of the optimization
    database, tagged 'fast_run' plus any extra `tags`.

    :param lopt: the local optimizer to register.
    :param tags: additional tags to register the optimizer under.
    :param kwargs: may contain 'name' to override ``lopt.__name__``.
    :returns: `lopt` itself, so this function is usable as a decorator.
    """
    # Use pop with a default: the previous form
    # ``(kwargs and kwargs.pop('name')) or lopt.__name__`` raised
    # KeyError whenever kwargs was non-empty but had no 'name' entry.
    name = kwargs.pop('name', None) or lopt.__name__
    compile.optdb['canonicalize'].register(name, lopt, 'fast_run', *tags)
    return lopt
def register_specialize(lopt, *tags, **kwargs):
    """Register `lopt` in the 'specialize' stage of the optimization
    database, tagged 'fast_run' plus any extra `tags`.

    :param lopt: the local optimizer to register.
    :param tags: additional tags to register the optimizer under.
    :param kwargs: may contain 'name' to override ``lopt.__name__``.
    :returns: `lopt` itself, so this function is usable as a decorator.
    """
    # Use pop with a default: the previous form
    # ``(kwargs and kwargs.pop('name')) or lopt.__name__`` raised
    # KeyError whenever kwargs was non-empty but had no 'name' entry.
    name = kwargs.pop('name', None) or lopt.__name__
    compile.optdb['specialize'].register(name, lopt, 'fast_run', *tags)
    return lopt
######################
# DimShuffle lifters #
......@@ -876,10 +878,39 @@ register_canonicalize(local_mul_canonizer, name = 'local_mul_canonizer')
def local_neg_to_mul(node):
    """Canonicalization: rewrite ``neg(x)`` as ``mul(-1, x)``."""
    # Guard clause: anything that is not a negation is left untouched.
    if node.op != T.neg:
        return False
    return [T.mul(-1, node.inputs[0])]
register_canonicalize(local_neg_to_mul)
@register_specialize
@gof.local_optimizer([])
def local_sum_mul_by_scalar(node):
    """sum(scalar * smth) -> scalar * sum(smth)

    Also rewrites ``sum(-smth)`` as ``-sum(smth)``.
    """
    # TODO: if the thing inside the Sum is a division,
    # we should get at the numerator....
    if isinstance(node.op, T.Sum):
        thing_summed, = node.inputs
        if thing_summed.owner and thing_summed.owner.op == T.mul:
            terms = thing_summed.owner.inputs
            # A term is "scalar" when every dimension is broadcastable.
            # Use t.type.broadcastable consistently (the original mixed
            # t.type.broadcastable and t.broadcastable).
            scalars = [t.dimshuffle() for t in terms
                       if numpy.all(t.type.broadcastable)]
            non_scalars = [t for t in terms
                           if not numpy.all(t.type.broadcastable)]
            if scalars:
                # Collapse each side to a single variable, then apply
                # the sum only to the non-scalar product. This replaces
                # the six near-duplicate branches of the original with
                # equivalent graph constructions.
                if len(scalars) == 1:
                    scalar_part = scalars[0]
                else:
                    scalar_part = T.mul(*scalars)
                if not non_scalars:
                    return [scalar_part]
                if len(non_scalars) == 1:
                    summed_part = node.op(non_scalars[0])
                else:
                    summed_part = node.op(T.mul(*non_scalars))
                return [T.mul(scalar_part, summed_part)]
        if thing_summed.owner and thing_summed.owner.op == T.neg:
            return [T.neg(node.op(thing_summed.owner.inputs[0]))]
@gof.local_optimizer([T.mul])
def local_mul_to_neg(node):
if node.op == T.mul and N.all(local_mul_canonizer.get_constant(node.inputs[0]) == -1.0):
......@@ -888,6 +919,16 @@ def local_mul_to_neg(node):
return False
register_specialize(local_mul_to_neg)
@register_specialize
@gof.local_optimizer([T.neg])
def local_neg_neg(node):
    """Replace ``neg(neg(x))`` by ``x``.

    Other specializations shouldn't produce a double negation,
    but sometimes they do.
    """
    if node.op != T.neg:
        return
    inner = node.inputs[0].owner
    if inner is not None and inner.op == T.neg:
        return [inner.inputs[0]]
@gof.local_optimizer([T.mul])
def local_mul_zero(node):
"""As part of canonicalization, we replace multiplication by zero with zero.
......
......@@ -317,6 +317,44 @@ def test_asymptotic_32():
assert gxval[0,1] == 0.25
def test_get_rid_of_advanced_indexing_version_of_xent():
rng = numpy.random.RandomState(utt.fetch_seed())
x_val = rng.randn(3,5)
y_val = numpy.asarray([2,4,1])
x = T.dmatrix('x')
y = T.lvector('y')
expressions_to_test = [
T.sum(-T.log(softmax(x)[T.arange(y.shape[0]), y])),
-T.sum(T.log(softmax(x)[T.arange(y.shape[0]), y])),
-T.sum(T.log(softmax(x))[T.arange(y.shape[0]), y]),
T.sum(-T.log(softmax(x))[T.arange(y.shape[0]), y])]
def assert_optimizer_worked(expr):
f = theano.function([x,y], expr)
for i, node in enumerate(f.maker.env.toposort()):
print i, node
f(x_val, y_val)
assert len(f.maker.env.toposort()) == 4
for expr in expressions_to_test:
assert_optimizer_worked(expr)
## Gradient wrt x
for expr in expressions_to_test:
grad_x = T.grad(expr, x)
g = theano.function([x, y], grad_x)
for i, node in enumerate(g.maker.env.toposort()):
print i, node
g(x_val, y_val)
assert len(g.maker.env.toposort()) == 4
#TODO: Case with bias
# hint - call local_softmax_with_bias from within the other optimization
# hint - call the argmax push-down optimization first too
if __name__ == '__main__':
    # Run this module's tests directly via the unittest runner.
    unittest.main()
Markdown 格式
0%
您添加了 0 到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 后发表评论