merge

911b0a0a · James Bergstra · 81953c26 · 9734e6fd · 911b0a0a · 911b0a0a
--- a/doc/tutorial/symbolic_graphs.txt
+++ b/doc/tutorial/symbolic_graphs.txt
@@ -46,8 +46,8 @@ details about these building blocks see :ref:`variable`, :ref:`op`,
    circles are :ref:`Ops <op>`. Purple boxes are :ref:`Types <type>`.
-The graph can be traversed starting from a root (the result of some
+The graph can be traversed starting from outputs (the result of some
-computation) down to its leaves using the owner field.
+computation) down to its inputs using the owner field.
 Take for example the following code:
 .. code-block:: python
@@ -55,10 +55,8 @@ Take for example the following code:
    x = T.dmatrix('x')
    y = x*2.
-``y`` is such root, though there can be others for example if you also 
+If you print `type(y.owner)`` you get ``<class 'theano.gof.graph.Apply'>``, 
-had ``z = x+2``, then ``z`` would be a root as well. If you print 
+which is the apply node that connects the op and the inputs to get this
-``type(y.owner)`` you get ``<class 'theano.gof.graph.Apply'>``, which 
-is the apply node that connects the op and the inputs to get this
 output. You can now print the name of the op that is applied to get 
 ``y``:

--- a/theano/sandbox/test_scan.py
+++ b/theano/sandbox/test_scan.py
@@ -76,18 +76,148 @@ def verify_grad(op, pt, n_tests=2, rng=None, eps = None, tol = None,
-# Naming convention : 
-#  u_1,u_2,..   -> sequences
-#  s_1,s_2,..   -> initial states
-#  w_1,w_2,..   -> non-sequences
-###################################
 class T_Scan(unittest.TestCase):
    def setUp(self):
        utt.seed_rng()
-   def test_one(self):
-      pass
+    # generator network, only one output , type scalar ; no sequence or 
+    # non sequence arguments
+    def test_1():
+      def f_pow2(x_tm1):
+        return (2*x_tm1, {})
+      s = theano.tensor.dvector()
+      n_steps = theano.tensor.dscalar()
+      Y = theano.sandbox.scan.scan(f_pow2, [],s, [],n_steps = n_steps)
+      f1 = theano.function([s,n_steps], Y)
+      assert( numpy.any(f1([1],3)== [2,4,8])  )
+    # simple rnn, one input, one state, weights for each; input/state are 
+    # vectors, weights are scalars
+    def test_2():
+        def f_rnn(u_t,x_tm1,W_in, W):
+            return (u_t*W_in+x_tm1*W, {})
+        u    = theano.tensor.dvector()
+        x0   = theano.tensor.dvector()
+        W_in = theano.tensor.dscalar()
+        W    = theano.tensor.dscalar()
+        Y = theano.sandbox.scan.scan(f_rnn, u,x0,[W_in,W])
+        f2 = theano.function([u,x0,W_in,W], Y)
+        assert(numpy.any(f2([1,2,3,4],[1],.1,1)== \
+                numpy.array([1.1,1.3,1.6,2.])))
+    # simple rnn, one input, one state, weights for each; input/state are 
+    # vectors, weights are scalars; using shared variables
+    def test_3():
+        u    = theano.tensor.dvector()
+        x0   = theano.tensor.dvector()
+        W_in = theano.shared(.1, name = 'w_in')
+        W    = theano.shared(1., name ='w')
+        def f_rnn_shared(u_t,x_tm1):
+            return (u_t*W_in+x_tm1*W, {})
+        Y = theano.sandbox.scan.scan(f_rnn_shared, u,x0,[])
+        f3 = theano.function([u,x0], Y)
+        assert(numpy.any(f3([1,2,3,4],[1])== numpy.array([1.1,1.3,1.6,2.])))
+    # some rnn with multiple outputs and multiple inputs; other dimension 
+    # instead of scalars/vectors
+    def test_4():
+        W_in2 = theano.shared(numpy.array([1.,2.]), name='win2')
+        W     = theano.shared(numpy.array([[2.,1.],[1.,1.]]), name='w')
+        W_out = theano.shared(numpy.array([.5,1.]), name = 'wout')
+        W_in1 = theano.tensor.dmatrix('win')
+        u1    = theano.tensor.dmatrix('u1')
+        u2    = theano.tensor.dvector('u2')
+        x0    = theano.tensor.dmatrix('x0')
+        y0    = theano.tensor.dvector('y0')
+        def f_rnn_cmpl(u1_t, u2_t, x_tm1, y_tm1, W_in1):
+            return ({}, [theano.dot(u1_t,W_in1) + u2_t* W_in2 + \
+                    theano.dot(x_tm1, W), theano.dot(x_tm1, W_out)])
+        Y = theano.sandbox.scan.scan(f_rnn_cmpl,[u1,u2],[x0,y0],W_in1)
+        f4 = theano.function([u1,u2,x0,y0,W_in1], Y)
+        (x,y) =  f4( numpy.array([[1,2],[1,2],[1,2]]), \
+                  numpy.array([1,2,3]),             \
+                  numpy.array([[0,0]]),             \
+                  numpy.array([1]),                 \
+                  numpy.array([[1,1],[1,1]]))
+        assert( numpy.all(x == numpy.array([[4.,5.],[18.,16.],[58.,43.]])))
+        assert( numpy.all(y == numpy.array([0.,7.,25.])))
+    # basic ESN using updates 
+    def test_5(): 
+        W_in = theano.shared(numpy.array([1.,1.]), name='win')
+        W    = theano.shared(numpy.array([[.1,0.],[.0,.1]]),name='w')
+        W_out= theano.shared(numpy.array([.5,1.]), name='wout')
+        u  = theano.tensor.dvector('u')
+        x  = theano.shared(numpy.array([0.,0.]),'x')
+        y0 = theano.tensor.dvector('y0')
+        def f_ESN(u_t):
+            return ( theano.dot(x,W_out), \
+             { x: W_in*u_t + theano.dot(x,W) } )
+        Y = theano.sandbox.scan.scan(f_ESN,u,y0,[],outputs_taps={0:[]})
+        f5 = theano.function([u,y0],Y)
+        assert( f5( numpy.array([1,2,3]), numpy.array([0])) == \
+                 numpy.array([0.,1.4,3.15]))
+    # basic ESN using updates ; moving backwards
+    def test_6(): 
+        W_in = theano.shared(numpy.array([1.,1.]), name='win')
+        W    = theano.shared(numpy.array([[.1,0.],[.0,.1]]),name='w')
+        W_out= theano.shared(numpy.array([.5,1.]), name='wout')
+        u  = theano.tensor.dvector('u')
+        x  = theano.shared(numpy.array([0.,0.]),'x')
+        y0 = theano.tensor.dvector('y0')
+        def f_ESN(u_t):
+            return ( theano.dot(x,W_out), \
+             { x: W_in*u_t + theano.dot(x,W) } )
+        Y = theano.sandbox.scan.scan(f_ESN,u,y0,[],outputs_taps={0:[]}, \
+                                     go_backwards = True)
+        f6 = theano.function([u,y0],Y)
+        assert( f6( numpy.array([1,2,3]), numpy.array([0])) == \
+                 numpy.array([0., 4.5, 3.45]))
+    '''
+     TO TEST: 
+        - test taps (for sequences and outputs )
+        - test gradient (one output)
+        - test gradient (multiple outputs)
+        - test gradient (go_bacwards) 
+        - test gradient (multiple outputs / some uncomputable )
+        - test gradient (truncate_gradient)
+        - test gradient (force_gradient) 
+        - test inplace map
+    '''
 if __name__ == '__main__':
    unittest.main()