Commit a51b43fe authored by Ian Goodfellow

merged

.. _developer:
==============================================
Theano Design and Implementation Documentation
==============================================
.. toctree::
   :maxdepth: 2

   tensor
.. _tensor:
=======
Tensor
=======
This file describes the design of theano.tensor.
Elemwise grad and R_op
======================
Here's another straightforward example, though a bit more elaborate
than adding two numbers together. Let's say that you want to compute
the logistic curve, which is given by:
.. math::

   s(x) = \frac{1}{1 + e^{-x}}
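A minimal plain-NumPy sketch of this function and its derivative (in Theano the graph would be built symbolically with `tensor.exp`; this version is just for illustration):

```python
import numpy as np

def logistic(x):
    # s(x) = 1 / (1 + e^{-x})
    return 1.0 / (1.0 + np.exp(-x))

def logistic_grad(x):
    # ds/dx = s(x) * (1 - s(x)), the elemwise gradient of the logistic
    s = logistic(x)
    return s * (1.0 - s)

print(logistic(0.0))       # 0.5
print(logistic_grad(0.0))  # 0.25
```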
...@@ -78,7 +78,8 @@ Roughly in order of what you'll want to check out:
* :ref:`libdoc` -- Theano's functionality, module by module.
* :ref:`optimizations` -- Guide to Theano's graph optimizations.
* :ref:`extending` -- Learn to add a Type, Op, or graph optimization.
* :ref:`developer` -- Primarily of interest to developers of Theano
* :ref:`internal` -- How to maintain Theano, LISA-specific tips, and more...
* :ref:`release` -- How our release should work.
You can download the latest `PDF documentation <http://deeplearning.net/software/theano/theano.pdf>`_, rather than reading it online.
...
...@@ -36,7 +36,14 @@ def grad_sources_inputs(sources, graph_inputs, warn_type=True):
    them)
    :rtype: dictionary whose keys and values are of type `Variable`
    :return: mapping from each Variable encountered in the backward
        traversal to the gradient with respect to that Variable.

    It is assumed that there is some objective J shared between all members
    of sources, so that for each Variable v, the gradient on v is the
    gradient of J with respect to v.
    """
    gmap = {}
    for (r, g_r) in sources:
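The accumulation this loop performs can be sketched with plain Python values in place of Theano Variables: gradient contributions reaching the same variable from several sources are summed into the map.

```python
# Toy sketch of gradient accumulation into gmap: 'x' receives two
# contributions (from two sources), which are summed.
sources = [('x', 2.0), ('y', 3.0), ('x', 0.5)]

gmap = {}
for r, g_r in sources:
    gmap[r] = gmap.get(r, 0.0) + g_r

print(gmap['x'])  # 2.5
```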
...@@ -125,3 +132,14 @@ def unimplemented_grad(op, x_pos, x):
""" """
msg = '%s.grad not implemented for input %i'%(op, x_pos) msg = '%s.grad not implemented for input %i'%(op, x_pos)
return Raise(msg=msg)(x) return Raise(msg=msg)(x)

class GradientUndefined(Exception):
    pass


def undefined_grad(op, x_pos, x):
    msg = "Undefined gradient - do not use in computations"
    exc = GradientUndefined
    return Raise(msg=msg, exc=exc)(x)


# Example: an Op whose gradient is defined for input 0 but undefined for
# input 1 would write its grad method like this (g_x0 stands for the
# gradient expression on inputs[0], computed elsewhere):
def grad(self, inputs, ograds):
    return [g_x0, undefined_grad(self, 1, inputs[1])]
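A plain-Python analogy of what the `Raise` helper does (this is a sketch, not Theano's actual Op): the returned node sits in a graph harmlessly, and raises the given exception only when its value is actually used.

```python
class GradientUndefined(Exception):
    pass

# Analogy of Raise(msg=..., exc=...): "using" the returned value raises,
# so an undefined gradient only errors if someone evaluates it.
def raise_on_use(msg, exc=GradientUndefined):
    def use(_x):
        raise exc(msg)
    return use

g = raise_on_use("Undefined gradient - do not use in computations")
try:
    g(1.0)
except GradientUndefined as e:
    caught = str(e)

print(caught)  # Undefined gradient - do not use in computations
```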
...@@ -77,6 +77,16 @@ def constant(x):
class Scalar(Type):
"""
Internal class, should not be used by clients
Primarily used by tensor.elemwise and tensor.reduce
Analogous to TensorType, but for zero-dimensional objects
Maps directly to C primitives
TODO: refactor to be named ScalarType for consistency with TensorType
"""
    def __init__(self, dtype):
        if dtype == 'floatX':
            dtype = config.floatX
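The "maps directly to C primitives" point can be sketched with a small lookup table; the entries below are illustrative assumptions, not Theano's actual `dtype_specs` table.

```python
# Illustrative dtype -> C primitive mapping (entries are assumptions for
# illustration; Theano keeps the real table inside the Scalar type).
C_PRIMITIVES = {
    'float32': 'float',
    'float64': 'double',
    'int32': 'npy_int32',
    'int64': 'npy_int64',
}

def c_type_of(dtype):
    return C_PRIMITIVES[dtype]

print(c_type_of('float64'))  # double
```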
...
...@@ -537,7 +537,10 @@ class Elemwise(Op):
    def grad(self, inputs, ograds):
        # Gradients (especially on the final costs) don't have to be symbolic,
        # e.g., ograds will be [1.] if your objective is c and the output
        # of the current apply node is c
        ograds = map(as_tensor_variable, ograds)
        scalar_inputs = [Scalar(dtype=t.type.dtype)() for t in inputs]
        scalar_ograds = [Scalar(dtype=ograd.type.dtype)() for ograd in ograds]
        scalar_igrads = self.scalar_op.grad(scalar_inputs, scalar_ograds)
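The idea behind Elemwise's grad — apply the scalar op's gradient formula elementwise, scaled by the incoming output gradient — in a NumPy sketch, using multiplication as the scalar op (function names here are illustrative):

```python
import numpy as np

# Scalar op z = x * y has dz/dx = y and dz/dy = x; the elemwise gradient
# applies those formulas pointwise, scaled by the incoming gradient g_out.
def elemwise_mul_grad(x, y, g_out):
    return g_out * y, g_out * x

x = np.array([1.0, 2.0])
y = np.array([3.0, 4.0])
# When this node's output IS the objective, the incoming gradient is all
# ones -- the "ograds will be [1.]" case mentioned above.
gx, gy = elemwise_mul_grad(x, y, np.ones_like(x))

print(gx)  # [3. 4.]
print(gy)  # [1. 2.]
```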
...