Commit 8a15ca52 authored by Olivier Breuleux

merge

import sys
import os
import shutil
import inspect
from epydoc import docintrospecter
......@@ -98,13 +99,36 @@ if __name__ == '__main__':
if options['--all'] or options['--epydoc']:
from epydoc.cli import cli
sys.path[0:0] = throot
#Generate HTML doc
#os.system("epydoc --config doc/api/epydoc.conf -o html/api")
sys.argv[:] = ['', '--config', '%s/doc/api/epydoc.conf' % throot, '-o', 'api']
cli()
# os.system("epydoc --config doc/api/epydoc.conf -o html/api")
# Generate PDF doc
# TODO
if options['--all'] or options['--rst']:
import sphinx
sys.path[0:0] = [os.path.join(throot, 'doc')]
sphinx.main(['', '-E', os.path.join(throot, 'doc'), '.'])
# Generate latex file in a temp directory
import tempfile
workdir = tempfile.mkdtemp()
sphinx.main(['', '-E', '-b', 'latex',
os.path.join(throot, 'doc'), workdir])
# Compile to PDF
currentdir = os.getcwd()
os.chdir(workdir)
os.system('make')
try:
shutil.copy(os.path.join(workdir, 'theano.pdf'), currentdir)
os.chdir(currentdir)
shutil.rmtree(workdir)
except OSError, e:
print 'OSError:', e
......@@ -86,9 +86,13 @@ class BadOptimization(DebugModeError):
self.old_graph = old_graph
self.new_graph = new_graph
def __str__(self):
    """Render this exception as its full multiline diagnostic report."""
    return self.str_diagnostic()
def str_diagnostic(self):
"""Return a pretty multiline string representating the cause of the exception"""
sio = StringIO()
print >> sio, "BadOptimization Error", super(BadOptimization, self).__str__()
print >> sio, " Result: id", id(self.new_r), self.new_r
print >> sio, " Op", self.new_r.owner
print >> sio, " Value Type:", type(self.new_r_val)
......@@ -117,8 +121,8 @@ class BadDestroyMap(DebugModeError):
print >> sio, " destroy_map:", getattr(self.node.op, 'destroy_map', {})
print >> sio, " changed input idx:", self.idx
print >> sio, " changed input type:", self.node.inputs[self.idx].type
print >> sio, " old val:", self.old_val
print >> sio, " new val:", self.new_val
print >> sio, " repr (old val):", repr(self.old_val)
print >> sio, " repr (new val):", repr(self.new_val)
print >> sio, ""
print >> sio, " Hint: this can be caused by a deficient values_eq_approx() or __eq__() implementation that compares node input values"
return sio.getvalue()
......@@ -203,7 +207,7 @@ def _optcheck_env(input_specs, output_specs, accept_inplace = False):
env.extend(Supervisor(input for spec, input in zip(input_specs, inputs) if not (spec.mutable or (hasattr(env, 'destroyers') and env.destroyers(input)))))
return env, map(SymbolicOutput, updates), equivalence_tracker
def _check_inputs(node, storage_map, r_vals, dr_vals, active_nodes):
def _check_inputs(node, storage_map, r_vals, dr_vals, active_nodes, clobber_dr_vals=True):
"""Raise BadDestroyMap if necessary, update dr_vals"""
destroyed_idx_list = []
destroy_map = getattr(node.op, 'destroy_map', {})
......@@ -221,10 +225,98 @@ def _check_inputs(node, storage_map, r_vals, dr_vals, active_nodes):
if dr_vals.get(r, (0, node))[1] is not node:
# bad: there should only be one active node that destroys any result
raise Exception('failure in topological ordering')
dr_vals[r] = (storage_map[r][0], node) #no copy, this is the last use of this variable
if clobber_dr_vals:
dr_vals[r] = (storage_map[r][0], node) #no copy, this is the last use of this variable
storage_map[r][0] = None #make sure that dr_vals[r] doens't get used again
else:
raise BadDestroyMap(node, r_idx, r_vals[r], storage_map[r][0])
def _lessbroken_deepcopy(a):
if type(a) is numpy.ndarray:
rval = numpy.array(a, copy=True, dtype=a.dtype)
else:
rval = copy.deepcopy(a)
assert type(rval) == type(a)
if isinstance(rval, numpy.ndarray):
assert rval.dtype == a.dtype
return rval
def _find_bad_optimizations0(order, reasons, r_vals):
"""Use a simple algorithm to find broken optimizations. This algorithm is simple to
understand, but sometimes when there's a problem it identifies the wrong optimization as
the culprit.
"""
# iterate over results looking for values that don't match the values of the
# results they replaced. This is the sign of a broken optimization.
for i, node in enumerate(order):
for new_r in node.outputs:
for reason, r, old_graph_str, new_graph_str in reasons[new_r]:
problem = False
#check if the value for new_r doesn't match the value for r
new_r_val = r_vals[new_r]
r_val = r_vals[r]
assert r.type == new_r.type
if not r.type.values_eq_approx(r_val, new_r_val):
raise BadOptimization(old_r=r,
new_r=new_r,
old_r_val=r_val,
new_r_val=new_r_val,
reason=reason,
old_graph=old_graph_str,
new_graph=new_graph_str)
def _find_bad_optimizations1(order, reasons, r_vals):
# iterate over results looking for values that don't match the values of the
# results they replaced. This is the sign of a broken optimization.
#identify sets of results that are supposed to be equivalent
equivalence_sets = {}
program_position = {} #node -> order idx
for i, node in enumerate(order):
program_position[node] = i
for new_r in node.outputs:
equivalence_sets.setdefault(new_r, set([new_r]))
for reason, r, old_graph_str, new_graph_str in reasons[new_r]:
equivalence_sets[new_r].update(equivalence_sets.setdefault(r, set([r])))
for er in equivalence_sets[r]:
equivalence_sets[er] = equivalence_sets[new_r]
#identify equivalence sets that are broken
equivalence_sets_broken = {} #id(set) -> Bool
there_is_a_problem = False
for r, r_equiv in equivalence_sets.iteritems():
if id(r_equiv) not in equivalence_sets_broken:
equivalence_sets_broken[id(r_equiv)] = False
#loop over the results in the set comparing them to be equal enough
re0 = None
for re in r_equiv:
if re0:
new_r_val = r_vals[re]
r_val = r_vals[re0]
assert re.type == re0.type
if not re.type.values_eq_approx(r_val, new_r_val):
equivalence_sets_broken[id(r_equiv)] = True
there_is_a_problem = True
re0 = re
if there_is_a_problem:
# which broken equivalence set has the earliest-occurring element?
first_broken_set = None
for i, node in enumerate(order):
for r in node.outputs:
r_equiv = equivalence_sets[r]
if equivalence_sets_broken[id(r_equiv)]:
first_broken_set = r_equiv
#TODO finish this to produce good diagnostic information
print first_broken_set
raise Exception('broken')
class _EnvEvent(object):
"""A record of an event in the life of an Env.
......@@ -425,12 +517,12 @@ class _Linker(gof.link.LocalLinker):
def make_all(self, profiler = None, input_storage = None, output_storage = None):
env = self.env
input_storage_ = input_storage
output_storage_ = output_storage
#order = env.toposort()
#Compute a topological ordering that IGNORES the destroy_map of destructive Ops.
#This will be OK, because every thunk is evaluated on a copy of its input.
# If the copy.copy function produces an object that is aliased to the original one,
# then this evaluation mode will not work. It works for ndarrays.
order_outputs = copy.copy(env.equivalence_tracker.all_results_ever)
order_outputs.reverse()
order = graph.io_toposort(env.inputs, order_outputs)
......@@ -440,7 +532,8 @@ class _Linker(gof.link.LocalLinker):
no_recycling = self.no_recycling
input_storage, output_storage, storage_map = link.map_storage(env, order, input_storage, output_storage)
input_storage, output_storage, storage_map = link.map_storage(env, order,
input_storage_, output_storage_)
thunks_py = [] #python thunks
thunks_c = [] #c thunks
......@@ -481,10 +574,10 @@ class _Linker(gof.link.LocalLinker):
thunk.inputs = node_input_storage
thunk.outputs = node_output_storage
thunks_c.append(thunk)
except (NotImplementedError, utils.AbstractFunctionError):
thunks_c.append(None)
p = node.op.perform
thunk = (lambda p = p, i = node_input_storage, o = node_output_storage, n =
node: p(n, [x[0] for x in i], o))
......@@ -521,11 +614,11 @@ class _Linker(gof.link.LocalLinker):
# transfer the initial values from the storage_map to the r_vals
for r in storage_map:
if storage_map[r][0] is not None:
if r.owner is not None:
# DEBUG
print r, storage_map[r], type(storage_map[r]), id(storage_map[r])
assert r.owner is None
if (r.owner is None):
if (storage_map[r][0] is None):
raise Exception('Missing input', r)
if not r.type.is_valid_value(storage_map[r][0]):
raise InvalidValueError(r, storage_map[r][0])
r_vals[r] = storage_map[r][0]
storage_map[r][0] = None
#####
......@@ -541,13 +634,18 @@ class _Linker(gof.link.LocalLinker):
# put a copy of each input into the storage_map
for r in node.inputs:
storage_map[r][0] = copy.copy(r_vals[r])
assert isinstance(r, gof.Result)
assert r in r_vals
storage_map[r][0] = _lessbroken_deepcopy(r_vals[r])
if not r.type.is_valid_value(storage_map[r][0]):
raise InvalidValueError(r, storage_map[r][0])
thunk_py()
_check_inputs(node, storage_map, r_vals, dr_vals, active_order_set)
_check_inputs(node, storage_map, r_vals, dr_vals, active_order_set,
clobber_dr_vals=True)
#retrieve a copy of each output from the storage_map
#retrieve each output from the storage_map
for r in node.outputs:
if not r.type.is_valid_value(storage_map[r][0]):
raise InvalidValueError(r, storage_map[r][0])
......@@ -561,11 +659,12 @@ class _Linker(gof.link.LocalLinker):
for r in node.inputs:
# TODO: we only need to overwrite the non-destroyed inputs
storage_map[r][0] = copy.copy(r_vals[r])
storage_map[r][0] = _lessbroken_deepcopy(r_vals[r])
thunk_c()
_check_inputs(node, storage_map, r_vals, dr_vals, active_order_set)
_check_inputs(node, storage_map, r_vals, dr_vals, active_order_set,
clobber_dr_vals=False)
for r in node.outputs:
if not r.type.is_valid_value(storage_map[r][0]):
......@@ -584,27 +683,7 @@ class _Linker(gof.link.LocalLinker):
except:
raise_with_op(node)
# iterate over results looking for values that don't match the values of the
# results they replaced. This is the sign of a broken optimization.
for i, node in enumerate(order):
for new_r in node.outputs:
for reason, r, old_graph_str, new_graph_str in env.equivalence_tracker.reasons[new_r]:
problem = False
#check if the value for new_r doesn't match the value for r
new_r_val = r_vals[new_r]
r_val = r_vals[r]
assert r.type == new_r.type
if not r.type.values_eq_approx(r_val, new_r_val):
raise BadOptimization(old_r=r,
new_r=new_r,
old_r_val=r_val,
new_r_val=new_r_val,
reason=reason,
old_graph=old_graph_str,
new_graph=new_graph_str)
_find_bad_optimizations0(order, env.equivalence_tracker.reasons, r_vals)
#####
# Postcondition: the input and output results are in the storage map, nothing more
......@@ -629,6 +708,7 @@ class _Linker(gof.link.LocalLinker):
# if an input was destroyed, the destroyed value should be returned
for r in dr_vals:
assert dr_vals[r][0] is not None
if r.owner is None:
assert r in env.inputs
#HACK TO LOOK LIKE A REAL DESTRUCTIVE ACTION TOOK PLACE
......@@ -645,6 +725,9 @@ class _Linker(gof.link.LocalLinker):
#print output_storage
#print dr_vals
#print storage_map
for r in storage_map:
if (r.owner is None):
assert storage_map[r][0] is not None
###############
# Done f
......
......@@ -288,8 +288,12 @@ class Function(object):
# if we are allowing garbage collection, remove the input and output reference from the internal
# storage cells
if getattr(self.fn, 'allow_gc', False):
for x in self.output_storage:
x.storage[0] = None #WARNING: This circumvents the 'readonly' attribute in x
assert len(self.output_storage) == len(self.maker.env.outputs)
for o_container, o_result in zip(self.output_storage, self.maker.env.outputs):
if o_result.owner is not None:
# this node is the result of computation
# WARNING: This circumvents the 'readonly' attribute in x
o_container.storage[0] = None
# Update the inputs that have an update function
for input, storage in reversed(zip(self.maker.expanded_inputs, self.input_storage)):
......
......@@ -160,6 +160,8 @@ class DimShuffle(Op):
def perform(self, node, (input, ), (storage, )):
# drop
res = input
if type(res) != numpy.ndarray:
raise TypeError(res)
shape = list(res.shape)
for drop in reversed(self.drop):
shape.pop(drop)
......@@ -178,7 +180,7 @@ class DimShuffle(Op):
if not self.inplace:
res = numpy.copy(res)
storage[0] = res
storage[0] = numpy.asarray(res) #asarray puts scalars back into array
def c_code(self, node, name, (input,), (res,), sub):
def statements(lst):
......
Markdown is supported
0%
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Register or sign in to comment