Merge pull request #4404 from abergeron/stack_nanguard

Convert NanGuardMode to use the VM linker instead of WrapLinker.

Merge pull request #4404 from abergeron/stack_nanguard
e845b755 · Frédéric Bastien · df0292e6 · c8f4b611 · e845b755 · e845b755
--- a/doc/tutorial/modes.txt
+++ b/doc/tutorial/modes.txt
@@ -168,8 +168,8 @@ Linkers
 =======
 A mode is composed of 2 things: an optimizer and a linker. Some modes,
-like ``NanGuardMode`` and ``DebugMode``, add logic around the optimizer and
+like ``NanGuardMode`` and ``DebugMode``, add logic around the
-linker. ``NanGuardMode`` and ``DebugMode`` use their own linker.
+optimizer and linker. ``DebugMode`` uses its own linker.
 You can select which linker to use with the Theano flag :attr:`config.linker`.
 Here is a table to compare the different linkers.
@@ -183,7 +183,7 @@ c|py [#cpy1]_  yes        yes                "+++"      Try C code. If none exis
 c|py_nogc      no         yes                "++"       As c|py, but without gc
 c              no         yes                "+"        Use only C code (if none available for an op, raise an error)
 py             yes        yes                "+++"      Use only Python code
-NanGuardMode    no         no                 "++++"    Check if nodes generate NaN
+NanGuardMode   yes        yes                "++++"     Check if nodes generate NaN
 DebugMode      no         yes                VERY HIGH  Make many checks on what Theano computes
 =============  =========  =================  =========  ===

--- a/theano/compile/nanguardmode.py
+++ b/theano/compile/nanguardmode.py
@@ -73,7 +73,7 @@ def contains_nan(arr, node=None):
    elif arr.size == 0:
        return False
    elif cuda.cuda_available and isinstance(arr, cuda.CudaNdarray):
-        if (hasattr(theano.sandbox, 'rng_mrg') and
+        if (node and hasattr(theano.sandbox, 'rng_mrg') and
            isinstance(
                node.op,
                # It store ints in float container
@@ -119,7 +119,7 @@ def contains_inf(arr, node=None):
    elif arr.size == 0:
        return False
    elif cuda.cuda_available and isinstance(arr, cuda.CudaNdarray):
-        if (hasattr(theano.sandbox, 'rng_mrg') and
+        if (node and hasattr(theano.sandbox, 'rng_mrg') and
            isinstance(
                node.op,
                # It store ints in float container
@@ -215,7 +215,7 @@ class NanGuardMode(Mode):
        assert nan_is_error or inf_is_error or big_is_error
        compile_gpu_func(nan_is_error, inf_is_error, big_is_error)
-        def do_check_on(var, nd, f, is_input):
+        def do_check_on(var, nd):
            """
            Checks `var` for NaNs / Infs. If detected, raises an exception
            and / or prints information about `nd`, `f`, and `is_input` to
@@ -227,11 +227,6 @@ class NanGuardMode(Mode):
                The value to be checked.
            nd : theano.gof.Apply
                The Apply node being executed.
-            f : callable
-                The thunk for the apply node.
-            is_input : bool
-                If True, `var` is an input to `nd`.
-                If False, it is an output.
            """
            error = False
@@ -262,17 +257,13 @@ class NanGuardMode(Mode):
                    print('Big value detected', file=sio)
                    error = True
            if error:
-                if not is_input:
+                if nd:
-                    print("NanGuardMode found an error in the"
+                    print("NanGuardMode found an error in the "
-                          " output of a node in this variable:", file=sio)
+                          "output of a node in this variable:", file=sio)
                    print(theano.printing.debugprint(nd, file='str'), file=sio)
                else:
-                    print("NanGuardMode found an error in an"
+                    print("NanGuardMode found an error in an input of the "
-                          " input of this node.", file=sio)
+                          "graph.", file=sio)
-                    print('Node:', file=sio)
-                    print(nd, file=sio)
-                    print("The input variable that cause problem:", file=sio)
-                    print(theano.printing.debugprint(nd, file='str'), file=sio)
                msg = sio.getvalue()
                if config.NanGuardMode.action == 'raise':
                    raise AssertionError(msg)
@@ -283,36 +274,16 @@ class NanGuardMode(Mode):
                elif config.NanGuardMode.action == 'warn':
                    logger.error(msg)
-        def nan_check(i, node, fn):
+        def nan_check(node, thunk, storage_map, compute_map):
-            """
+            for var in node.outputs:
-            Runs `fn` while checking its inputs and outputs for NaNs / Infs.
-            Parameters
-            ----------
-            i :
-                Currently ignored.
-                TODO: determine why it is here or remove).
-            node : theano.gof.Apply
-                The Apply node currently being executed.
-            fn : callable
-                The thunk to execute for this Apply node.
-            """
-            inputs = fn.inputs
-            for x, var in zip(inputs, node.inputs):
-                # If the input is the result of computation, then we
-                # don't need to check it. It is already done after the
-                # computation.
-                if (var.owner is None and
-                        getattr(var.tag, 'nan_guard_mode_check', True)):
-                    do_check_on(x[0], node, fn, True)
-            fn()
-            outputs = fn.outputs
-            for x, var in zip(outputs, node.outputs):
                if getattr(var.tag, 'nan_guard_mode_check', True):
-                    do_check_on(x[0], node, fn, False)
+                    do_check_on(storage_map[var][0], node)
+        def nan_check_input(var, value):
+            if getattr(var.tag, 'nan_guard_mode_check', True):
+                do_check_on(value, None)
-        wrap_linker = theano.gof.WrapLinker([theano.gof.OpWiseCLinker()],
+        wrap_linker = theano.gof.vm.VM_Linker(callback=nan_check,
-                                            nan_check)
+                                              callback_input=nan_check_input)
        super(NanGuardMode, self).__init__(wrap_linker,
                                           optimizer=self.provided_optimizer)
--- a/theano/gof/vm.py
+++ b/theano/gof/vm.py
@@ -327,7 +327,7 @@ class Stack(VM):
    def __init__(self, nodes, thunks, pre_call_clear,
                 storage_map, compute_map, fgraph, allow_gc,
-                 dependencies=None, callback=None):
+                 dependencies=None, callback=None, callback_input=None):
        super(Stack, self).__init__(nodes, thunks, pre_call_clear)
        self.allow_gc = allow_gc
@@ -340,6 +340,7 @@ class Stack(VM):
        self.compute_map = compute_map
        self.node_idx = node_idx = {}
        self.callback = callback
+        self.callback_input = callback_input
        ords = fgraph.orderings()
@@ -406,6 +407,8 @@ class Stack(VM):
        for k in self.storage_map:
            compute_map[k][0] = (k.owner is None)
+            if self.callback_input and compute_map[k][0]:
+                self.callback_input(k, self.storage_map[k][0])
        # apply_stack contains nodes
        if output_subset is not None:
@@ -679,6 +682,11 @@ class VM_Linker(link.LocalLinker):
        A callable object to call after each call to a thunk within
        the virtual machine.  It will be called with four arguments called
        'node', 'thunk', 'storage_map', and 'compute_map'.
+    callback_input
+        A callable object to call on each input to the graph
+        (variables with no owner).  This includes constants and shared
+        variables values.  It will be called with two arguments:
+        'var', 'value'.
    lazy
        Useful only when use_cloop is False. When lazy is None, use the
        theano flag vm.lazy value. Then if we have a None (default) we auto
@@ -695,8 +703,8 @@ class VM_Linker(link.LocalLinker):
    """
    def __init__(self, allow_gc=None, use_cloop=False, callback=None,
-                 lazy=None, schedule=None, c_thunks=None,
+                 callback_input=None, lazy=None, schedule=None,
-                 allow_partial_eval=None):
+                 c_thunks=None, allow_partial_eval=None):
        # Note: if more parameters are added to __init__, make sure to forward
        # them in the "type(self)(...)" call in the "accept" method below.
        if allow_gc is None:
@@ -705,6 +713,7 @@ class VM_Linker(link.LocalLinker):
        self.allow_gc = allow_gc
        self.use_cloop = use_cloop
        self.callback = callback
+        self.callback_input = callback_input
        self.lazy = lazy
        self.c_thunks = c_thunks
        self.allow_partial_eval = allow_partial_eval
@@ -752,9 +761,11 @@ class VM_Linker(link.LocalLinker):
                allow_gc=self.allow_gc,
                use_cloop=self.use_cloop,
                callback=self.callback,
+                callback_input=self.callback_input,
                lazy=self.lazy,
                schedule=self.schedule,
                c_thunks=self.c_thunks,
+                allow_partial_eval=self.allow_partial_eval
            ).accept(fgraph, no_recycling)
        self.fgraph = fgraph
        self.no_recycling = no_recycling
@@ -821,16 +832,17 @@ class VM_Linker(link.LocalLinker):
        pre_call_clear = [storage_map[v] for v in self.no_recycling]
-        if (self.callback is not None or
+        if (self.callback is not None or self.callback_input is not None or
                (config.profile and config.profile_memory) or
-                getattr(self, 'allow_partial_eval', False)):
+                self.allow_partial_eval):
-            if self.use_cloop and self.callback is not None:
+            if self.use_cloop and (self.callback is not None or
+                                   self.callback_input is not None):
                logger.warn('CVM does not support callback, using Stack VM.')
            if self.use_cloop and config.profile_memory:
                warnings.warn(
                    'CVM does not support memory profile, using Stack VM.')
-            if self.use_cloop and getattr(self, 'allow_partial_eval', False):
+            if self.use_cloop and self.allow_partial_eval:
                warnings.warn(
                    'CVM does not support partial evaluation yet, '
                    'using Stack VM.')
@@ -841,7 +853,8 @@ class VM_Linker(link.LocalLinker):
                storage_map, compute_map,
                self.fgraph, self.allow_gc,
                dependencies=deps,
-                callback=self.callback)
+                callback=self.callback,
+                callback_input=self.callback_input)
        elif self.use_cloop:
            # create a map from nodes to ints and vars to ints
            nodes_idx = {}
@@ -1038,7 +1051,7 @@ class VM_Linker(link.LocalLinker):
        if lazy is None:
            lazy = not all([(not th.lazy) for th in thunks])
        if not (lazy or (config.profile and config.profile_memory) or
-                self.use_cloop or self.callback):
+                self.use_cloop or self.callback or self.callback_input):
            for pair in itervalues(reallocated_info):
                storage_map[pair[1]] = storage_map[pair[0]]
@@ -1080,3 +1093,7 @@ class VM_Linker(link.LocalLinker):
        self.__dict__.update(d)
        if not hasattr(self, 'c_thunks'):
            self.c_thunks = True
+        if not hasattr(self, 'allow_partial_eval'):
+            self.allow_partial_eval = None
+        if not hasattr(self, 'callback_input'):
+            self.callback_input = None