Fix for SupportCodeError and KeyError

9dfbff30 · sentient07 · 3f9d0601 · 9dfbff30 · 9dfbff30
--- a/theano/compile/profiling.py
+++ b/theano/compile/profiling.py
@@ -54,7 +54,7 @@ def _atexit_print_fn():
        destination_file = open(config.profiling.destination, 'w')
    for ps in _atexit_print_list:
-        if ps.fct_callcount or ps.compile_time > 0:
+        if ps.fct_callcount > 1 or ps.compile_time > 1:
            ps.summary(file=destination_file,
                       n_ops_to_print=config.profiling.n_ops,
                       n_apply_to_print=config.profiling.n_apply)

--- a/theano/gpuarray/opt.py
+++ b/theano/gpuarray/opt.py
@@ -164,12 +164,7 @@ def op_lifter(OP, cuda_only=False):
                clients = [c for o in node.outputs for c in o.clients]
                # list of list containing clients
                # it is clients per node basis
-                out_clients = []
+                out_clients = [o.clients for o in node.outputs]
-                for o in node.outputs:
-                    if o.clients:
-                        out_clients.append(o.clients)
-                    else:
-                        out_clients.append([])
                if not replace:
                    # We replace if *all* clients are on the GPU
@@ -268,7 +263,6 @@ class GraphToGPU(Optimizer):
    def apply(self, fgraph):
        mapping = {}
-        move_to_GPU = True
        # Building a new graph
        # Iterating through inputs of graph
@@ -288,27 +282,22 @@ class GraphToGPU(Optimizer):
                continue
            # Move only if any of the inputs are on the GPU.
-            move_to_GPU = True
+            move_to_GPU = False
-            '''
            if any([isinstance(i, GpuArrayVariable) or
                    isinstance(i, GpuArraySharedVariable)
                    for i in [mapping[v] for v in node.inputs] +
                              node.outputs]):
                move_to_GPU = True
-            '''
-            out_clients = []
+            out_clients = [o.clients for o in node.outputs]
-            for o in node.outputs:
-                if o.clients:
-                    out_clients.append(o.clients)
-                else:
-                    out_clients.append([])
            context_name = None
            for i in [mapping[i] for i in node.inputs]:
                if isinstance(i.type, GpuArrayType):
                    context_name = i.type.context_name
+                    move_to_GPU = True
                    break
            new_ops = None
@@ -769,7 +758,6 @@ def local_gpua_split(op, context_name, inputs):
 @register_opt2([tensor.Subtensor], 'fast_compile')
 def local_gpua_subtensor(op, context_name, inputs, clients):
    x = inputs[0]
-    node = op.make_node(*inputs)
    if (x.owner and isinstance(x.owner.op, HostFromGpu)):
        gpu_x = x.owner.inputs[0]
        if (gpu_x.owner and
@@ -781,8 +769,6 @@ def local_gpua_subtensor(op, context_name, inputs, clients):
                                              for v in n.inputs + n.outputs])
                        for n, _ in clients[0]]):
                    return
-                else:
-                    return [host_from_gpu(gpu_x.owner.op(node.outputs[0]))]
    return GpuSubtensor(op.idx_list)