fixes to make the behaviour of the cuda shared constructor more strict on…

Fixes to make the CUDA shared constructor stricter: it now accepts only float32 ndarrays and raises TypeError for anything else.

fixes to make the behaviour of the cuda shared constructor more strict on…
5ae8bc0c · James Bergstra · 91aa8472 · 5ae8bc0c · 5ae8bc0c
--- a/theano/sandbox/cuda/__init__.py
+++ b/theano/sandbox/cuda/__init__.py
@@ -94,7 +94,7 @@ if enable_cuda:
    from theano.sandbox.cuda.var import (CudaNdarrayVariable,
            CudaNdarrayConstant,
            CudaNdarraySharedVariable,
-            shared_constructor)
+            float32_shared_constructor)
    import basic_ops
    from basic_ops import (GpuFromHost, HostFromGpu, GpuElemwise, 
@@ -139,7 +139,7 @@ def handle_shared_float32(tf):
    """
    if tf:
        import theano.compile
-        theano.compile.shared_constructor(shared_constructor)
+        theano.compile.shared_constructor(float32_shared_constructor)
    else:
        raise NotImplementedError('removing our handler')

--- a/theano/sandbox/cuda/var.py
+++ b/theano/sandbox/cuda/var.py
@@ -65,7 +65,7 @@ class CudaNdarraySharedVariable(SharedVariable, _operators):
 CudaNdarrayType.SharedVariable = CudaNdarraySharedVariable
-def shared_constructor(value, name, strict=False, broadcastable=None):
+def cuda_shared_constructor(value, name, strict=False, broadcastable=None):
    """SharedVariable Constructor for TensorType"""
    #TODO: what should strict mean in this context, since we always have to make a copy?
@@ -82,17 +82,31 @@ def shared_constructor(value, name, strict=False, broadcastable=None):
    if broadcastable is None:
        broadcastable = (False,) * len(value.shape)
    type = CudaNdarrayType(broadcastable=broadcastable)
-    return CudaNdarraySharedVariable(type=type, value=_value, name=name, strict=strict)
+    print "trying to return?"
+    try:
+        rval = CudaNdarraySharedVariable(type=type, value=_value, name=name, strict=strict)
+    except Exception, e:
+        print "ERROR", e
+        raise
+    return rval
+def float32_shared_constructor(value, name, strict=False, broadcastable=None):
+    """SharedVariable Constructor for CudaNdarrayType (accepts only float32 ndarrays)"""
-def unset_shared_for_numpy():
+    # if value isn't a float32 ndarray, then raise
-    raise NotImplementedError()
+    if not isinstance(value, numpy.ndarray):
+        raise TypeError('ndarray required')
+    if value.dtype.num != CudaNdarrayType.typenum:
+        raise TypeError('float32 ndarray required')
-def set_shared_for_numpy():
+    if broadcastable is None:
-    """
+        broadcastable = (False,) * len(value.shape)
-    Set the gpu_tensor_constructor as the handler for ndarray
+    type = CudaNdarrayType(broadcastable=broadcastable)
-    """
+    deviceval = type_support_filter(value, broadcastable, False)
-    shared_constructor(shared_constructor)
+    try:
+        rval = CudaNdarraySharedVariable(type=type, value=deviceval, name=name, strict=strict)
+    except Exception, e:
+        print "ERROR", e
+        raise
+    return rval