Implement a struct generator for wrapping ops params.

8160671a · notoraptor · 0c53fb52 · 8160671a · 8160671a · 8160671a
--- a/theano/common/__init__.py
+++ b/theano/common/__init__.py
+from __future__ import absolute_import, print_function, division
+from .wrapper import Wrapper, Wrap
--- a/theano/common/tests/__init__.py
+++ b/theano/common/tests/__init__.py
+from __future__ import absolute_import, print_function, division
--- a/theano/common/tests/test_wrapper.py
+++ b/theano/common/tests/test_wrapper.py
+from __future__ import absolute_import, print_function, division
+import theano
+import numpy
+from theano.gof import Op, Apply
+from theano.tensor import TensorType
+from theano.common import Wrapper, Wrap
+from theano import config
+from theano import tensor
+from theano.tests import unittest_tools as utt
+# Float dtype taken from the Theano configuration; it is used for the random
+# test inputs and to build the C type name of the wrapped coefficients.
+dtype = config.floatX
+# Tensor type built with an empty broadcastable tuple; it is the declared type
+# of every field (a, b, c) of the op's params_type below.
+ScalarType = TensorType(dtype, tuple())
+# A test op to compute `y = a*x^2 + b*x + c` for any tensor x,
+# such that a, b, c are parameters of that op.
+class QuadraticFunction(Op):
+    """Test op computing ``y = a*x**2 + b*x + c`` elementwise.
+    The coefficients ``a``, ``b`` and ``c`` are op properties. They are bundled
+    by ``get_params`` and handed to ``perform`` and to the generated C code.
+    """
+    __props__ = ('a', 'b', 'c')
+    # Every coefficient is declared with the module-level ScalarType.
+    params_type = Wrapper(a=ScalarType, b=ScalarType, c=ScalarType)
+    def __init__(self, a, b, c):
+        """Store the three coefficients of the quadratic function."""
+        self.a = a
+        self.b = b
+        self.c = c
+    def get_params(self, node):
+        """Return the coefficients bundled in a single ``Wrap`` object."""
+        return Wrap(a=self.a, b=self.b, c=self.c)
+    def make_node(self, x):
+        """Build the Apply node: one input ``x``, one output of the same type."""
+        x = tensor.as_tensor_variable(x)
+        return Apply(self, [x], [x.type()])
+    def perform(self, node, inputs, output_storage, coefficients):
+        """Python implementation; ``coefficients`` exposes ``a``, ``b`` and ``c``."""
+        x = inputs[0]
+        y = output_storage[0]
+        y[0] = coefficients.a * (x**2) + coefficients.b * x + coefficients.c
+    def c_code_cache_version(self):
+        """Version of the generated C code (bumped whenever that code changes)."""
+        return (1, 2)
+    def c_support_code_apply(self, node, name):
+        """Return the C helper that applies the quadratic function in place.
+        The helper is named after the C type of the node's input dtype.
+        """
+        float_type = node.inputs[0].type.dtype_specs()[1]
+        return """
+        /* Computes: x = a*x*x + b*x + c for x in matrix. */
+        int quadratic_%(float_type)s(PyArrayObject* matrix, %(float_type)s a, %(float_type)s b, %(float_type)s c) {
+            /* The iterator below is created without NPY_ITER_ZEROSIZE_OK,
+               so an empty array is handled here: there is nothing to compute. */
+            if (PyArray_SIZE(matrix) == 0) {
+                return 0;
+            }
+            NpyIter* iterator = NpyIter_New(matrix,
+                NPY_ITER_READWRITE | NPY_ITER_EXTERNAL_LOOP | NPY_ITER_REFS_OK,
+                NPY_KEEPORDER, NPY_NO_CASTING, NULL);
+            if(iterator == NULL) {
+                PyErr_SetString(PyExc_RuntimeError, "Unable to iterate over a matrix for an elemwise operation.");
+                return -1;
+            }
+            NpyIter_IterNextFunc* get_next = NpyIter_GetIterNext(iterator, NULL);
+            char** data_ptr = NpyIter_GetDataPtrArray(iterator);
+            npy_intp* stride_ptr = NpyIter_GetInnerStrideArray(iterator);
+            npy_intp* innersize_ptr = NpyIter_GetInnerLoopSizePtr(iterator);
+            do {
+                /* With NPY_ITER_EXTERNAL_LOOP, the inner loop is written by hand. */
+                char* data = *data_ptr;
+                npy_intp stride = *stride_ptr;
+                npy_intp count = *innersize_ptr;
+                while(count) {
+                    %(float_type)s x = *((%(float_type)s*)data);
+                    *((%(float_type)s*)data) = a*x*x + b*x + c;
+                    data += stride;
+                    --count;
+                }
+            } while(get_next(iterator));
+            NpyIter_Deallocate(iterator);
+            return 0;
+        }
+        """ % {'float_type': float_type}
+    def c_code(self, node, name, inputs, outputs, sub):
+        """Return the C code: copy the input into a fresh output, then update it in place.
+        The coefficients are read from ``sub['params']`` and cast to the C type
+        of the input before being passed to the ``quadratic_*`` helper.
+        """
+        X = inputs[0]
+        Y = outputs[0]
+        coeff = sub['params']
+        fail = sub['fail']
+        float_type = node.inputs[0].type.dtype_specs()[1]
+        float_typenum = numpy.dtype(node.inputs[0].type.dtype).num
+        # C type of the stored coefficients, which use the module-level dtype.
+        coeff_type = 'npy_' + numpy.dtype(dtype).name
+        return """
+        PyArrayObject* o_a = %(coeff)s.a;
+        PyArrayObject* o_b = %(coeff)s.b;
+        PyArrayObject* o_c = %(coeff)s.c;
+        /* The coefficient type is declared with an empty broadcastable pattern (0-d),
+           so the single element is read through PyArray_DATA rather than through
+           PyArray_GETPTR1, which is meant for arrays with at least one dimension. */
+        %(float_type)s a = (%(float_type)s) (*(%(coeff_type)s*) PyArray_DATA(o_a));
+        %(float_type)s b = (%(float_type)s) (*(%(coeff_type)s*) PyArray_DATA(o_b));
+        %(float_type)s c = (%(float_type)s) (*(%(coeff_type)s*) PyArray_DATA(o_c));
+        Py_XDECREF(%(Y)s);
+        %(Y)s = (PyArrayObject*)PyArray_EMPTY(PyArray_NDIM(%(X)s), PyArray_DIMS(%(X)s), %(float_typenum)s, PyArray_IS_F_CONTIGUOUS(%(X)s));
+        if (%(Y)s == NULL) {
+            /* Allocation failed: the Python error is already set by NumPy. */
+            %(fail)s
+        }
+        if (PyArray_CopyInto(%(Y)s, %(X)s) != 0) {
+            PyErr_SetString(PyExc_RuntimeError, "Unable to copy input into output.");
+            %(fail)s
+        }
+        if (quadratic_%(float_type)s(%(Y)s, a, b, c) != 0) {
+            PyErr_SetString(PyExc_RuntimeError, "Unable to compute quadratic function.");
+            %(fail)s
+        }
+        """ % locals()
+def test_wrapper():
+    """Check the compiled QuadraticFunction against a NumPy reference computation."""
+    # Seed the random generator so that a failing input can be reproduced.
+    utt.seed_rng()
+    a, b, c = 2, 3, -7
+    x = tensor.matrix()
+    y = QuadraticFunction(a, b, c)(x)
+    f = theano.function([x], y)
+    shape = (100, 100)
+    # The for-loop is here just to force profiling to print something interesting.
+    # When running this test without this loop, profiling prints neither the list
+    # of classes nor the list of ops (maybe because the function is extremely fast?).
+    for _ in range(50):
+        vx = numpy.random.normal(size=shape).astype(dtype)
+        vy = f(vx)
+        ref = a * (vx**2) + b * vx + c
+        utt.assert_allclose(ref, vy)
--- a/theano/common/wrapper.py
+++ b/theano/common/wrapper.py
--- a/theano/tests/test_flake8.py
+++ b/theano/tests/test_flake8.py
@@ -36,6 +36,7 @@ whitelist_flake8 = [
    "compat/six.py",  # This is bundled code that will be deleted, don't fix it
    "__init__.py",
    "tests/__init__.py",
+    "common/__init__.py",
    "compile/__init__.py",
    "compile/sandbox/__init__.py",
    "compile/tests/__init__.py",