initial changes

304a4fd9 · Amjad Almahairi · 3431cc8d · 304a4fd9 · 304a4fd9
--- a/theano/sandbox/multinomial.py
+++ b/theano/sandbox/multinomial.py
@@ -33,7 +33,7 @@ class MultinomialFromUniform(Op):
        except AttributeError:
            self.odtype = 'auto'
-    def make_node(self, pvals, unis):
+    def make_node(self, pvals, unis, n):
        pvals = T.as_tensor_variable(pvals)
        unis = T.as_tensor_variable(unis)
        if pvals.ndim != 2:
@@ -45,18 +45,18 @@ class MultinomialFromUniform(Op):
        else:
            odtype = self.odtype
        out = T.tensor(dtype=odtype, broadcastable=pvals.type.broadcastable)
-        return Apply(self, [pvals, unis], [out])
+        return Apply(self, [pvals, unis, n], [out])
    def grad(self, ins, outgrads):
-        pvals, unis = ins
+        pvals, unis, n = ins
        (gz,) = outgrads
        return [T.zeros_like(x) for x in ins]
-    def c_code_cache_version(self):
+#    def c_code_cache_version(self):
-        return (6,)
+#        return (6,)
    def c_code(self, node, name, ins, outs, sub):
-        (pvals, unis) = ins
+        (pvals, unis, ns) = ins
        (z,) = outs
        if self.odtype == 'auto':
            t = "PyArray_TYPE(%(pvals)s)" % locals()
@@ -106,29 +106,42 @@ class MultinomialFromUniform(Op):
        const int nb_multi = PyArray_DIMS(%(pvals)s)[0];
        const int nb_outcomes = PyArray_DIMS(%(pvals)s)[1];
+        const int nb_samples = %(ns)s;
        //
        // For each multinomial, loop over each possible outcome
        //
-        for (int n = 0; n < nb_multi; ++n)
+        for (int c = 0; c < nb_samples; ++c){
-        {
+            for (int n = 0; n < nb_multi; ++n)
-            int waiting = 1;
-            dtype_%(pvals)s cummul = 0.;
-            const dtype_%(unis)s* unis_n = (dtype_%(unis)s*)PyArray_GETPTR1(%(unis)s, n);
-            for (int m = 0; m < nb_outcomes; ++m)
            {
-                dtype_%(z)s* z_nm = (dtype_%(z)s*)PyArray_GETPTR2(%(z)s, n,m);
+                int waiting = 1;
-                const dtype_%(pvals)s* pvals_nm = (dtype_%(pvals)s*)PyArray_GETPTR2(%(pvals)s, n,m);
+                dtype_%(pvals)s cummul = 0.;
-                cummul += *pvals_nm;
+                const dtype_%(unis)s* unis_n = (dtype_%(unis)s*)PyArray_GETPTR1(%(unis)s, c*nb_samples + n);
-                if (waiting && (cummul > *unis_n))
+                for (int m = 0; m < nb_outcomes; ++m)
                {
-                    *z_nm = 1.;
+                    dtype_%(z)s* z_nm = (dtype_%(z)s*)PyArray_GETPTR2(%(z)s, n,m);
-                    waiting = 0;
+                    const dtype_%(pvals)s* pvals_nm = (dtype_%(pvals)s*)PyArray_GETPTR2(%(pvals)s, n,m);
-                }
+                    cummul += *pvals_nm;
-                else
+                    if (c == 0)
-                {
+                    {
-                    // if we re-used old z pointer, we have to clear it out.
+                        if (waiting && (cummul > *unis_n))
-                    *z_nm = 0.;
+                        {
+                            *z_nm = 1.;
+                            waiting = 0;
+                        }
+                        else
+                        {
+                            // if we re-used old z pointer, we have to clear it out.
+                            *z_nm = 0.;
+                        }
+                    }
+                    else {
+                        if (waiting && (cummul > *unis_n))
+                        {
+                            *z_nm = *z_nm + 1.;
+                            waiting = 0;
+                        }
+                    }
                }
            }
        }
@@ -136,10 +149,10 @@ class MultinomialFromUniform(Op):
        """ % locals()
    def perform(self, node, ins, outs):
-        (pvals, unis) = ins
+        (pvals, unis, n_samples) = ins
        (z,) = outs
-        if unis.shape[0] != pvals.shape[0]:
+        if unis.shape[0] * n_samples != pvals.shape[0]:
            raise ValueError("unis.shape[0] != pvals.shape[0]",
                             unis.shape[0], pvals.shape[0])
        if z[0] is None or z[0].shape != pvals.shape:
@@ -346,7 +359,7 @@ class GpuMultinomialFromUniform(MultinomialFromUniform, GpuOp):
 @local_optimizer([MultinomialFromUniform])
 def local_gpu_multinomial(node):
    if type(node.op) is MultinomialFromUniform:
-        p, u = node.inputs
+        p, u, n_samples = node.inputs
        m, = node.outputs
        if (p.dtype == u.dtype == m.dtype == 'float32' and
            any([i.owner and isinstance(i.owner.op,
@@ -359,7 +372,7 @@ def local_gpu_multinomial(node):
            node.inputs[0].owner and
            type(node.inputs[0].owner.op) is MultinomialFromUniform):
        multi = node.inputs[0].owner
-        p, u = multi.inputs
+        p, u, n_samples = multi.inputs
        m, = multi.outputs
        if (p.dtype == u.dtype == m.dtype == 'float32'):
            gpu_op = GpuMultinomialFromUniform(multi.op.odtype)

--- a/theano/sandbox/rng_mrg.py
+++ b/theano/sandbox/rng_mrg.py
@@ -19,7 +19,7 @@ from theano.tensor import (raw_random, TensorType, as_tensor_variable,
 from theano.tensor import sqrt, log, sin, cos, join, prod
 from theano.compile import optdb
 from theano.gof import local_optimizer
+from theano.scalar import constant
 from . import multinomial
 from theano.sandbox.cuda import cuda_available, cuda_enabled, GpuOp
@@ -1318,9 +1318,10 @@ class MRG_RandomStreams(object):
    def multinomial(self, size=None, n=1, pvals=None, ndim=None, dtype='int64',
                    nstreams=None):
        """
-        Sample `n` (currently `n` needs to be 1) times from a multinomial
+        Sample `n` (currently `n` needs to be > 1) times from a multinomial
        distribution defined by probabilities pvals.
+        TODO: MODIFY_ME
        Example : pvals = [[.98, .01, .01], [.01, .98, .01]] will
        probably result in [[1,0,0],[0,1,0]].
@@ -1345,25 +1346,31 @@ class MRG_RandomStreams(object):
                    "The specified size contains a dimension with value <= 0",
                    size)
-        if n == 1 and pvals.ndim == 2:
+        if size is not None:
-            if size is not None:
+            raise ValueError("Provided a size argument to "
-                raise ValueError("Provided a size argument to "
+                             "MRG_RandomStreams.multinomial, which does not use "
-                        "MRG_RandomStreams.multinomial, which does not use "
+                             "the size argument.")
-                        "the size argument.")
+        if ndim is not None:
-            if ndim is not None:
+            raise ValueError("Provided an ndim argument to "
-                raise ValueError("Provided an ndim argument to "
+                             "MRG_RandomStreams.multinomial, which does not use "
-                        "MRG_RandomStreams.multinomial, which does not use "
+                             "the ndim argument.")
-                        "the ndim argument.")
+        if pvals.ndim == 2:
-            ndim, size, bcast = raw_random._infer_ndim_bcast(
+            if n == 1:
-                    ndim, size, pvals[:, 0])
+                size = pvals[:,0].shape
-            assert ndim == 1
+                unis = self.uniform(size=size, ndim=1, nstreams=nstreams)
-            bcast = bcast + (pvals.type.broadcastable[-1],)
+                op = multinomial.MultinomialFromUniform(dtype)
-            unis = self.uniform(size=size, ndim=1, nstreams=nstreams)
+                n_samples = constant(n)
-            op = multinomial.MultinomialFromUniform(dtype)
+                return op(pvals, unis, n_samples)
-            return op(pvals, unis)
+            elif n > 1:
+                # size = pvals[:,0].shape * n
+                # unis = self.uniform(size=size, ndim=1, nstreams=nstreams)
+                raise NotImplementedError('under construction!')
+            else:
+                raise NotImplementedError(("MRG_RandomStreams.multinomial only"
+                                           " implemented for n > 0"))
        else:
            raise NotImplementedError(("MRG_RandomStreams.multinomial only"
-                " implemented with n == 1 and pvals.ndim = 2"))
+                                       " implemented for pvals.ndim = 2"))
    def normal(self, size, avg=0.0, std=1.0, ndim=None,
               dtype=None, nstreams=None):