Merge pull request #2222 from SinaHonari/issue2196

DownsampleFactorMax support strides: issue #2196

Merge pull request #2222 from SinaHonari/issue2196
c2895dcf · Pascal Lamblin · 0bee6bb1 · 7518621d · c2895dcf · c2895dcf
--- a/theano/tensor/signal/downsample.py
+++ b/theano/tensor/signal/downsample.py
--- a/theano/tensor/signal/tests/test_downsample.py
+++ b/theano/tensor/signal/tests/test_downsample.py
 import unittest
+import __builtin__
 import numpy
 import theano.tensor as tensor
 from theano.tests import unittest_tools as utt
@@ -14,7 +15,7 @@ class TestDownsampleFactorMax(utt.InferShapeTester):
        '''Helper function, implementing max_pool_2d in pure numpy'''
        if len(input.shape) < 2:
            raise NotImplementedError('input should have at least 2 dim,'
-                                      ' shape is %s'\
+                                      ' shape is %s'
                                      % str(input.shape))
        xi = 0
        yi = 0
@@ -37,6 +38,64 @@ class TestDownsampleFactorMax(utt.InferShapeTester):
                    output_val[k][i, j] = numpy.max(patch)
        return output_val

+    @staticmethod
+    def numpy_max_pool_2d_stride(input, ds, ignore_border=False, st=None):
+        '''Helper function, implementing max_pool_2d in pure numpy
+           this function provides st input to indicate the stide size
+           for the pooling regions. if not indicated, st == sd.'''
+        if len(input.shape) < 2:
+            raise NotImplementedError('input should have at least 2 dim,'
+                                      ' shape is %s'
+                                      % str(input.shape))
+
+        if st is None:
+            st = ds
+        xi = 0
+        yi = 0
+        img_rows = input.shape[-2]
+        img_cols = input.shape[-1]
+
+        out_r = 0
+        out_c = 0
+        if img_rows - ds[0] >= 0:
+            out_r = (img_rows - ds[0]) // st[0] + 1
+        if img_cols - ds[1] >= 0:
+            out_c = (img_cols - ds[1]) // st[1] + 1
+
+        if not ignore_border:
+            if out_r > 0:
+                if img_rows - ((out_r - 1) * st[0] + ds[0]) > 0:
+                    rr = img_rows - out_r * st[0]
+                    if rr > 0:
+                        out_r += 1
+            else:
+                if img_rows > 0:
+                        out_r += 1
+            if out_c > 0:
+                if img_cols - ((out_c - 1) * st[1] + ds[1]) > 0:
+                    cr = img_cols - out_c * st[1]
+                    if cr > 0:
+                        out_c += 1
+            else:
+                if img_cols > 0:
+                        out_c += 1
+
+        out_shp = list(input.shape[:-2])
+        out_shp.append(out_r)
+        out_shp.append(out_c)
+
+        output_val = numpy.zeros(out_shp)
+        for k in numpy.ndindex(*input.shape[:-2]):
+            for i in range(output_val.shape[-2]):
+                ii_st = i * st[0]
+                ii_end = __builtin__.min(ii_st + ds[0], img_rows)
+                for j in range(output_val.shape[-1]):
+                    jj_st = j * st[1]
+                    jj_end = __builtin__.min(jj_st + ds[1], img_cols)
+                    patch = input[k][ii_st:ii_end, jj_st:jj_end]
+                    output_val[k][i, j] = numpy.max(patch)
+        return output_val
+
    def test_DownsampleFactorMax(self):
        rng = numpy.random.RandomState(utt.fetch_seed())
        # generate random images
@@ -59,10 +118,83 @@ class TestDownsampleFactorMax(utt.InferShapeTester):

                #DownsampleFactorMax op
                maxpool_op = DownsampleFactorMax(maxpoolshp,
-                                                 ignore_border=ignore_border)(images)
+                                                 ignore_border=
+                                                 ignore_border)(images)
                f = function([images], maxpool_op)
                output_val = f(imval)
-                assert (numpy.abs(output_val - numpy_output_val) < 1e-5).all()
+                utt.assert_allclose(output_val, numpy_output_val)
+
+    def test_DownsampleFactorMaxStride(self):
+        rng = numpy.random.RandomState(utt.fetch_seed())
+        maxpoolshps = ((1, 1), (3, 3), (5, 3))
+        stridesizes = ((1, 1), (3, 3), (5, 7))
+        # generate random images
+        imval = rng.rand(4, 10, 16, 16)
+        outputshps = ((4, 10, 16, 16), (4, 10, 6, 6), (4, 10, 4, 3),
+                      (4, 10, 16, 16), (4, 10, 6, 6), (4, 10, 4, 3),
+                      (4, 10, 14, 14), (4, 10, 5, 5), (4, 10, 3, 2),
+                      (4, 10, 14, 14), (4, 10, 6, 6), (4, 10, 4, 3),
+                      (4, 10, 12, 14), (4, 10, 4, 5), (4, 10, 3, 2),
+                      (4, 10, 12, 14), (4, 10, 5, 6), (4, 10, 4, 3))
+        images = tensor.dtensor4()
+        indx = 0
+        for maxpoolshp in maxpoolshps:
+            for ignore_border in [True, False]:
+                for stride in stridesizes:
+                    outputshp = outputshps[indx]
+                    indx += 1
+                    #DownsampleFactorMax op
+                    numpy_output_val = \
+                        self.numpy_max_pool_2d_stride(imval, maxpoolshp,
+                                                      ignore_border, stride)
+                    assert numpy_output_val.shape == outputshp, (
+                        "outshape is %s, calculated shape is %s"
+                        % (outputshp, numpy_output_val.shape))
+                    maxpool_op = \
+                        DownsampleFactorMax(maxpoolshp,
+                                            ignore_border=ignore_border,
+                                            st=stride)(images)
+                    f = function([images], maxpool_op)
+                    output_val = f(imval)
+                    utt.assert_allclose(output_val, numpy_output_val)
+
+    def test_DownsampleFactorMaxStrideExtra(self):
+        rng = numpy.random.RandomState(utt.fetch_seed())
+        maxpoolshps = ((5, 3), (5, 3), (5, 3), (5, 5), (3, 2), (7, 7), (9, 9))
+        stridesizes = ((3, 2), (7, 5), (10, 6), (1, 1),
+                       (2, 3), (10, 10), (1, 1))
+        imvsizs = ((16, 16), (16, 16), (16, 16), (8, 5),
+                   (8, 5), (8, 5), (8, 5))
+        outputshps = ((4, 10, 4, 7), (4, 10, 5, 8), (4, 10, 2, 3),
+                      (4, 10, 3, 4), (4, 10, 2, 3), (4, 10, 2, 3),
+                      (4, 10, 4, 1), (4, 10, 4, 1), (4, 10, 3, 2),
+                      (4, 10, 4, 2), (4, 10, 1, 0), (4, 10, 1, 1),
+                      (4, 10, 0, 0), (4, 10, 1, 1))
+        images = tensor.dtensor4()
+        for indx in numpy.arange(len(maxpoolshps)):
+            imvsize = imvsizs[indx]
+            imval = rng.rand(4, 10, imvsize[0], imvsize[1])
+            stride = stridesizes[indx]
+            maxpoolshp = maxpoolshps[indx]
+            for ignore_border in [True, False]:
+                indx_out = indx * 2
+                if not ignore_border:
+                    indx_out += 1
+                outputshp = outputshps[indx_out]
+                #DownsampleFactorMax op
+                numpy_output_val = \
+                    self.numpy_max_pool_2d_stride(imval, maxpoolshp,
+                                                  ignore_border, stride)
+                assert numpy_output_val.shape == outputshp, (
+                    "outshape is %s, calculated shape is %s"
+                    % (outputshp, numpy_output_val.shape))
+                maxpool_op = \
+                    DownsampleFactorMax(maxpoolshp,
+                                        ignore_border=ignore_border,
+                                        st=stride)(images)
+                f = function([images], maxpool_op)
+                output_val = f(imval)
+                utt.assert_allclose(output_val, numpy_output_val)

    def test_DownsampleFactorMax_grad(self):
        rng = numpy.random.RandomState(utt.fetch_seed())
@@ -76,7 +208,8 @@ class TestDownsampleFactorMax(utt.InferShapeTester):
                #print 'ignore_border =', ignore_border
                def mp(input):
                    return DownsampleFactorMax(maxpoolshp,
-                                    ignore_border=ignore_border)(input)
+                                               ignore_border=
+                                               ignore_border)(input)
                utt.verify_grad(mp, [imval], rng=rng)

    def test_DownsampleFactorMaxGrad_grad(self):
@@ -133,7 +266,10 @@ class TestDownsampleFactorMax(utt.InferShapeTester):
                                                          ignore_border)
                output = max_pool_2d(images, maxpoolshp, ignore_border)
                output_val = function([images], output)(imval)
-                assert numpy.all(output_val == numpy_output_val)
+                assert numpy.all(output_val == numpy_output_val), (
+                    "output_val is %s, numpy_output_val is %s"
+                    % (output_val, numpy_output_val))
+
                def mp(input):
                    return max_pool_2d(input, maxpoolshp, ignore_border)
                utt.verify_grad(mp, [imval], rng=rng)
@@ -152,7 +288,9 @@ class TestDownsampleFactorMax(utt.InferShapeTester):
                                                          ignore_border)
                output = max_pool_2d(images, maxpoolshp, ignore_border)
                output_val = function([images], output)(imval)
-                assert numpy.all(output_val == numpy_output_val)
+                assert numpy.all(output_val == numpy_output_val), (
+                    "output_val is %s, numpy_output_val is %s"
+                    % (output_val, numpy_output_val))
                c = tensor.sum(output)
                c_val = function([images], c)(imval)
                g = tensor.grad(c, images)
@@ -218,7 +356,8 @@ class TestDownsampleFactorMax(utt.InferShapeTester):
                gz_val = rng.rand(*out_shapes[i][j])
                self._compile_and_check([image, maxout, gz],
                                        [DownsampleFactorMaxGrad(maxpoolshp,
-                        ignore_border=ignore_border)(image, maxout, gz)],
+                                        ignore_border=ignore_border)
+                                        (image, maxout, gz)],
                                        [image_val, maxout_val, gz_val],
                                        DownsampleFactorMaxGrad,
                                        warn=False)