Documentation

444f7d56 · Vikram · d6a9018a · 444f7d56 · 444f7d56 · 444f7d56
--- a/theano/gpuarray/blas.py
+++ b/theano/gpuarray/blas.py
@@ -449,8 +449,8 @@ class BaseGpuCorrMM(CGpuKernelBase):
    Parameters
    ----------
    border_mode : {'valid', 'full', 'half'}
-        Additionally, the padding size could be directly specified by an integer
+        Additionally, the padding size could be directly specified by an integer,
-        or a pair of integers
+        a pair of integers, or two pairs of integers.
    subsample
        Perform subsampling of the output (default: (1, 1)).
    filter_dilation

--- a/theano/tensor/nnet/__init__.py
+++ b/theano/tensor/nnet/__init__.py
@@ -72,21 +72,30 @@ def conv2d(input, filters, input_shape=None, filter_shape=None,
        You can give ``None`` for any element of the list to specify that this
        element is not known at compile time.
-    border_mode: str, int or tuple of two int
+     border_mode: str, int or tuple of ``convdim`` elements where each element
+        is an integer or a tuple of length 2.
        Either of the following:
        ``'valid'``: apply filter wherever it completely overlaps with the
            input. Generates output of shape: input shape - filter shape + 1
        ``'full'``: apply filter wherever it partly overlaps with the input.
            Generates output of shape: input shape + filter shape - 1
-        ``'half'``: pad input with a symmetric border of ``filter rows // 2``
+        ``'half'``: pad input with a symmetric border of ``filter size // 2``
-            rows and ``filter columns // 2`` columns, then perform a valid
+            in each convolution dimension, then perform a valid convolution.
-            convolution. For filters with an odd number of rows and columns, this
+            For filters with an odd filter size, this leads to the output
-            leads to the output shape being equal to the input shape.
+            shape being equal to the input shape.
        ``int``: pad input with a symmetric border of zeros of the given
            width, then perform a valid convolution.
-        ``(int1, int2)``: pad input with a symmetric border of ``int1`` rows
+        ``(int1, int2)``: (for 2D) pad input with a symmetric border of ``int1``,
-            and ``int2`` columns, then perform a valid convolution.
+            ``int2``, then perform a valid convolution.
+        ``(int1, (int2, int3))`` or ``((int1, int2), int3)``: (for 2D)
+            pad input with one symmetric border of `int1`` or ``int3``, and
+            one asymmetric border of ``(int2, int3)`` or ``(int1, int2)``.
+        ``((int1, int2), (int3, int4))``: (for 2D) pad input with an asymmetric
+            border of ``(int1, int2)`` along one dimension and ``(int3, int4)``
+            along the second dimension.
+        ``(int1, int2, int3)``: (for 3D) pad input with a symmetric border of
+            ``int1``, ``int2`` and ``int3``, then perform a valid convolution.
    subsample: tuple of len 2
        Factor by which to subsample the output.
@@ -199,7 +208,7 @@ def conv2d_transpose(input, filters, output_shape, filter_shape=None,
        You can give ``None`` for any element of the list to specify that this
        element is not known at compile time.
-    border_mode: str, int or tuple of two int
+    border_mode: str, int or tuple of two elements
        Refers to the ``border_mode`` argument of the corresponding forward
        (non-transposed) convolution. See the argument description in
        ``conv2d``.  What was ``padding`` for the forward convolution means

--- a/theano/tensor/nnet/abstract_conv.py
+++ b/theano/tensor/nnet/abstract_conv.py
@@ -55,7 +55,8 @@ def get_conv_output_shape(image_shape, kernel_shape,
    border_mode: string, int (symbolic or numeric) or tuple of int (symbolic
        or numeric). If it is a string, it must be 'valid', 'half' or 'full'.
        If it is a tuple, its two (or three) elements respectively correspond
-        to the padding on height and width (and possibly depth) axis.
+        to the padding (possibly left and right) on height and width
+        (and possibly depth) axis.
    subsample: tuple of int (symbolic or numeric). Its two or three elements
        espectively correspond to the subsampling on height and width (and
        possibly depth) axis.
@@ -103,9 +104,10 @@ def get_conv_shape_1axis(image_shape, kernel_shape, border_mode,
        given axis. None if undefined.
    kernel_shape: int or None. Corresponds to the kernel shape on a given
        axis. None if undefined.
-    border_mode: string or int. If it is a string, it must be
+    border_mode: string, int or tuple. If it is a string, it must be
        'valid', 'half' or 'full'. If it is an integer, it must correspond to
-        the padding on the considered axis.
+        the padding on the considered axis. If it is a tuple, its two elements
+        must correspond to the padding (left and right) on the desired axis.
    subsample: int. It must correspond to the subsampling on the
        considered axis.
    dilation: int. It must correspond to the dilation on the
@@ -174,7 +176,8 @@ def get_conv_gradweights_shape(image_shape, top_shape,
    border_mode: string, int (symbolic or numeric) or tuple of int (symbolic
        or numeric). If it is a string, it must be 'valid', 'half' or 'full'.
        If it is a tuple, its two (or three) elements respectively correspond
-        to the padding on height and width (and possibly depth) axis.
+        to the padding (possibly left and right) on height and width
+        (and possibly depth) axis.
    subsample: tuple of int (symbolic or numeric). Its two or three elements
        respectively correspond to the subsampling on height and width (and
        possibly depth) axis.
@@ -231,9 +234,10 @@ def get_conv_gradweights_shape_1axis(image_shape, top_shape, border_mode,
        given axis. None if undefined.
    top_shape: int or None. Corresponds to the top shape on a given axis.
        None if undefined.
-    border_mode: string or int. If it is a string, it must be
+    border_mode: string, int or tuple. If it is a string, it must be
        'valid', 'half' or 'full'. If it is an integer, it must correspond to
-        the padding on the considered axis.
+        the padding on the considered axis. If it is a tuple, its two elements
+        must correspond to the padding (left and right) on the desired axis.
    subsample: int. It must correspond to the subsampling on the
        considered axis.
    dilation: int. It must correspond to the dilation on the
@@ -295,7 +299,8 @@ def get_conv_gradinputs_shape(kernel_shape, top_shape,
    border_mode: string, int (symbolic or numeric) or tuple of int (symbolic
        or numeric). If it is a string, it must be 'valid', 'half' or 'full'.
        If it is a tuple, its two (or three) elements respectively correspond
-        to the padding on height and width (and possibly depth) axis.
+        to the padding (possibly left and right) on height and width
+        (and possibly depth) axis.
    subsample: tuple of int (symbolic or numeric). Its two or three elements
        respectively correspond to the subsampling on height and width (and
        possibly depth) axis.
@@ -349,9 +354,10 @@ def get_conv_gradinputs_shape_1axis(kernel_shape, top_shape, border_mode,
        axis. None if undefined.
    top_shape: int or None. Corresponds to the top shape on a given axis.
        None if undefined.
-    border_mode: string or int. If it is a string, it must be
+    border_mode: string, int or tuple. If it is a string, it must be
        'valid', 'half' or 'full'. If it is an integer, it must correspond to
-        the padding on the considered axis.
+        the padding on the considered axis. If it is a tuple, its two elements
+        must correspond to the padding (left and right) on the desired axis.
    subsample: int. It must correspond to the subsampling on the
        considered axis.
    dilation: int. It must correspond to the dilation on the
@@ -417,8 +423,9 @@ def check_conv_gradinputs_shape(image_shape, kernel_shape, output_shape,
        output shape. Its four (or five) elements must correspond respectively
        to: batch size, number of output channels, height and width
        (and possibly depth) of the output. None where undefined.
-    border_mode: string, int (symbolic or numeric) or tuple of int (symbolic
+    border_mode: string, int (symbolic or numeric) or tuple where each element
-        or numeric). If it is a string, it must be 'valid', 'half' or 'full'.
+        is either an int or a tuple of length 2 (symbolic or numeric).
+        If it is a string, it must be 'valid', 'half' or 'full'.
        If it is a tuple, its two (or three) elements respectively correspond
        to the padding on height and width (and possibly depth) axis.
    subsample: tuple of int (symbolic or numeric). Its two or three elements
@@ -547,6 +554,26 @@ def assert_shape(x, expected_shape, msg='Unexpected shape.'):
 def mode_to_pad(mode, convdim, kshp):
+    """ Computes a tuple for padding given the border_mode parameter
+    Parameters
+    ----------
+    mode : int or tuple
+        One of "valid", "full", "half", an integer, or a tuple where each
+        member is either an integer or a tuple of 2 positive integers.
+    convdim : int
+        The dimensionality of the convolution.
+    kshp : List/tuple of length 'convdim', indicating the size of the
+        kernel in the spatial dimensions.
+    Returns
+    -------
+    A tuple containing 'convdim' elements, each of which is a tuple of
+    two positive integers corresponding to the padding on the left
+    and the right sides respectively.
+    """
    if isinstance(mode, tuple):
        if len(mode) != convdim:
            raise ValueError(
@@ -681,6 +708,12 @@ def separable_conv2d(input,
            width, then perform a valid convolution.
        ``(int1, int2)``: pad input with a symmetric border of ``int1`` rows
            and ``int2`` columns, then perform a valid convolution.
+        ``(int1, (int2, int3))`` or ``((int1, int2), int3)``: (for 2D)
+            pad input with one symmetric border of `int1`` or ``int3``, and
+            one asymmetric border of ``(int2, int3)`` or ``(int1, int2)``.
+        ``((int1, int2), (int3, int4))``: (for 2D) pad input with an asymmetric
+            border of ``(int1, int2)`` along one dimension and ``(int3, int4)``
+            along the second dimension.
    subsample: tuple of len 2
        Factor by which to subsample the output.
@@ -1008,7 +1041,8 @@ def conv2d_grad_wrt_inputs(output_grad,
        Optional, possibly used  to choose an optimal implementation.
        You can give ``None`` for any element of the list to specify that
        this element is not known at compile time.
-    border_mode : str, int or tuple of two int
+     border_mode: str, int or tuple of 2 elements where each element
+        is an integer or a tuple of length 2.
        Either of the following:
          ``'valid'``
@@ -1035,6 +1069,14 @@ def conv2d_grad_wrt_inputs(output_grad,
            pad input with a symmetric border of ``int1`` rows and
            ``int2`` columns, then perform a valid convolution.
+          ``(int1, (int2, int3))`` or ``((int1, int2), int3)``
+            pad input with one symmetric border of `int1`` or ``int3``, and
+            one asymmetric border of ``(int2, int3)`` or ``(int1, int2)``.
+          ``((int1, int2), (int3, int4))``: (for 2D) pad input with an asymmetric
+            border of ``(int1, int2)`` along one dimension and ``(int3, int4)``
+            along the second dimension.
    subsample : tuple of len 2
        The subsampling used in the forward pass.  Also called strides
        elsewhere.
@@ -1294,7 +1336,8 @@ def conv2d_grad_wrt_weights(input,
        Optional, possibly used to choose an optimal implementation.
        You can give ``None`` for any element of the list to specify
        that this element is not known at compile time.
-    border_mode : str, int or tuple of two ints
+     border_mode: str, int or tuple of 2 elements where each element
+        is an integer or a tuple of length 2.
        Either of the following:
          ``'valid'``
@@ -1320,6 +1363,14 @@ def conv2d_grad_wrt_weights(input,
          ``(int1, int2)``
            pad input with a symmetric border of ``int1`` rows and
            ``int2`` columns, then perform a valid convolution.
+          ``(int1, (int2, int3))`` or ``((int1, int2), int3)``
+            pad input with one symmetric border of `int1`` or ``int3``, and
+            one asymmetric border of ``(int2, int3)`` or ``(int1, int2)``.
+          ``((int1, int2), (int3, int4))``: (for 2D) pad input with an asymmetric
+            border of ``(int1, int2)`` along one dimension and ``(int3, int4)``
+            along the second dimension.
    subsample : tuple of len 2
        The subsampling used in the forward pass of the convolutional
        operation.  Also called strides elsewhere.
@@ -1542,6 +1593,54 @@ def causal_conv(input,
                filter_dilation=1,
                num_groups=1,
                unshared=False):
+    """Computes (dilated) causal convolution
+    The output at time t depends only on the inputs till t-1. Used for
+    modelling temporal data.
+    See [WaveNet: A Generative Model for Raw Audio, section 2.1]
+    (https://arxiv.org/abs/1609.03499).
+    Parameters
+    ----------
+    input : symbolic 3D tensor
+        mini-batch of feature vector stacks, of shape
+        (batch_size, input_channels, input_length)
+        See the optional parameter ``input_shape``
+    filters : symbolic 3D tensor
+        Set of filters used in the CNN, of shape
+        (output_channels, input_channels, filter_length)
+    filter_shape : [None/int/Constant] * 2 + [Tensor/int/Constant]
+        The shape of the filters parameter.
+        A tuple/list of len 3, with the first two dimensions
+        being None or int or Constant and the last dimension being
+        Tensor or int or Constant.
+        Not optional, since the filter length is needed to calculate
+        the left padding for causality.
+    input_shape : None or [None/int/Constant] * 3
+        The shape of the input parameter.
+        None, or a tuple/list of len 3.
+        Optional, possibly used to choose an optimal implementation.
+    subsample : int
+        The factor by which to subsample the output. Also called strides
+        elsewhere.
+    filter_dilation : int
+        Factor by which to subsample (stride) the input. Also called
+        dilation factor.
+    num_groups : int
+        Divides the image, kernel and output tensors into num_groups
+        separate groups. Each which carry out convolutions separately
+    unshared: bool
+        If true, then unshared or 'locally connected' convolution will be
+        performed. A different filter will be used for each region of the
+        input.
+    Returns
+    -------
+    Symbolic 3D tensor.
+        Set of feature vectors generated by convolutional layer. Tensor is
+        of shape (batch_size, output_channels, output_length)
+    """
    input = as_tensor_variable(input)
    filters = as_tensor_variable(filters)
@@ -1786,7 +1885,8 @@ class BaseAbstractConv(Op):
        element is not known at compile time.
        kshp is defined w.r.t the forward conv.
-     border_mode: str, int or tuple of ``convdim`` ints
+     border_mode: str, int or tuple of ``convdim`` elements where each element
+        is an integer or a tuple of length 2.
        Either of the following:
        ``'valid'``: apply filter wherever it completely overlaps with the
@@ -1801,6 +1901,12 @@ class BaseAbstractConv(Op):
            width, then perform a valid convolution.
        ``(int1, int2)``: (for 2D) pad input with a symmetric border of ``int1``,
            ``int2``, then perform a valid convolution.
+        ``(int1, (int2, int3))`` or ``((int1, int2), int3)``: (for 2D)
+            pad input with one symmetric border of `int1`` or ``int3``, and
+            one asymmetric border of ``(int2, int3)`` or ``(int1, int2)``.
+        ``((int1, int2), (int3, int4))``: (for 2D) pad input with an asymmetric
+            border of ``(int1, int2)`` along one dimension and ``(int3, int4)``
+            along the second dimension.
        ``(int1, int2, int3)``: (for 3D) pad input with a symmetric border of
            ``int1``, ``int2`` and ``int3``, then perform a valid convolution.

--- a/theano/tensor/nnet/corr.py
+++ b/theano/tensor/nnet/corr.py
@@ -34,8 +34,8 @@ class BaseCorrMM(gof.OpenMPOp):
    Parameters
    ----------
    border_mode : {'valid', 'full', 'half'}
-        Additionally, the padding size could be directly specified by an integer
+        Additionally, the padding size could be directly specified by an integer,
-        or a pair of integers
+        a pair of integers, or two pairs of integers.
    subsample
        Perform subsampling of the output (default: (1, 1)).
    filter_dilation