custom_layers.py

__author__ = 'dudevil'

import theano
import theano.tensor as T
import numpy as np
from lasagne import layers
from theano.sandbox.rng_mrg import MRG_RandomStreams as RandomStreams


def leaky_relu(x, alpha=3.0):
    return T.maximum(x, x * (1.0 / alpha))

# Partition image into square chunks of equal size
class ImagePartitionLayer(layers.Layer):

    def __init__(self, incoming, image_side_ = 1024, patch_side_ = 128, name = None):
        super(ImagePartitionLayer, self).__init__(incoming, name)
        self.patch_side = patch_side_
        self.image_side = image_side_
        self.patches_per_side = self.image_side / self.patch_side
        self.patches_count = self.patches_per_side * self.patches_per_side
        
    def image_partition(self, image):
        parts = [None] * self.patches_count
        for x in range(self.patches_count):
            i1 = x % self.patches_per_side * self.patch_side
            i2 = i1 + self.patch_side
            j1 = x / self.patches_per_side * self.patch_side
            j2 = j1 + self.patch_side
            parts[x] = image[:, j1:j2, i1:i2].reshape((1,image.shape[0],self.patch_side,self.patch_side))
        return T.concatenate(parts, axis=0)   

    def get_output_shape_for(self, input_shape):
        out_shape = (input_shape[0] * self.patches_per_side * self.patches_per_side, input_shape[1], self.patch_side, self.patch_side)
        return out_shape

    def get_output_for(self, input, **kwargs):
        return T.concatenate([self.image_partition(input[i]) for i in range(self.input_shape[0])], axis=0)

# Assemble image from square chunks
class ImageAssembleLayer(layers.Layer):

    def __init__(self, incoming, image_side = 1024, patch_side = 128, name = None):
        super(ImageAssembleLayer, self).__init__(incoming, name)
        self.patch_side = patch_side
        self.image_side = image_side
        self.patches_per_side = self.image_side / self.patch_side
        self.patches_count = self.patches_per_side * self.patches_per_side

    def get_output_shape_for(self, input_shape):
        self.patches_per_side = (self.image_side / self.patch_side)
        out_shape = (input_shape[0] / (self.patches_per_side * self.patches_per_side), input_shape[1], input_shape[2] * self.patches_per_side, input_shape[3] * self.patches_per_side)
        return out_shape

    def get_chunks(self, l, n):
        """ Yield successive n-sized chunks from l."""
        for i in xrange(0, len(l), n):
            yield l[i:i+n]
        
    def get_output_for(self, input, **kwargs):
        chunks = list(self.get_chunks([input[i] for i in range(input.shape.eval()[0])], self.patches_count))
        result = [[T.concatenate([T.concatenate(line, axis=2) for line in list(self.get_chunks(chunk, self.patches_per_side))], axis=1)] for chunk in chunks]
        return T.concatenate(result, axis=0)


class SliceRotateLayer(layers.Layer):

    def __init__(self, incoming, name=None, patch_shape=(64, 64)):
        super(SliceRotateLayer, self).__init__(incoming, name)
        self.slice_shape = patch_shape

    def get_output_shape_for(self, input_shape):
        return input_shape[0] * 4, input_shape[1], self.slice_shape[0], self.slice_shape[1]

    def get_output_for(self, input, **kwargs):
        px, py = self.slice_shape # shortcut
        part0 = input[:, :, :px, :py] # 0 degrees
        part1 = input[:, :, :px, :-py-1:-1].dimshuffle(0, 1, 3, 2) # 90 degrees
        part2 = input[:, :, :-px-1:-1, :-py-1:-1] # 180 degrees
        part3 = input[:, :, :-px-1:-1, :py].dimshuffle(0, 1, 3, 2) # 270 degrees

        return T.concatenate([part0, part1, part2, part3], axis=0)


class RotateMergeLayer(layers.Layer):

    def get_output_shape_for(self, input_shape):
        return input_shape[0] // 4, np.prod(input_shape[1:]) * 4

    def get_output_for(self, input, **kwargs):
        input_r = input.reshape((4, self.input_shape[0] // 4, int(np.prod(self.input_shape[1:])))) # split out the 4* dimension
        return input_r.transpose(1, 0, 2).reshape(self.get_output_shape())


class StochasticPoolLayer(layers.Layer):

    def __init__(self, incoming, ds, strides=None, ignore_border=False, pad=(0, 0), random_state=42, **kwargs):
        super(StochasticPoolLayer, self).__init__(incoming, **kwargs)
        self.ds = ds
        self.ignore_border = ignore_border
        self.pad = pad
        self.st = ds if strides is None else strides
        if hasattr(random_state, 'multinomial'):
            self.rng = random_state
        else:
            self.rng = RandomStreams(seed=random_state)

    def get_output_shape_for(self, input_shape):
        output_shape = list(input_shape)  # copy / convert to mutable list
        output_shape[2] = pool_output_length(input_shape[2],
                                             ds=self.ds[0],
                                             st=self.st[0],
                                             ignore_border=self.ignore_border,
                                             pad=self.pad[0],
                                             )

        output_shape[3] = pool_output_length(input_shape[3],
                                             ds=self.ds[1],
                                             st=self.st[1],
                                             ignore_border=self.ignore_border,
                                             pad=self.pad[1],
                                             )

        return tuple(output_shape)

    def get_output_for(self, input, deterministic=False, **kwargs):
        # inspired by:
        # https://github.com/lisa-lab/pylearn2/blob/14b2f8bebce7cc938cfa93e640008128e05945c1/pylearn2/expr/stochastic_pool.py#L23
        batch, channels, nr, nc = self.input_shape
        pr, pc = self.ds
        sr, sc = self.st
        output_shape = self.get_output_shape()
        out_r, out_c = output_shape[2:]
        # calculate shape needed for padding
        pad_shape = list(output_shape)
        pad_shape[2] = (pad_shape[2] - 1) * sr + pr
        pad_shape[3] = (pad_shape[3] - 1) * sc + pc
        # allocate a new input tensor
        padded = T.alloc(0.0, *pad_shape)
        # get padding offset
        offset_x = (pad_shape[2] - nr) // 2
        offset_y = (pad_shape[3] - nc) // 2

        padded = T.set_subtensor(padded[:, :, offset_x:(offset_x + nr), offset_y:(offset_y + nc)], input)
        window = T.alloc(0.0, batch, channels, out_r, out_c, pr, pc)
        for row_within_pool in xrange(pr):
            row_stop = (output_shape[2] - 1) * sr + row_within_pool + 1
            for col_within_pool in xrange(pc):
                col_stop = (output_shape[3] - 1) * sc + col_within_pool + 1
                # theano dark magic
                win_cell = padded[:, :, row_within_pool:row_stop:sr, col_within_pool:col_stop:sc]
                window = T.set_subtensor(window[:, :, :, :, row_within_pool, col_within_pool], win_cell)
        # sum across pooling regions
        norm = window.sum(axis=[4, 5])
        norm = T.switch(T.eq(norm, 0.0), 1.0, norm)
        norm = window / norm.dimshuffle(0, 1, 2, 3, 'x', 'x')

        if deterministic:
            res = (window * norm).sum(axis=[4, 5])
        else:
            prob = self.rng.multinomial(pvals=norm.reshape((batch * channels * out_r * out_c, pr * pc)),
                                        dtype=theano.config.floatX)
            # double max because of grad problems
            res = (window * prob.reshape((batch, channels, out_r, out_c,  pr, pc))).max(axis=5).max(axis=4)

        return T.cast(res, theano.config.floatX)


class FractionalPool2DLayer(layers.Layer):
    """
    Fractional pooling as described in http://arxiv.org/abs/1412.6071
    Only the random overlapping mode is currently implemented.

    Implementaion adopted from this pull-request: https://github.com/Lasagne/Lasagne/pull/171/files
    """
    def __init__(self, incoming, ds, pool_function=T.max, random_state=42, **kwargs):
        super(FractionalPool2DLayer, self).__init__(incoming, **kwargs)
        if type(ds) is not tuple:
            raise ValueError("ds must be a tuple")
        if (not 1 <= ds[0] <= 2) or (not 1 <= ds[1] <= 2):
            raise ValueError("ds must be between 1 and 2")
        self.ds = ds  # a tuple
        self.rng = T.shared_randomstreams.RandomStreams(seed=random_state)
        if len(self.input_shape) != 4:
            raise ValueError("Only bc01 currently supported")
        self.pool_function = pool_function
        _, _, n_in0, n_in1 = self.input_shape
        _, _, n_out0, n_out1 = self.get_output_shape()
        self.a_init = np.array([2] * (n_in0 - n_out0) + [1] * (2 * n_out0 - n_in0), dtype=np.int8)
        self.b_init = np.array([2] * (n_in1 - n_out1) + [1] * (2 * n_out1 - n_in1), dtype=np.int8)
        self.a_shared = theano.shared(self.a_init, borrow=True)
        self.b_shared = theano.shared(self.b_init, borrow=True)

    def _theano_shuffled(self, input):
        n = input.shape[0]
        shuffled = T.permute_row_elements(input.T, self.rng.permutation(n=n)).T
        return shuffled

    def get_output_shape_for(self, input_shape):
        output_shape = list(input_shape) # copy / convert to mutable list
        output_shape[2] = int(np.ceil(float(output_shape[2]) / self.ds[0]))
        output_shape[3] = int(np.ceil(float(output_shape[3]) / self.ds[1]))

        return tuple(output_shape)

    def get_output_for(self, input, **kwargs):
        # _, _, n_in0, n_in1 = self.input_shape
        # _, _, n_out0, n_out1 = self.get_output_shape()

        # Variable stride across the input creates fractional reduction
        # a = theano.shared(
        #     np.array([2] * (n_in0 - n_out0) + [1] * (2 * n_out0 - n_in0), dtype=np.int8),
        #     borrow=True)
        # b = theano.shared(
        #     np.array([2] * (n_in1 - n_out1) + [1] * (2 * n_out1 - n_in1), dtype=np.int8),
        #     borrow=True)
        self.a_shared.set_value(self.a_init, borrow=True)
        self.b_shared.set_value(self.b_init, borrow=True)

        a, b = self.a_shared, self.b_shared
        # Randomize the input strides
        a = self._theano_shuffled(a)
        b = self._theano_shuffled(b)

        # Convert to input positions, starting at 0
        a = T.concatenate(([0], a[:-1]))
        b = T.concatenate(([0], b[:-1]))
        a = T.cumsum(a)
        b = T.cumsum(b)

        # Positions of the other corners
        c = T.clip(a + 1, 0, self.input_shape[2] - 1)
        d = T.clip(b + 1, 0, self.input_shape[3] - 1)

        # Index the four positions in the pooling window and stack them
        #shit won't fit in GPU memory
        temp = T.stack(input[:, :, a, :][:, :, :, b],
                       input[:, :, c, :][:, :, :, b],
                       input[:, :, a, :][:, :, :, d],
                       input[:, :, c, :][:, :, :, d])

        return self.pool_function(temp, axis=0)


class RandomizedReLu(layers.Layer):

    def __init__(self, input_layer, a_min=3., a_max=8., random_state=42):
        super(RandomizedReLu, self).__init__(input_layer)
        self.a_min = a_min
        self.a_max = a_max
        self.rng = RandomStreams(seed=random_state)

    def get_output_for(self, input, deterministic=False, **kwargs):
        if deterministic:
            res = T.maximum(input, 2 * input / (self.a_max - self.a_min))
        else:
            batch_size, channels, _, _ = self.get_output_shape()
            a = self.rng.uniform(size=(batch_size, channels), low=self.a_min, high=self.a_max)
            a = a.dimshuffle((0, 1, 'x', 'x'))
            res = T.maximum(input, input / a)
        return res


class ParametrizedReLu(layers.Layer):

    def __init__(self, input_layer, a_init=0.25):
        super(ParametrizedReLu, self).__init__(input_layer)
        self.input = input_layer
        self.a = theano.shared(np.cast[theano.config.floatX](a_init), name='a')

    def get_output_for(self, input, **kwargs):
        return T.maximum(0, input) + self.a * T.minimum(0, input)

    def get_bias_params(self):
        return [self.a]