# zoo/squeezenet/squeezenet_bypass_c.py

# Copyright 2019 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     https://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# SqueezeNet v1.0 with simple bypass/composable (2016)
# Paper: https://arxiv.org/pdf/1602.07360.pdf

import tensorflow as tf
from tensorflow.keras import Input, Model
from tensorflow.keras.layers import Conv2D, MaxPooling2D, Concatenate, Add, Dropout
from tensorflow.keras.layers import GlobalAveragePooling2D, Activation
from tensorflow.keras.regularizers import l2

import sys
sys.path.append('../')
from models_c import Composable

class SqueezeNetBypass(Composable):
    ''' Construct a SqueezeNet Bypass Convolution Neural Network '''
    # Meta-parameter: number of blocks and filters per group
    # Fire blocks with simple bypass on blocks 2, 4, 6 and 8
    # NOTE: the final entry is not built as a pooled group; learner() uses only
    # its first block as the closing fire block (no max pooling afterwards).
    groups = [ [ { 'n_filters' : 16, 'bypass': False },
                 { 'n_filters' : 16, 'bypass': True },
                 { 'n_filters' : 32, 'bypass': False } ],
               [ { 'n_filters' : 32, 'bypass': True },
                 { 'n_filters' : 48, 'bypass': False },
                 { 'n_filters' : 48, 'bypass': True },
                 { 'n_filters' : 64, 'bypass': False } ],
               [ { 'n_filters' : 64, 'bypass': True } ] ]

    # Initial Hyperparameters
    hyperparameters = { 'initializer': 'glorot_uniform',
                        'regularizer': l2(0.001),
                        'relu_clip'  : None,
                        'bn_epsilon' : None,
                        'use_bias'   : True
                      }

    def __init__(self, groups=None, dropout=0.5,
                 input_shape=(224, 224, 3), n_classes=1000, include_top=True,
                 **hyperparameters):
        ''' Construct a SqueezeNet Bypass Convolution Neural Network
            groups      : blocks/filters/bypass per group (None selects the
                          class default SqueezeNetBypass.groups)
            dropout     : dropout rate applied after the last fire block
            input_shape : input shape to model
            n_classes   : number of output classes
            include_top : whether to include classifier
            initializer : kernel initialization
            regularizer : kernel regularization
            relu_clip   : max value to relu
            bn_epsilon  : epsilon for batch norm
            use_bias    : whether to use bias in conjunction with batch norm
        '''
        # Configure base (super) class
        Composable.__init__(self, input_shape, include_top, self.hyperparameters, **hyperparameters)

        if groups is None:
            # Work on a copy so the class-level default is never shared directly
            groups = list(SqueezeNetBypass.groups)

        # The input shape
        inputs = Input(shape=input_shape)

        # The Stem Group
        x = self.stem(inputs)

        # The Learner
        outputs = self.learner(x, groups=groups, dropout=dropout)

        # The Classifier
        if include_top:
            outputs = self.classifier(outputs, n_classes)

        self._model = Model(inputs, outputs)

    def stem(self, inputs):
        ''' Construct the Stem Group
            inputs : input to the stem

            Returns the tensor after a 7x7 strided convolution (96 filters),
            ReLU and a 3x3 strided max pooling.
        '''
        x = self.Conv2D(inputs, 96, (7, 7), strides=2, padding='same')
        x = self.ReLU(x)
        x = MaxPooling2D(3, strides=2)(x)
        return x

    def learner(self, x, **metaparameters):
        ''' Construct the Learner
            x      : input to the learner
            groups : blocks/filters/bypass per group; every entry except the
                     last becomes a pooled fire group, and the first block of
                     the last entry becomes the closing fire block
            dropout: dropout rate

            The caller's groups sequence is left unmodified.
            Raises IndexError if groups is empty.
        '''
        groups  = metaparameters['groups']
        dropout = metaparameters['dropout']

        # Read the last group by index rather than pop(): popping would remove
        # the entry from the list object owned by the caller.
        last = groups[-1]

        # Add Fire groups, progressively increase number of filters
        for group in groups[:-1]:
            x = self.group(x, blocks=group, **metaparameters)

        # Last fire block (only the first block of the last group is used)
        x = self.fire_block(x, **last[0], **metaparameters)

        # Dropout is delayed to end of fire groups
        x = Dropout(dropout)(x)
        return x

    def group(self, x,  **metaparameters):
        ''' Construct the Fire Group
            x       : input to the group
            blocks  : number of filters/bypass per block in group

            Returns the tensor after all fire blocks and a trailing max pooling.
        '''
        blocks = metaparameters['blocks']

        for block in blocks:
            x = self.fire_block(x, **block, **metaparameters)

        # Delayed downsampling
        x = MaxPooling2D((3, 3), strides=2)(x)
        return x

    def fire_block(self, x, **metaparameters):
        ''' Construct a Fire Block
            x        : input to the block
            n_filters: number of filters in the squeeze layer
            bypass   : whether block has an identity shortcut

            Returns the concatenated expand branches, with the block input
            added on top when bypass is set.
        '''
        n_filters = metaparameters['n_filters']
        bypass    = metaparameters['bypass']

        # remember the input
        shortcut = x

        # squeeze layer
        squeeze = self.Conv2D(x, n_filters, (1, 1), strides=1, padding='same')
        squeeze = self.ReLU(squeeze)

        # branch the squeeze layer into a 1x1 and 3x3 convolution, each with
        # four times the number of squeeze filters
        expand1x1 = self.Conv2D(squeeze, n_filters * 4, (1, 1), strides=1, padding='same')
        expand1x1 = self.ReLU(expand1x1)
        expand3x3 = self.Conv2D(squeeze, n_filters * 4, (3, 3), strides=1, padding='same')
        expand3x3 = self.ReLU(expand3x3)

        # concatenate the feature maps from the 1x1 and 3x3 branches
        x = Concatenate()([expand1x1, expand3x3])

        # if identity link, add (matrix addition) input filters to output filters;
        # the block input must therefore already match the concatenated output shape
        if bypass:
            x = Add()([x, shortcut])

        return x

    def classifier(self, x, n_classes):
        ''' Construct the Classifier
            x        : input tensor
            n_classes: number of output classes

            Stores the intermediate tensors on the instance as
            self.encoding, self.probabilities and self.softmax, and returns
            the softmax output.
        '''
        # Save the encoding layer
        self.encoding = x

        # set the number of filters equal to number of classes
        x = self.Conv2D(x, n_classes, (1, 1), strides=1, padding='same')
        x = self.ReLU(x)

        # reduce each filter (class) to a single value
        x = GlobalAveragePooling2D()(x)

        # Save the pre-activation probabilities
        self.probabilities = x
        outputs = Activation('softmax')(x)
        # Save the post-activation probabilities
        self.softmax = outputs
        return outputs

# Example
# squeezenet = SqueezeNetBypass()

def example():
    ''' Build a reduced SqueezeNet Bypass model for 32x32x3 inputs and 10
        classes (CIFAR-10 sized), print its summary, then invoke the model's
        cifar10() routine (presumably trains on CIFAR-10 -- defined outside
        this file).
    '''
    # Pooled fire group: three blocks, bypass on the middle one
    pooled_group = [ { 'n_filters' : 16, 'bypass': False },
                     { 'n_filters' : 16, 'bypass': True },
                     { 'n_filters' : 32, 'bypass': False } ]

    # Closing entry: a single fire block with bypass
    closing_group = [ { 'n_filters' : 32, 'bypass': True } ]

    mini_groups = [ pooled_group, closing_group ]

    net = SqueezeNetBypass(mini_groups, input_shape=(32, 32, 3), n_classes=10)
    net.model.summary()
    net.cifar10()

# example()