# Source code for nupic.research.frameworks.pytorch.models.mobilenetv1

#  Numenta Platform for Intelligent Computing (NuPIC)
#  Copyright (C) 2019, Numenta, Inc.  Unless you have an agreement
#  with Numenta, Inc., for a separate license for this software code, the
#  following terms and conditions apply:
#  This program is free software: you can redistribute it and/or modify
#  it under the terms of the GNU Affero Public License version 3 as
#  published by the Free Software Foundation.
#  This program is distributed in the hope that it will be useful,
#  but WITHOUT ANY WARRANTY; without even the implied warranty of
#  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
#  See the GNU Affero Public License for more details.
#  You should have received a copy of the GNU Affero Public License
#  along with this program.  If not, see http://www.gnu.org/licenses.

import torch.nn as nn

from nupic.torch.modules import Flatten, KWinners2d

def separable_convolution2d(
    in_channels, out_channels, kernel_size=(3, 3), stride=1, width_mult=1.0
):
    """Build a depth wise separable 2D convolution block.

    This network block is used by MobileNet to factorize a standard
    convolution into a depth wise convolution and a 1x1 point wise
    convolution. The depth wise convolution applies a single filter for each
    input channel (``groups=in_channels``) and the point wise convolution
    applies a 1x1 convolution to combine the outputs of the depth wise
    convolution. Each convolution is followed by batch normalization and an
    in-place ReLU.

    :param in_channels: Input channels, before the width multiplier is applied
    :param out_channels: Output channels, before the width multiplier is
                         applied
    :param kernel_size: Depth wise kernel size, either an int or a
                        ``(height, width)`` pair; always 3x3 for mobilenet
    :param stride: Stride of the depth wise convolution
    :param width_mult: Width multiplier, used to thin the network. Scaled
                       channel counts are truncated with ``int()``
    :return: ``nn.Sequential`` holding six layers, in order: depth wise conv,
             batch norm, ReLU, point wise conv, batch norm, ReLU
    """
    # Apply width multiplier (alpha)
    in_channels = int(in_channels * width_mult)
    out_channels = int(out_channels * width_mult)

    # Derive the padding from the kernel size instead of hard-coding 1, so
    # that odd kernels other than 3x3 keep the spatial size at stride 1.
    # For the default 3x3 kernel this is still a padding of 1.
    if isinstance(kernel_size, int):
        padding = kernel_size // 2
    else:
        padding = tuple(k // 2 for k in kernel_size)

    return nn.Sequential(
        # Depth wise convolution
        nn.Conv2d(
            in_channels=in_channels,
            out_channels=in_channels,
            kernel_size=kernel_size,
            stride=stride,
            padding=padding,
            groups=in_channels,
            bias=False,
        ),
        nn.BatchNorm2d(in_channels),
        nn.ReLU(True),
        # Point wise convolution
        nn.Conv2d(
            in_channels=in_channels,
            out_channels=out_channels,
            kernel_size=(1, 1),
            stride=1,
            padding=0,
            groups=1,
            bias=False,
        ),
        nn.BatchNorm2d(out_channels),
        nn.ReLU(True),
    )
class MobileNetV1(nn.Module):
    """MobileNetV1 classifier assembled from depth wise separable convolutions.

    The network is a 3x3 convolution stem (``self.conv``), a stack of thirteen
    depth wise separable blocks (``self.deepwise``) and a classifier made of
    average pooling, flattening and one linear layer (``self.classifier``).
    """

    def __init__(self, num_classes=1001, width_mult=1.0):
        """Create the stem, the separable convolution stack and the classifier.

        :param num_classes: Number of output classes (10 for CIFAR10)
        :param width_mult: Width multiplier, used to thin the network
        """
        super().__init__()

        # num_classes == 10 is treated as CIFAR10: the stem does not
        # downsample and a smaller pooling window is used.
        # NOTE(review): presumably 32x32 CIFAR10 images versus 224x224
        # images otherwise -- confirm against the data loaders.
        is_cifar10 = num_classes == 10
        first_stride = 1 if is_cifar10 else 2
        avgpool_size = 2 if is_cifar10 else 7

        # First 3x3 convolution layer
        stem_channels = int(32 * width_mult)
        self.conv = nn.Sequential(
            nn.Conv2d(
                in_channels=3,
                out_channels=stem_channels,
                kernel_size=3,
                stride=first_stride,
                padding=1,
                bias=False,
            ),
            nn.BatchNorm2d(stem_channels),
            nn.ReLU(True),
        )

        # Depthwise separable convolution layers, one row per block:
        # (in_channels, out_channels, stride). Channel counts are the
        # unscaled values; the width multiplier is applied inside
        # separable_convolution2d.
        block_specs = (
            (32, 64, 1),
            (64, 128, 2),
            (128, 128, 1),
            (128, 256, 2),
            (256, 256, 1),
            (256, 512, 2),
            (512, 512, 1),
            (512, 512, 1),
            (512, 512, 1),
            (512, 512, 1),
            (512, 512, 1),
            (512, 1024, 2),
            (1024, 1024, 1),
        )
        separable_blocks = [
            separable_convolution2d(
                in_channels=n_in,
                out_channels=n_out,
                stride=block_stride,
                width_mult=width_mult,
            )
            for n_in, n_out, block_stride in block_specs
        ]
        self.deepwise = nn.Sequential(*separable_blocks)

        # Classifier
        self.classifier = nn.Sequential(
            nn.AvgPool2d(avgpool_size),
            Flatten(),
            nn.Linear(
                in_features=int(1024 * width_mult), out_features=num_classes
            ),
        )

    def forward(self, x):
        """Run ``x`` through the stem, the separable stack and the classifier.

        :param x: Input passed to the first convolution, which expects 3
                  input channels
        :return: Output of the final linear layer
        """
        stem_out = self.conv(x)
        features = self.deepwise(stem_out)
        return self.classifier(features)
def mobile_net_v1_sparse_depth(
    num_classes=1001,
    width_mult=1.0,
    percent_on=0.1,
    k_inference_factor=1.0,
    boost_strength=1.0,
    boost_strength_factor=1.0,
    duty_cycle_period=1000,
):
    """Create a MobileNetV1 network with sparse depth wise layers.

    The activation function that follows every depth wise (3x3) convolution
    is replaced from ReLU with k-winners. The point wise activations are left
    untouched.

    :param num_classes: Number of output classes (10 for CIFAR10)
    :type num_classes: int
    :param width_mult: Width multiplier, used to thin the network
    :type width_mult: float
    :param percent_on: The activity of the top k = percent_on * number of
                       input units will be allowed to remain, the rest are
                       set to zero.
    :type percent_on: float
    :param k_inference_factor: During inference (training=False) we increase
                               percent_on by this factor.
                               percent_on * k_inference_factor must be
                               strictly less than 1.0, ideally much lower
                               than 1.0
    :type k_inference_factor: float
    :param boost_strength: boost strength (0.0 implies no boosting).
    :type boost_strength: float
    :param boost_strength_factor: Boost strength factor to use [0..1]
    :type boost_strength_factor: float
    :param duty_cycle_period: The period used to calculate duty cycles
    :type duty_cycle_period: int
    :return: Depth wise sparse MobileNetV1 model
    """
    # Settings shared by every k-winners layer inserted below
    kwinners_args = dict(
        percent_on=percent_on,
        k_inference_factor=k_inference_factor,
        boost_strength=boost_strength,
        boost_strength_factor=boost_strength_factor,
        duty_cycle_period=duty_cycle_period,
    )

    model = MobileNetV1(num_classes=num_classes, width_mult=width_mult)

    # In each separable block, index 1 is the BatchNorm2d that follows the
    # depth wise convolution and index 2 is the ReLU being replaced.
    for separable_block in model.deepwise:
        depthwise_norm = separable_block[1]
        separable_block[2] = KWinners2d(
            depthwise_norm.num_features, **kwinners_args
        )

    return model
def mobile_net_v1_sparse_point(
    num_classes=1001,
    width_mult=1.0,
    percent_on=0.1,
    k_inference_factor=1.0,
    boost_strength=1.0,
    boost_strength_factor=1.0,
    duty_cycle_period=1000,
):
    """Create a MobileNetV1 network with sparse point wise layers.

    The activation function that follows every point wise (1x1) convolution
    is replaced from ReLU with k-winners. The depth wise activations are left
    untouched.

    :param num_classes: Number of output classes (10 for CIFAR10)
    :type num_classes: int
    :param width_mult: Width multiplier, used to thin the network
    :type width_mult: float
    :param percent_on: The activity of the top k = percent_on * number of
                       input units will be allowed to remain, the rest are
                       set to zero.
    :type percent_on: float
    :param k_inference_factor: During inference (training=False) we increase
                               percent_on by this factor.
                               percent_on * k_inference_factor must be
                               strictly less than 1.0, ideally much lower
                               than 1.0
    :type k_inference_factor: float
    :param boost_strength: boost strength (0.0 implies no boosting).
    :type boost_strength: float
    :param boost_strength_factor: Boost strength factor to use [0..1]
    :type boost_strength_factor: float
    :param duty_cycle_period: The period used to calculate duty cycles
    :type duty_cycle_period: int
    :return: Point wise sparse MobileNetV1 model
    """
    # Settings shared by every k-winners layer inserted below
    kwinners_args = dict(
        percent_on=percent_on,
        k_inference_factor=k_inference_factor,
        boost_strength=boost_strength,
        boost_strength_factor=boost_strength_factor,
        duty_cycle_period=duty_cycle_period,
    )

    model = MobileNetV1(num_classes=num_classes, width_mult=width_mult)

    # In each separable block, index 4 is the BatchNorm2d that follows the
    # point wise convolution and index 5 is the ReLU being replaced.
    for separable_block in model.deepwise:
        pointwise_norm = separable_block[4]
        separable_block[5] = KWinners2d(
            pointwise_norm.num_features, **kwinners_args
        )

    return model