Add CaffeResnet101

Cadene · Cadene · commit 68f6f50840fc · 2018-03-22T18:28:58.000+01:00
diff --git a/README.md b/README.md
@@ -6,6 +6,7 @@ The goal of this repo is:
 - to access pretrained ConvNets with a unique interface/API inspired by torchvision.
 
 News:
+- 22/03/2018: CaffeResNet101 (good for localization with FasterRCNN)
 - 21/03/2018: NASNet Mobile thanks to [Veronika Yurchuk](https://github.com/veronikayurchuk) and [Anastasiia](https://github.com/DagnyT)
 - 25/01/2018: DualPathNetworks thanks to [Ross Wightman](https://github.com/rwightman/pytorch-dpn-pretrained), Xception thanks to [T Standley](https://github.com/tstandley/Xception-PyTorch), improved TransformImage API
 - 13/01/2018: `pip install pretrainedmodels`, `pretrainedmodels.model_names`, `pretrainedmodels.pretrained_settings`
@@ -32,6 +33,7 @@ News:
     - [Available models](https://github.com/Cadene/pretrained-models.pytorch#available-models)
         - [AlexNet](https://github.com/Cadene/pretrained-models.pytorch#torchvision)
         - [BNInception](https://github.com/Cadene/pretrained-models.pytorch#bninception)
+        - [CaffeResNet101](https://github.com/Cadene/pretrained-models.pytorch#caffe-resnet)
         - [DenseNet121](https://github.com/Cadene/pretrained-models.pytorch#torchvision)
         - [DenseNet161](https://github.com/Cadene/pretrained-models.pytorch#torchvision)
         - [DenseNet169](https://github.com/Cadene/pretrained-models.pytorch#torchvision)
@@ -42,6 +44,7 @@ News:
         - [DualPathNet98](https://github.com/Cadene/pretrained-models.pytorch#dualpathnetworks)
         - [DualPathNet107](https://github.com/Cadene/pretrained-models.pytorch#dualpathnetworks)
         - [DualPathNet113](https://github.com/Cadene/pretrained-models.pytorch#dualpathnetworks)
+        - [FBResNet152](https://github.com/Cadene/pretrained-models.pytorch#facebook-resnet)
         - [InceptionResNetV2](https://github.com/Cadene/pretrained-models.pytorch#inception)
         - [InceptionV3](https://github.com/Cadene/pretrained-models.pytorch#inception)
         - [InceptionV4](https://github.com/Cadene/pretrained-models.pytorch#inception)
@@ -107,7 +110,7 @@ import pretrainedmodels
 
 ```python
 print(pretrainedmodels.model_names)
-> ['fbresnet152', 'bninception', 'resnext101_32x4d', 'resnext101_64x4d', 'inceptionv4', 'inceptionresnetv2', 'alexnet', 'densenet121', 'densenet169', 'densenet201', 'densenet161', 'resnet18', 'resnet34', 'resnet50', 'resnet101', 'resnet152', 'inceptionv3', 'squeezenet1_0', 'squeezenet1_1', 'vgg11', 'vgg11_bn', 'vgg13', 'vgg13_bn', 'vgg16', 'vgg16_bn', 'vgg19_bn', 'vgg19', 'nasnetalarge', 'nasnetamobile']
+> ['fbresnet152', 'bninception', 'resnext101_32x4d', 'resnext101_64x4d', 'inceptionv4', 'inceptionresnetv2', 'alexnet', 'densenet121', 'densenet169', 'densenet201', 'densenet161', 'resnet18', 'resnet34', 'resnet50', 'resnet101', 'resnet152', 'inceptionv3', 'squeezenet1_0', 'squeezenet1_1', 'vgg11', 'vgg11_bn', 'vgg13', 'vgg13_bn', 'vgg16', 'vgg16_bn', 'vgg19_bn', 'vgg19', 'nasnetalarge', 'nasnetamobile', 'cafferesnet101']
 ```
 
 - To print the available pretrained settings for a chosen model:
@@ -215,6 +218,8 @@ FBResNet152 | [Torch7](https://github.com/facebook/fb.resnet.torch) | 77.84 | 93
 [InceptionV3](https://github.com/Cadene/pretrained-models.pytorch#inception) | [Pytorch](https://github.com/pytorch/vision#models) | 77.294 | 93.454
 [DenseNet201](https://github.com/Cadene/pretrained-models.pytorch#torchvision) | [Pytorch](https://github.com/pytorch/vision#models) | 77.152 | 93.548
 [DualPathNet68b_5k](https://github.com/Cadene/pretrained-models.pytorch#dualpathnetworks) | Our porting | 77.034 | 93.590
+[CaffeResNet101](https://github.com/Cadene/pretrained-models.pytorch#caffe-resnet) | [Caffe](https://github.com/KaimingHe/deep-residual-networks) | 76.400 | 92.900
+[CaffeResNet101](https://github.com/Cadene/pretrained-models.pytorch#caffe-resnet) | Our porting | 76.200 | 92.766
 [DenseNet169](https://github.com/Cadene/pretrained-models.pytorch#torchvision) | [Pytorch](https://github.com/pytorch/vision#models) | 76.026 | 92.992
 [ResNet50](https://github.com/Cadene/pretrained-models.pytorch#torchvision) | [Pytorch](https://github.com/pytorch/vision#models) | 76.002 | 92.980
 [DualPathNet68](https://github.com/Cadene/pretrained-models.pytorch#dualpathnetworks) | Our porting | 75.868 | 92.774
@@ -265,6 +270,13 @@ There are a bit different from the ResNet* of torchvision. ResNet152 is currentl
 
 - `fbresnet152(num_classes=1000, pretrained='imagenet')`
 
+#### Caffe ResNet*
+
+Source: [Caffe repo of KaimingHe](https://github.com/KaimingHe/deep-residual-networks)
+
+- `cafferesnet101(num_classes=1000, pretrained='imagenet')`
+
+
 #### Inception*
 
 Source: [TensorFlow Slim repo](https://github.com/tensorflow/models/tree/master/slim) and [Pytorch/Vision repo](https://github.com/pytorch/vision/tree/master/torchvision) for `inceptionv3`
diff --git a/pretrainedmodels/__init__.py b/pretrainedmodels/__init__.py
@@ -8,6 +8,7 @@
 # to support pretrainedmodels.__dict__['nasnetalarge']
 # but deprecated
 from .models.fbresnet import fbresnet152
+from .models.cafferesnet import cafferesnet101
 from .models.bninception import bninception
 from .models.resnext import resnext101_32x4d
 from .models.resnext import resnext101_64x4d
diff --git a/pretrainedmodels/models/__init__.py b/pretrainedmodels/models/__init__.py
@@ -1,5 +1,7 @@
 from .fbresnet import fbresnet152
 
+from .cafferesnet import cafferesnet101
+
 from .bninception import bninception
 
 from .resnext import resnext101_32x4d
diff --git a/pretrainedmodels/models/cafferesnet.py b/pretrainedmodels/models/cafferesnet.py
@@ -0,0 +1,177 @@
+import math
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+import torch.utils.model_zoo as model_zoo
+
+# Pretrained-weight settings, keyed first by model name and then by the name
+# of the pretraining dataset. cafferesnet101() downloads the checkpoint from
+# 'url', checks the requested class count against 'num_classes', and copies
+# 'input_space', 'input_size', 'input_range', 'mean' and 'std' onto the model
+# as plain attributes.
+# NOTE(review): 'mean' presumably lists per-channel values in the 'BGR' order
+# given by 'input_space', on the 0-255 scale of 'input_range' -- confirm
+# against the preprocessing code that consumes these attributes.
+pretrained_settings = {
+    'cafferesnet101': {
+        'imagenet': {
+            'url': 'http://data.lip6.fr/cadene/pretrainedmodels/cafferesnet101-9cf32c75.pth',
+            'input_space': 'BGR',
+            'input_size': [3, 224, 224],
+            'input_range': [0, 255],
+            'mean': [102.9801, 115.9465, 122.7717],
+            'std': [1, 1, 1],
+            'num_classes': 1000
+        }
+    }
+}
+
+
+def conv3x3(in_planes, out_planes, stride=1):
+  """Return a 3x3 nn.Conv2d with padding 1 and no bias term.
+
+  Args:
+    in_planes: number of input channels.
+    out_planes: number of output channels.
+    stride: stride of the convolution (default 1).
+  """
+  return nn.Conv2d(in_planes, out_planes, kernel_size=3, stride=stride,
+           padding=1, bias=False)
+
+
+class BasicBlock(nn.Module):
+  """Residual block made of two 3x3 convolutions, each followed by BatchNorm.
+
+  The block input (optionally passed through `downsample`) is added to the
+  output of the second BatchNorm before the final ReLU.
+  The cafferesnet101() constructor in this file builds its network from
+  Bottleneck, not from this class.
+  """
+  # Output channels of the block are `planes * expansion`; ResNet reads this
+  # class attribute when sizing its layers and its final linear layer.
+  expansion = 1
+
+  def __init__(self, inplanes, planes, stride=1, downsample=None):
+    """Build the block.
+
+    Args:
+      inplanes: number of channels of the block input.
+      planes: number of channels produced by both convolutions.
+      stride: stride of the first convolution (the second always uses 1).
+      downsample: optional module applied to the input to produce the
+        residual; None means the input is added unchanged.
+    """
+    super(BasicBlock, self).__init__()
+    self.conv1 = conv3x3(inplanes, planes, stride)
+    self.bn1 = nn.BatchNorm2d(planes)
+    # A single in-place ReLU module is reused at both activation points.
+    self.relu = nn.ReLU(inplace=True)
+    self.conv2 = conv3x3(planes, planes)
+    self.bn2 = nn.BatchNorm2d(planes)
+    self.downsample = downsample
+    # Stored for reference only; forward() does not read it.
+    self.stride = stride
+
+  def forward(self, x):
+    """Return relu(bn2(conv2(relu(bn1(conv1(x))))) + residual)."""
+    residual = x
+
+    out = self.conv1(x)
+    out = self.bn1(out)
+    out = self.relu(out)
+
+    out = self.conv2(out)
+    out = self.bn2(out)
+
+    # Replace the identity shortcut when a downsample module was supplied.
+    if self.downsample is not None:
+      residual = self.downsample(x)
+
+    out += residual
+    out = self.relu(out)
+
+    return out
+
+
+class Bottleneck(nn.Module):
+  """Residual block: 1x1 conv -> 3x3 conv -> 1x1 conv, each followed by BatchNorm.
+
+  The last 1x1 convolution widens the output to `planes * 4` channels. The
+  block input (optionally passed through `downsample`) is added to the output
+  of the third BatchNorm before the final ReLU.
+  """
+  # Output channels of the block are `planes * expansion`; this matches the
+  # literal `planes * 4` used for conv3 / bn3 below.
+  expansion = 4
+
+  def __init__(self, inplanes, planes, stride=1, downsample=None):
+    """Build the block.
+
+    Args:
+      inplanes: number of channels of the block input.
+      planes: number of channels inside the block; the output has
+        `planes * 4` channels.
+      stride: stride of the first (1x1) convolution.
+      downsample: optional module applied to the input to produce the
+        residual; None means the input is added unchanged.
+    """
+    super(Bottleneck, self).__init__()
+    # The stride is applied by the first 1x1 convolution, and the 3x3
+    # convolution always uses stride 1.
+    # NOTE(review): the "# change" markers presumably flag differences from
+    # the torchvision ResNet implementation -- confirm.
+    self.conv1 = nn.Conv2d(inplanes, planes, kernel_size=1, stride=stride, bias=False) # change
+    self.bn1 = nn.BatchNorm2d(planes)
+    self.conv2 = nn.Conv2d(planes, planes, kernel_size=3, stride=1, # change
+                 padding=1, bias=False)
+    self.bn2 = nn.BatchNorm2d(planes)
+    self.conv3 = nn.Conv2d(planes, planes * 4, kernel_size=1, bias=False)
+    self.bn3 = nn.BatchNorm2d(planes * 4)
+    # A single in-place ReLU module is reused at all three activation points.
+    self.relu = nn.ReLU(inplace=True)
+    self.downsample = downsample
+    # Stored for reference only; forward() does not read it.
+    self.stride = stride
+
+  def forward(self, x):
+    """Run the three conv/BatchNorm stages and add the residual before the last ReLU."""
+    residual = x
+
+    out = self.conv1(x)
+    out = self.bn1(out)
+    out = self.relu(out)
+
+    out = self.conv2(out)
+    out = self.bn2(out)
+    out = self.relu(out)
+
+    out = self.conv3(out)
+    out = self.bn3(out)
+
+    # Replace the identity shortcut when a downsample module was supplied.
+    if self.downsample is not None:
+      residual = self.downsample(x)
+
+    out += residual
+    out = self.relu(out)
+
+    return out
+
+
+class ResNet(nn.Module):
+  """ResNet classifier: conv/BatchNorm/ReLU/max-pool stem, four residual
+  stages, average pooling and a final linear layer.
+  """
+
+  def __init__(self, block, layers, num_classes=1000):
+    """Build the network.
+
+    Args:
+      block: residual block class (BasicBlock or Bottleneck); its
+        `expansion` attribute sets the channel multiplier of each stage.
+      layers: sequence of four ints, the number of blocks in layer1..layer4.
+      num_classes: output size of the final linear layer.
+    """
+    # Running channel count of the tensor entering the next stage; read and
+    # updated by _make_layer.
+    self.inplanes = 64
+    super(ResNet, self).__init__()
+    self.conv1 = nn.Conv2d(3, 64, kernel_size=7, stride=2, padding=3,
+                 bias=False)
+    self.bn1 = nn.BatchNorm2d(64)
+    self.relu = nn.ReLU(inplace=True)
+    # Max pooling uses no padding and ceil_mode=True for the output size.
+    # NOTE(review): the "# change" marker presumably flags a difference from
+    # the torchvision ResNet implementation -- confirm.
+    self.maxpool = nn.MaxPool2d(kernel_size=3, stride=2, padding=0, ceil_mode=True) # change
+    self.layer1 = self._make_layer(block, 64, layers[0])
+    self.layer2 = self._make_layer(block, 128, layers[1], stride=2)
+    self.layer3 = self._make_layer(block, 256, layers[2], stride=2)
+    self.layer4 = self._make_layer(block, 512, layers[3], stride=2)
+    # Original author's note: building layer4 with stride=1 instead gives
+    # slightly better results but is slower. The alternative is kept below.
+    # self.layer4 = self._make_layer(block, 512, layers[3], stride=1)
+    # Fixed 7x7 average-pooling window.
+    # NOTE(review): presumably sized for the 224x224 input listed in
+    # pretrained_settings -- confirm before feeding other resolutions.
+    self.avgpool = nn.AvgPool2d(7)
+    self.fc = nn.Linear(512 * block.expansion, num_classes)
+
+    # Weight initialisation: every Conv2d weight is drawn from a zero-mean
+    # normal with std sqrt(2 / n), n = kernel_h * kernel_w * out_channels;
+    # every BatchNorm2d starts with weight 1 and bias 0.
+    for m in self.modules():
+      if isinstance(m, nn.Conv2d):
+        n = m.kernel_size[0] * m.kernel_size[1] * m.out_channels
+        m.weight.data.normal_(0, math.sqrt(2. / n))
+      elif isinstance(m, nn.BatchNorm2d):
+        m.weight.data.fill_(1)
+        m.bias.data.zero_()
+
+  def _make_layer(self, block, planes, blocks, stride=1):
+    """Build one stage of `blocks` residual blocks as an nn.Sequential.
+
+    Only the first block receives `stride` and the downsample module; the
+    remaining blocks use the block defaults. Updates self.inplanes to
+    `planes * block.expansion`.
+
+    Args:
+      block: residual block class.
+      planes: base channel count passed to each block.
+      blocks: number of blocks in the stage.
+      stride: stride passed to the first block.
+    """
+    downsample = None
+    # When the first block changes the spatial stride or the channel count,
+    # its residual goes through a 1x1 conv + BatchNorm so that shapes match.
+    if stride != 1 or self.inplanes != planes * block.expansion:
+      downsample = nn.Sequential(
+        nn.Conv2d(self.inplanes, planes * block.expansion,
+              kernel_size=1, stride=stride, bias=False),
+        nn.BatchNorm2d(planes * block.expansion),
+      )
+
+    layers = []
+    layers.append(block(self.inplanes, planes, stride, downsample))
+    self.inplanes = planes * block.expansion
+    for i in range(1, blocks):
+      layers.append(block(self.inplanes, planes))
+
+    return nn.Sequential(*layers)
+
+  def forward(self, x):
+    """Return the output of the final linear layer for input batch `x`."""
+    # Stem.
+    x = self.conv1(x)
+    x = self.bn1(x)
+    x = self.relu(x)
+    x = self.maxpool(x)
+
+    # Residual stages.
+    x = self.layer1(x)
+    x = self.layer2(x)
+    x = self.layer3(x)
+    x = self.layer4(x)
+
+    # Pool, flatten everything after the batch dimension, then classify.
+    x = self.avgpool(x)
+    x = x.view(x.size(0), -1)
+    x = self.fc(x)
+
+    return x
+
+
+def cafferesnet101(num_classes=1000, pretrained='imagenet'):
+    """Construct a ResNet-101 model (Bottleneck blocks, stages of 3/4/23/3).
+
+    Args:
+        num_classes: output size of the final linear layer.
+        pretrained: key into pretrained_settings['cafferesnet101'] (for
+            example 'imagenet') selecting the weights to download and load,
+            or None to return the model with its freshly initialised
+            weights. This is a string key or None, not a bool.
+
+    Returns:
+        The ResNet instance. When `pretrained` is not None, the model also
+        carries `input_space`, `input_size`, `input_range`, `mean` and `std`
+        attributes copied from the selected settings.
+
+    Raises:
+        KeyError: if `pretrained` is not a key of the settings dict.
+        AssertionError: if `num_classes` differs from the settings'
+            'num_classes' (the check is an `assert` statement).
+    """
+    model = ResNet(Bottleneck, [3, 4, 23, 3], num_classes=num_classes)
+    if pretrained is not None:
+        settings = pretrained_settings['cafferesnet101'][pretrained]
+        # The checkpoint's final layer has a fixed size, so a different class
+        # count is rejected before the weights are loaded.
+        assert num_classes == settings['num_classes'], \
+            "num_classes should be {}, but is {}".format(settings['num_classes'], num_classes)
+        model.load_state_dict(model_zoo.load_url(settings['url']))
+        # Expose the preprocessing settings on the model as plain attributes.
+        model.input_space = settings['input_space']
+        model.input_size = settings['input_size']
+        model.input_range = settings['input_range']
+        model.mean = settings['mean']
+        model.std = settings['std']
+    return model
diff --git a/pretrainedmodels/version.py b/pretrainedmodels/version.py
@@ -1 +1 @@
-__version__ = '0.3.0'
+__version__ = '0.4.0'

Original file line number	Diff line number	Diff line change
`@@ -1 +1 @@`
`1`		`-__version__ = '0.3.0'`
	`1`	`+__version__ = '0.4.0'`