| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342 |
- # Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- import paddle
- from paddle import nn
- from paddle.utils.download import get_weights_path_from_url
- __all__ = []
- model_urls = {
- 'vgg16': (
- 'https://paddle-hapi.bj.bcebos.com/models/vgg16.pdparams',
- '89bbffc0f87d260be9b8cdc169c991c4',
- ),
- 'vgg19': (
- 'https://paddle-hapi.bj.bcebos.com/models/vgg19.pdparams',
- '23b18bb13d8894f60f54e642be79a0dd',
- ),
- }
- class VGG(nn.Layer):
- """VGG model from
- `"Very Deep Convolutional Networks For Large-Scale Image Recognition" <https://arxiv.org/pdf/1409.1556.pdf>`_.
- Args:
- features (nn.Layer): Vgg features create by function make_layers.
- num_classes (int, optional): Output dim of last fc layer. If num_classes <= 0, last fc layer
- will not be defined. Default: 1000.
- with_pool (bool, optional): Use pool before the last three fc layer or not. Default: True.
- Returns:
- :ref:`api_paddle_nn_Layer`. An instance of VGG model.
- Examples:
- .. code-block:: python
- >>> import paddle
- >>> from paddle.vision.models import VGG
- >>> from paddle.vision.models.vgg import make_layers
- >>> vgg11_cfg = [64, 'M', 128, 'M', 256, 256, 'M', 512, 512, 'M', 512, 512, 'M']
- >>> features = make_layers(vgg11_cfg)
- >>> vgg11 = VGG(features)
- >>> x = paddle.rand([1, 3, 224, 224])
- >>> out = vgg11(x)
- >>> print(out.shape)
- [1, 1000]
- """
- def __init__(self, features, num_classes=1000, with_pool=True):
- super().__init__()
- self.features = features
- self.num_classes = num_classes
- self.with_pool = with_pool
- if with_pool:
- self.avgpool = nn.AdaptiveAvgPool2D((7, 7))
- if num_classes > 0:
- self.classifier = nn.Sequential(
- nn.Linear(512 * 7 * 7, 4096),
- nn.ReLU(),
- nn.Dropout(),
- nn.Linear(4096, 4096),
- nn.ReLU(),
- nn.Dropout(),
- nn.Linear(4096, num_classes),
- )
- def forward(self, x):
- x = self.features(x)
- if self.with_pool:
- x = self.avgpool(x)
- if self.num_classes > 0:
- x = paddle.flatten(x, 1)
- x = self.classifier(x)
- return x
- def make_layers(cfg, batch_norm=False):
- layers = []
- in_channels = 3
- for v in cfg:
- if v == 'M':
- layers += [nn.MaxPool2D(kernel_size=2, stride=2)]
- else:
- conv2d = nn.Conv2D(in_channels, v, kernel_size=3, padding=1)
- if batch_norm:
- layers += [conv2d, nn.BatchNorm2D(v), nn.ReLU()]
- else:
- layers += [conv2d, nn.ReLU()]
- in_channels = v
- return nn.Sequential(*layers)
- cfgs = {
- 'A': [64, 'M', 128, 'M', 256, 256, 'M', 512, 512, 'M', 512, 512, 'M'],
- 'B': [
- 64,
- 64,
- 'M',
- 128,
- 128,
- 'M',
- 256,
- 256,
- 'M',
- 512,
- 512,
- 'M',
- 512,
- 512,
- 'M',
- ],
- 'D': [
- 64,
- 64,
- 'M',
- 128,
- 128,
- 'M',
- 256,
- 256,
- 256,
- 'M',
- 512,
- 512,
- 512,
- 'M',
- 512,
- 512,
- 512,
- 'M',
- ],
- 'E': [
- 64,
- 64,
- 'M',
- 128,
- 128,
- 'M',
- 256,
- 256,
- 256,
- 256,
- 'M',
- 512,
- 512,
- 512,
- 512,
- 'M',
- 512,
- 512,
- 512,
- 512,
- 'M',
- ],
- }
- def _vgg(arch, cfg, batch_norm, pretrained, **kwargs):
- model = VGG(make_layers(cfgs[cfg], batch_norm=batch_norm), **kwargs)
- if pretrained:
- assert (
- arch in model_urls
- ), f"{arch} model do not have a pretrained model now, you should set pretrained=False"
- weight_path = get_weights_path_from_url(
- model_urls[arch][0], model_urls[arch][1]
- )
- param = paddle.load(weight_path)
- model.load_dict(param)
- return model
- def vgg11(pretrained=False, batch_norm=False, **kwargs):
- """VGG 11-layer model from
- `"Very Deep Convolutional Networks For Large-Scale Image Recognition" <https://arxiv.org/pdf/1409.1556.pdf>`_.
- Args:
- pretrained (bool, optional): Whether to load pre-trained weights. If True, returns a model pre-trained
- on ImageNet. Default: False.
- batch_norm (bool, optional): If True, returns a model with batch_norm layer. Default: False.
- **kwargs (optional): Additional keyword arguments. For details, please refer to :ref:`VGG <api_paddle_vision_models_VGG>`.
- Returns:
- :ref:`api_paddle_nn_Layer`. An instance of VGG 11-layer model.
- Examples:
- .. code-block:: python
- >>> import paddle
- >>> from paddle.vision.models import vgg11
- >>> # build model
- >>> model = vgg11()
- >>> # build vgg11 model with batch_norm
- >>> model = vgg11(batch_norm=True)
- >>> x = paddle.rand([1, 3, 224, 224])
- >>> out = model(x)
- >>> print(out.shape)
- [1, 1000]
- """
- model_name = 'vgg11'
- if batch_norm:
- model_name += '_bn'
- return _vgg(model_name, 'A', batch_norm, pretrained, **kwargs)
- def vgg13(pretrained=False, batch_norm=False, **kwargs):
- """VGG 13-layer model from
- `"Very Deep Convolutional Networks For Large-Scale Image Recognition" <https://arxiv.org/pdf/1409.1556.pdf>`_.
- Args:
- pretrained (bool, optional): Whether to load pre-trained weights. If True, returns a model pre-trained
- on ImageNet. Default: False.
- batch_norm (bool): If True, returns a model with batch_norm layer. Default: False.
- **kwargs (optional): Additional keyword arguments. For details, please refer to :ref:`VGG <api_paddle_vision_models_VGG>`.
- Returns:
- :ref:`api_paddle_nn_Layer`. An instance of VGG 13-layer model.
- Examples:
- .. code-block:: python
- >>> import paddle
- >>> from paddle.vision.models import vgg13
- >>> # build model
- >>> model = vgg13()
- >>> # build vgg13 model with batch_norm
- >>> model = vgg13(batch_norm=True)
- >>> x = paddle.rand([1, 3, 224, 224])
- >>> out = model(x)
- >>> print(out.shape)
- [1, 1000]
- """
- model_name = 'vgg13'
- if batch_norm:
- model_name += '_bn'
- return _vgg(model_name, 'B', batch_norm, pretrained, **kwargs)
- def vgg16(pretrained=False, batch_norm=False, **kwargs):
- """VGG 16-layer model from
- `"Very Deep Convolutional Networks For Large-Scale Image Recognition" <https://arxiv.org/pdf/1409.1556.pdf>`_.
- Args:
- pretrained (bool, optional): Whether to load pre-trained weights. If True, returns a model pre-trained
- on ImageNet. Default: False.
- batch_norm (bool, optional): If True, returns a model with batch_norm layer. Default: False.
- **kwargs (optional): Additional keyword arguments. For details, please refer to :ref:`VGG <api_paddle_vision_models_VGG>`.
- Returns:
- :ref:`api_paddle_nn_Layer`. An instance of VGG 16-layer model.
- Examples:
- .. code-block:: python
- >>> import paddle
- >>> from paddle.vision.models import vgg16
- >>> # build model
- >>> model = vgg16()
- >>> # build vgg16 model with batch_norm
- >>> model = vgg16(batch_norm=True)
- >>> x = paddle.rand([1, 3, 224, 224])
- >>> out = model(x)
- >>> print(out.shape)
- [1, 1000]
- """
- model_name = 'vgg16'
- if batch_norm:
- model_name += '_bn'
- return _vgg(model_name, 'D', batch_norm, pretrained, **kwargs)
- def vgg19(pretrained=False, batch_norm=False, **kwargs):
- """VGG 19-layer model from
- `"Very Deep Convolutional Networks For Large-Scale Image Recognition" <https://arxiv.org/pdf/1409.1556.pdf>`_.
- Args:
- pretrained (bool, optional): Whether to load pre-trained weights. If True, returns a model pre-trained
- on ImageNet. Default: False.
- batch_norm (bool, optional): If True, returns a model with batch_norm layer. Default: False.
- **kwargs (optional): Additional keyword arguments. For details, please refer to :ref:`VGG <api_paddle_vision_models_VGG>`.
- Returns:
- :ref:`api_paddle_nn_Layer`. An instance of VGG 19-layer model.
- Examples:
- .. code-block:: python
- >>> import paddle
- >>> from paddle.vision.models import vgg19
- >>> # build model
- >>> model = vgg19()
- >>> # build vgg19 model with batch_norm
- >>> model = vgg19(batch_norm=True)
- >>> x = paddle.rand([1, 3, 224, 224])
- >>> out = model(x)
- >>> print(out.shape)
- [1, 1000]
- """
- model_name = 'vgg19'
- if batch_norm:
- model_name += '_bn'
- return _vgg(model_name, 'E', batch_norm, pretrained, **kwargs)
|