Source code for monai.networks.nets.torchvision_fc

# Copyright 2020 - 2021 MONAI Consortium
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#     http://www.apache.org/licenses/LICENSE-2.0
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

from typing import Any, Dict, Optional, Tuple, Union

from monai.networks.nets import NetAdapter
from monai.utils import deprecated, optional_import

models, _ = optional_import("torchvision.models")


__all__ = ["TorchVisionFCModel", "TorchVisionFullyConvModel"]


[docs]class TorchVisionFCModel(NetAdapter): """ Customize the fully connected layer of TorchVision model or replace it by convolutional layer. Args: model_name: name of any torchvision model with fully connected layer at the end. ``resnet18`` (default), ``resnet34m``, ``resnet50``, ``resnet101``, ``resnet152``, ``resnext50_32x4d``, ``resnext101_32x8d``, ``wide_resnet50_2``, ``wide_resnet101_2``. model details: https://pytorch.org/vision/stable/models.html. n_classes: number of classes for the last classification layer. Default to 1. dim: number of spatial dimensions, default to 2. in_channels: number of the input channels of last layer. if None, get it from `in_features` of last layer. use_conv: whether use convolutional layer to replace the last layer, default to False. pool: parameters for the pooling layer, it should be a tuple, the first item is name of the pooling layer, the second item is dictionary of the initialization args. if None, will not replace the `layers[-2]`. default to `("avg", {"kernel_size": 7, "stride": 1})`. bias: the bias value when replacing the last layer. if False, the layer will not learn an additive bias, default to True. pretrained: whether to use the imagenet pretrained weights. Default to False. """ def __init__( self, model_name: str = "resnet18", n_classes: int = 1, dim: int = 2, in_channels: Optional[int] = None, use_conv: bool = False, pool: Optional[Tuple[str, Dict[str, Any]]] = ("avg", {"kernel_size": 7, "stride": 1}), bias: bool = True, pretrained: bool = False, ): model = getattr(models, model_name)(pretrained=pretrained) # check if the model is compatible, should have a FC layer at the end if not str(list(model.children())[-1]).startswith("Linear"): raise ValueError(f"Model ['{model_name}'] does not have a Linear layer at the end.") super().__init__( model=model, n_classes=n_classes, dim=dim, in_channels=in_channels, use_conv=use_conv, pool=pool, bias=bias, )
[docs]@deprecated(since="0.6.0", removed="0.7.0", msg_suffix="Please consider using `TorchVisionFCModel` instead.") class TorchVisionFullyConvModel(TorchVisionFCModel): """ Customize TorchVision models to replace fully connected layer by convolutional layer. Args: model_name: name of any torchvision with adaptive avg pooling and fully connected layer at the end. ``resnet18`` (default), ``resnet34m``, ``resnet50``, ``resnet101``, ``resnet152``, ``resnext50_32x4d``, ``resnext101_32x8d``, ``wide_resnet50_2``, ``wide_resnet101_2``. n_classes: number of classes for the last classification layer. Default to 1. pool_size: the kernel size for `AvgPool2d` to replace `AdaptiveAvgPool2d`. Default to (7, 7). pool_stride: the stride for `AvgPool2d` to replace `AdaptiveAvgPool2d`. Default to 1. pretrained: whether to use the imagenet pretrained weights. Default to False. """ def __init__( self, model_name: str = "resnet18", n_classes: int = 1, pool_size: Union[int, Tuple[int, int]] = (7, 7), pool_stride: Union[int, Tuple[int, int]] = 1, pretrained: bool = False, ): super().__init__( model_name=model_name, n_classes=n_classes, use_conv=True, pool=("avg", {"kernel_size": pool_size, "stride": pool_stride}), pretrained=pretrained, )