import torch
import torch.nn as nn
import numpy as np

from .blocks import BottleNeck, Classifier, ConvBlock

__all__ = ["MobileNetV2", "MobileNetV2_10", "MobileNetV2_075", "MobileNetV2_05"]


class MobileNetV2(nn.Module):
    """MobileNetV2 classifier with a configurable width multiplier (``alpha``)."""

    def __init__(
        self,
        image_channels: int,
        num_classes: int,
        alpha: float = 1.0,
        dropout_rate: float = 0.5,
    ) -> None:
        super().__init__()
        self.alpha = alpha
        # Feature extractor following the MobileNetV2 layout: an initial strided
        # 3x3 conv, a stack of inverted-residual bottlenecks, a final 1x1 conv,
        # and global average pooling. All channel widths are scaled by alpha.
        self.feature_extractor = nn.Sequential(
            ConvBlock(
                in_channels=image_channels,
                out_channels=self._multiply_width(32),
                kernel_size=3,
                stride=2,
                padding=1,
                act="ReLU6",
            ),
            BottleNeck(
                dim=[self._multiply_width(32), self._multiply_width(16)],
                factor=1,
                iterate=1,
                stride=1,
            ),
            BottleNeck(
                dim=[self._multiply_width(16), self._multiply_width(24)],
                factor=6,
                iterate=2,
                stride=2,
            ),
            BottleNeck(
                dim=[self._multiply_width(24), self._multiply_width(32)],
                factor=6,
                iterate=3,
                stride=2,
            ),
            BottleNeck(
                dim=[self._multiply_width(32), self._multiply_width(64)],
                factor=6,
                iterate=4,
                stride=2,
            ),
            BottleNeck(
                dim=[self._multiply_width(64), self._multiply_width(96)],
                factor=6,
                iterate=3,
                stride=1,
            ),
            BottleNeck(
                dim=[self._multiply_width(96), self._multiply_width(160)],
                factor=6,
                iterate=3,
                stride=2,
            ),
            BottleNeck(
                dim=[self._multiply_width(160), self._multiply_width(320)],
                factor=6,
                iterate=1,
                stride=1,
            ),
            ConvBlock(
                in_channels=self._multiply_width(320),
                out_channels=self._multiply_width(1280),
                kernel_size=1,
                act="ReLU6",
            ),
            nn.AdaptiveAvgPool2d(1),
        )
        self.classifier = Classifier(
            in_features=self._multiply_width(1280),
            out_features=num_classes,
            dropout_rate=dropout_rate,
        )

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        x = self.feature_extractor(x)
        x = torch.flatten(x, 1)
        logits = self.classifier(x)
        return logits

    def _multiply_width(self, dim: int) -> int:
        # Scale a channel count by the width multiplier, rounding up.
        return int(np.ceil(self.alpha * dim))


def MobileNetV2_10(
    image_channels: int, num_classes: int, dropout_rate: float = 0.5
) -> MobileNetV2:
    return MobileNetV2(image_channels, num_classes, 1.0, dropout_rate)


def MobileNetV2_075(
    image_channels: int, num_classes: int, dropout_rate: float = 0.5
) -> MobileNetV2:
    return MobileNetV2(image_channels, num_classes, 0.75, dropout_rate)


def MobileNetV2_05(
    image_channels: int, num_classes: int, dropout_rate: float = 0.5
) -> MobileNetV2:
    return MobileNetV2(image_channels, num_classes, 0.5, dropout_rate)
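

# A minimal smoke-test sketch, not part of the original module: it assumes the
# ConvBlock/BottleNeck/Classifier blocks imported from .blocks accept the
# arguments used above, and simply checks that a forward pass on a dummy batch
# yields logits of shape (batch, num_classes). Input size 224x224 is the usual
# MobileNetV2 resolution but is only an assumption here.
if __name__ == "__main__":
    model = MobileNetV2_10(image_channels=3, num_classes=10)
    dummy = torch.randn(2, 3, 224, 224)  # batch of two 224x224 RGB images
    logits = model(dummy)
    print(logits.shape)  # expected: torch.Size([2, 10])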