EfficientNet.py

# -*- coding: utf-8 -*-
"""
Created on Wed Mar  3 00:05:30 2021

@author: Admin
"""


import torch
import torch.nn as nn
from math import ceil
from torchsummary import summary

base_model = [
    #Expand Ratio, channels, repeats, strides, kernel_size
    [1,16,1,1,3],
    [6,24,2,2,3],
    [6,40,2,2,5],
    [6,80,3,2,3],
    [6,112,3,1,5],
    [6,192,4,2,5],
    [6,320,1,1,3]
    ]

phi_values = {
    #(phi_value, resolution, drop_rate)
    'b0': (0,224,0.2),
    'b1': (0.5,240,0.2),
    'b2': (1,260,0.3),
    'b3': (2,300,0.4),
    'b4': (3,380,0.4),
    'b5': (4,456,0.4),
    'b6': (5,528,0.5),
    'b7': (6,600,0.5)
    }

class CNNBlock(nn.Module):
    def __init__(self,in_channels,out_channels,kernel_size, stride,padding, groups = 1):
        super(CNNBlock, self).__init__()
        self.cnn = nn.Conv2d(
            in_channels,
            out_channels,
            kernel_size,
            stride,
            padding,
            groups = groups  #If group = 1 => Normal Convolution but groups = in_channels => Depthwise Convolution
            )
        self.bn = nn.BatchNorm2d(out_channels)
        self.silu = nn.SiLU()
        
    def forward(self,x):
        return self.silu(self.bn(self.cnn(x)))


class SqueezeAndExcitation(nn.Module):
    
    def __init__(self, in_channels, reduce_dim):
        super(SqueezeAndExcitation, self).__init__()
        self.SE = nn.Sequential(
            nn.AdaptiveAvgPool2d(1),
            nn.Conv2d(in_channels, reduce_dim,1),
            nn.SiLU(),
            nn.Conv2d(reduce_dim,in_channels, 1),
            nn.Sigmoid()
            )
        
    def forward(self, x):
        
        return x * self.SE(x) #Each channels is multiplied with the value which comes out of Conv layers and tells us how much should we prioritize a particular channels 

class InvertedResBlock(nn.Module):
    
    def __init__(self, in_channels, out_channels, kernel_size,
                 stride, padding, expand_ratio, reduction = 4, survival_prob = 0.8):
        
        super(InvertedResBlock, self).__init__()
        self.survival_prob = survival_prob
        self.use_residual = in_channels == out_channels and stride == 1
        hidden_dim = in_channels * expand_ratio
        self.expand = in_channels != hidden_dim
        reduced_dim = int(in_channels / reduction)
        
        if self.expand:
            
            self.expand_conv = CNNBlock(
                in_channels, hidden_dim, kernel_size=3, stride = 1, padding = 1
                )
            
        self.conv = nn.Sequential(
            CNNBlock(hidden_dim, hidden_dim, kernel_size, stride, padding, groups = hidden_dim),
            SqueezeAndExcitation(hidden_dim, reduced_dim),
            nn.Conv2d(hidden_dim, out_channels, 1, bias = False),
            nn.BatchNorm2d(out_channels)
        )
        
    def stochastic_depth(self, x):
        if not self.training:
            return x
        binary_tensor = torch.rand(x.shape[0], 1,1,1, device = x.device) < self.survival_prob
        return torch.div(x, self.survival_prob) * binary_tensor
    
    def forward(self, inputs):
        x = self.expand_conv(inputs) if self.expand else inputs
        
        if self.use_residual:
            return self.stochastic_depth(self.conv(x)) + inputs
        else:
            return self.conv(x)
        
    
    
class EfficientNet(nn.Module):
    
    def __init__(self, version, num_classes):
        super(EfficientNet, self).__init__()
        
        width_factor, depth_factor, dropout_rate = self.calculate_factors(version)
        last_channels = ceil(1280 * width_factor)
        self.pool = nn.AdaptiveAvgPool2d(1)
        self.features = self.create_features(width_factor, depth_factor, last_channels)
        self.classifier = nn.Sequential(
            nn.Dropout(dropout_rate),
            nn.Linear(last_channels, num_classes)
            )
        
    def calculate_factors(self, version, alpha = 1.2, beta = 1.1):
        phi,res,drop_rate = phi_values[version]
        depth_factor = alpha ** phi
        width_factor = beta ** phi
        return width_factor, depth_factor, drop_rate
    
    def create_features(self, depth_factor, width_factor, last_channels):
        channels = int(32 * width_factor)
        features = [CNNBlock(3, channels, 3, stride = 2, padding=1)]
        in_channels = channels
        
        for expand_ratio, channels, repeats, stride, kernel_size in base_model:
            out_channels = 4 * ceil(int(channels * width_factor) / 4)
            layer_repeat = ceil(repeats * depth_factor)
            
            for layer in range(layer_repeat):
                
                features.append(
                    InvertedResBlock(
                        in_channels, 
                        out_channels,
                        expand_ratio = expand_ratio,
                        stride = stride if layer == 0 else 1,
                        kernel_size = kernel_size,
                        padding = kernel_size//2
                        )
                    )
                
                in_channels = out_channels

        features.append(
            CNNBlock(in_channels, last_channels, kernel_size=1, stride = 1, padding = 0)
            )            
        
        return nn.Sequential(*features)
    
    def forward(self, x):
        x = self.pool(self.features(x))
        return self.classifier(x.view(x.shape[0], -1))
    

def test():
    
    device = torch.device('cuda')
    version = 'b0'
    phi,res,drop_rate = phi_values[version]
    num_ex, num_classes = 4,10
    x = torch.randn((num_ex, 3, res, res)).to(device)
    model = EfficientNet(
        version = version,
        num_classes = num_classes,
        ).to(device)
    
    print(model(x).shape)
    print(summary(model.to(device), (3,res,res)))
    

test()