cspdarknet.py

import torch
import torch.nn as nn

try:
    from .modules import BasicConv, CSPBlock
except ImportError:
    from modules import BasicConv, CSPBlock
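
# NOTE: BasicConv and CSPBlock live in the sibling `modules.py` and are not
# shown here. As an assumption for this listing, the code below only relies on
# the following behavior from them:
#   - BasicConv(in_dim, out_dim, kernel_size, padding, stride,
#               act_type, norm_type, depthwise)
#     roughly Conv2d -> norm layer (e.g. BatchNorm2d for 'BN') -> activation
#     (e.g. SiLU for 'silu'), optionally built as a depthwise-separable conv.
#   - CSPBlock(in_dim, out_dim, num_blocks, expand_ratio, shortcut,
#              act_type, norm_type, depthwise)
#     a CSP stage: the input is split into two branches, one branch runs
#     through `num_blocks` bottleneck blocks (residual if `shortcut=True`),
#     and the branches are concatenated and fused back to `out_dim` channels.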

# ---------------------------- CSPDarkNet ----------------------------
class CSPDarkNet(nn.Module):
    def __init__(self, img_dim=3, width=1.0, depth=1.0, act_type='silu',
                 norm_type='BN', depthwise=False, num_classes=1000):
        super(CSPDarkNet, self).__init__()
        # ---------------- Basic parameters ----------------
        self.width_factor = width
        self.depth_factor = depth
        self.feat_dims = [round(64 * width),
                          round(128 * width),
                          round(256 * width),
                          round(512 * width),
                          round(1024 * width)]

        # ---------------- Model parameters ----------------
        ## P1/2
        self.layer_1 = BasicConv(img_dim, self.feat_dims[0],
                                 kernel_size=6, padding=2, stride=2,
                                 act_type=act_type, norm_type=norm_type, depthwise=depthwise)
        ## P2/4
        self.layer_2 = nn.Sequential(
            BasicConv(self.feat_dims[0], self.feat_dims[1],
                      kernel_size=3, padding=1, stride=2,
                      act_type=act_type, norm_type=norm_type, depthwise=depthwise),
            CSPBlock(self.feat_dims[1],
                     self.feat_dims[1],
                     num_blocks=round(3 * depth),
                     expand_ratio=0.5,
                     shortcut=True,
                     act_type=act_type,
                     norm_type=norm_type,
                     depthwise=depthwise)
        )
        ## P3/8
        self.layer_3 = nn.Sequential(
            BasicConv(self.feat_dims[1], self.feat_dims[2],
                      kernel_size=3, padding=1, stride=2,
                      act_type=act_type, norm_type=norm_type, depthwise=depthwise),
            CSPBlock(self.feat_dims[2],
                     self.feat_dims[2],
                     num_blocks=round(9 * depth),
                     expand_ratio=0.5,
                     shortcut=True,
                     act_type=act_type,
                     norm_type=norm_type,
                     depthwise=depthwise)
        )
        ## P4/16
        self.layer_4 = nn.Sequential(
            BasicConv(self.feat_dims[2], self.feat_dims[3],
                      kernel_size=3, padding=1, stride=2,
                      act_type=act_type, norm_type=norm_type, depthwise=depthwise),
            CSPBlock(self.feat_dims[3],
                     self.feat_dims[3],
                     num_blocks=round(9 * depth),
                     expand_ratio=0.5,
                     shortcut=True,
                     act_type=act_type,
                     norm_type=norm_type,
                     depthwise=depthwise)
        )
        ## P5/32
        self.layer_5 = nn.Sequential(
            BasicConv(self.feat_dims[3], self.feat_dims[4],
                      kernel_size=3, padding=1, stride=2,
                      act_type=act_type, norm_type=norm_type, depthwise=depthwise),
            CSPBlock(self.feat_dims[4],
                     self.feat_dims[4],
                     num_blocks=round(3 * depth),
                     expand_ratio=0.5,
                     shortcut=True,
                     act_type=act_type,
                     norm_type=norm_type,
                     depthwise=depthwise)
        )

        ## Classification head
        self.avgpool = nn.AdaptiveAvgPool2d((1, 1))
        self.fc = nn.Linear(self.feat_dims[4], num_classes)

    def forward(self, x):
        c1 = self.layer_1(x)   # P1/2
        c2 = self.layer_2(c1)  # P2/4
        c3 = self.layer_3(c2)  # P3/8
        c4 = self.layer_4(c3)  # P4/16
        c5 = self.layer_5(c4)  # P5/32
        c5 = self.avgpool(c5)
        c5 = torch.flatten(c5, 1)
        c5 = self.fc(c5)

        return c5

# ---------------------------- Model Functions ----------------------------
## build CSPDarkNet
def cspdarknet_n(img_dim=3, num_classes=1000) -> CSPDarkNet:
    return CSPDarkNet(img_dim=img_dim,
                      width=0.25,
                      depth=0.34,
                      act_type='silu',
                      norm_type='BN',
                      depthwise=False,
                      num_classes=num_classes)

def cspdarknet_s(img_dim=3, num_classes=1000) -> CSPDarkNet:
    return CSPDarkNet(img_dim=img_dim,
                      width=0.50,
                      depth=0.34,
                      act_type='silu',
                      norm_type='BN',
                      depthwise=False,
                      num_classes=num_classes)

def cspdarknet_m(img_dim=3, num_classes=1000) -> CSPDarkNet:
    return CSPDarkNet(img_dim=img_dim,
                      width=0.75,
                      depth=0.67,
                      act_type='silu',
                      norm_type='BN',
                      depthwise=False,
                      num_classes=num_classes)

def cspdarknet_l(img_dim=3, num_classes=1000) -> CSPDarkNet:
    return CSPDarkNet(img_dim=img_dim,
                      width=1.0,
                      depth=1.0,
                      act_type='silu',
                      norm_type='BN',
                      depthwise=False,
                      num_classes=num_classes)

def cspdarknet_x(img_dim=3, num_classes=1000) -> CSPDarkNet:
    return CSPDarkNet(img_dim=img_dim,
                      width=1.25,
                      depth=1.34,
                      act_type='silu',
                      norm_type='BN',
                      depthwise=False,
                      num_classes=num_classes)
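
# A small convenience mapping from model name to builder (an illustrative
# addition, not part of the original interface); handy for config-driven code,
# e.g. cspdarknet_builders['cspdarknet_s']().
cspdarknet_builders = {
    'cspdarknet_n': cspdarknet_n,
    'cspdarknet_s': cspdarknet_s,
    'cspdarknet_m': cspdarknet_m,
    'cspdarknet_l': cspdarknet_l,
    'cspdarknet_x': cspdarknet_x,
}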

if __name__ == '__main__':
    from thop import profile

    # build model
    model = cspdarknet_s()
    x = torch.randn(1, 3, 224, 224)

    print('==============================')
    flops, params = profile(model, inputs=(x, ), verbose=False)
    print('GFLOPs : {:.2f}'.format(flops / 1e9 * 2))
    print('Params : {:.2f} M'.format(params / 1e6))
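    # Output-shape sanity check (illustrative addition; assumes the default
    # 1000-class head and the 224x224 input created above).
    with torch.no_grad():
        out = model(x)
    print('Output shape : {}'.format(out.shape))  # expected: torch.Size([1, 1000])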