2 ani în urmă · 62a5b79e6a
--- a/config/model_config/rtcdet_config.py
+++ b/config/model_config/rtcdet_config.py
@@ -15,7 +15,7 @@ rtcdet_cfg = {
 
															         'stride': [8, 16, 32],  # P3, P4, P5
														
 
															         'max_stride': 32,
														
 
															         ## Neck: SPP
														
 
															-        'neck': 'csp_sppf',
														
 
															+        'neck': 'sppf',
														
 
															         'neck_expand_ratio': 0.5,
														
 
															         'pooling_size': 5,
														
 
															         'neck_act': 'silu',
														
@@ -71,7 +71,7 @@ rtcdet_cfg = {
 
															         'stride': [8, 16, 32],  # P3, P4, P5
														
 
															         'max_stride': 32,
														
 
															         ## Neck: SPP
														
 
															-        'neck': 'csp_sppf',
														
 
															+        'neck': 'sppf',
														
 
															         'neck_expand_ratio': 0.5,
														
 
															         'pooling_size': 5,
														
 
															         'neck_act': 'silu',
														
@@ -80,7 +80,7 @@ rtcdet_cfg = {
 
															         ## Neck: PaFPN
														
 
															         'fpn': 'rtcdet_pafpn',
														
 
															         'fpn_reduce_layer': 'conv',
														
 
															-        'fpn_downsample_layer': 'conv',
														
 
															+        'fpn_downsample_layer': 'dsblock',
														
 
															         'fpn_core_block': 'elan_block',
														
 
															         'fpn_branch_depth': 3,
														
 
															         'fpn_expand_ratio': 0.5,
														
--- a/models/detectors/rtcdet/rtcdet_basic.py
+++ b/models/detectors/rtcdet/rtcdet_basic.py
@@ -329,5 +329,7 @@ def build_downsample_layer(cfg, in_dim, out_dim):
 
															     elif cfg['fpn_downsample_layer'] == 'maxpool':
														
 
															         assert in_dim == out_dim
														
 
															         layer = nn.MaxPool2d((2, 2), stride=2)
														
 
															+    elif cfg['fpn_downsample_layer'] == 'dsblock':
														
 
															+        layer = DSBlock(in_dim, out_dim, cfg['fpn_act'], cfg['fpn_norm'], cfg['fpn_depthwise'])
														
 
															     return layer
														
--- a/models/detectors/rtcdet/rtcdet_pafpn.py
+++ b/models/detectors/rtcdet/rtcdet_pafpn.py
@@ -17,29 +17,24 @@ class RTCDetPaFPN(nn.Module):
 
															         # --------------------------- Top-down FPN ---------------------------
														
 
															         ## P5 -> P4
														
 
															-        self.reduce_layer_1 = build_reduce_layer(cfg, in_dims[2], round(256*cfg['width']))
														
 
															-        self.reduce_layer_2 = build_reduce_layer(cfg, in_dims[1], round(256*cfg['width']))
														
 
															-        self.top_down_layer_1 = build_fpn_block(cfg, round(256*cfg['width']) + round(256*cfg['width']), round(256*cfg['width']))
														
 
															+        self.reduce_layer_1 = build_reduce_layer(cfg, in_dims[2], round(512*cfg['width']))
														
 
															+        self.reduce_layer_2 = build_reduce_layer(cfg, in_dims[1], round(512*cfg['width']))
														
 
															+        self.top_down_layer_1 = build_fpn_block(cfg, round(512*cfg['width']) + round(512*cfg['width']), round(512*cfg['width']))
														
 
															         ## P4 -> P3
														
 
															-        self.reduce_layer_3 = build_reduce_layer(cfg, round(256*cfg['width']), round(128*cfg['width']))
														
 
															-        self.reduce_layer_4 = build_reduce_layer(cfg, in_dims[0], round(128*cfg['width']))
														
 
															-        self.top_down_layer_2 = build_fpn_block(cfg, round(128*cfg['width']) + round(128*cfg['width']), round(128*cfg['width']))
														
 
															+        self.reduce_layer_3 = build_reduce_layer(cfg, round(512*cfg['width']), round(256*cfg['width']))
														
 
															+        self.reduce_layer_4 = build_reduce_layer(cfg, in_dims[0], round(256*cfg['width']))
														
 
															+        self.top_down_layer_2 = build_fpn_block(cfg, round(256*cfg['width']) + round(256*cfg['width']), round(256*cfg['width']))
														
 
															         # --------------------------- Bottom-up FPN ---------------------------
														
 
															         ## P3 -> P4
														
 
															-        self.downsample_layer_1 = build_downsample_layer(cfg, round(128*cfg['width']), round(256*cfg['width']))
														
 
															-        self.bottom_up_layer_1 = build_fpn_block(cfg, round(256*cfg['width']) + round(256*cfg['width']), round(256*cfg['width']))
														
 
															+        self.downsample_layer_1 = build_downsample_layer(cfg, round(256*cfg['width']), round(256*cfg['width']))
														
 
															+        self.bottom_up_layer_1 = build_fpn_block(cfg, round(256*cfg['width']) + round(256*cfg['width']), round(512*cfg['width']))
														
 
															         ## P4 -> P5
														
 
															-        self.downsample_layer_2 = build_downsample_layer(cfg, round(256*cfg['width']), round(512*cfg['width']))
														
 
															-        self.bottom_up_layer_2 = build_fpn_block(cfg, round(512*cfg['width']) + in_dims[2], round(512*cfg['width']))
														
 
															-                
														
 
															-        ## Head convs
														
 
															-        self.head_conv_1 = Conv(round(128*cfg['width']), round(256*cfg['width']), k=3, s=1, p=1, act_type=cfg['fpn_act'], norm_type=cfg['fpn_norm'])
														
 
															-        self.head_conv_2 = Conv(round(256*cfg['width']), round(512*cfg['width']), k=3, s=1, p=1, act_type=cfg['fpn_act'], norm_type=cfg['fpn_norm'])
														
 
															-        self.head_conv_3 = Conv(round(512*cfg['width']), round(1024*cfg['width']), k=3, s=1, p=1, act_type=cfg['fpn_act'], norm_type=cfg['fpn_norm'])
														
 
															-        
														
 
															+        self.downsample_layer_2 = build_downsample_layer(cfg, round(512*cfg['width']), round(512*cfg['width']))
														
 
															+        self.bottom_up_layer_2 = build_fpn_block(cfg, round(512*cfg['width']) + round(512*cfg['width']), round(1024*cfg['width']))
														
 
															+                        
														
 
															         # --------------------------- Output proj ---------------------------
														
 
															         if out_dim is not None:
														
 
															             self.out_layers = nn.ModuleList([
														
@@ -57,29 +52,26 @@ class RTCDetPaFPN(nn.Module):
 
															         # Top down
														
 
															         ## P5 -> P4
														
 
															         c6 = self.reduce_layer_1(c5)
														
 
															-        c7 = F.interpolate(c6, scale_factor=2.0)
														
 
															-        c8 = torch.cat([c7, self.reduce_layer_2(c4)], dim=1)
														
 
															+        c7 = self.reduce_layer_2(c4)
														
 
															+        c8 = torch.cat([F.interpolate(c6, scale_factor=2.0), c7], dim=1)
														
 
															         c9 = self.top_down_layer_1(c8)
														
 
															         ## P4 -> P3
														
 
															         c10 = self.reduce_layer_3(c9)
														
 
															-        c11 = F.interpolate(c10, scale_factor=2.0)
														
 
															-        c12 = torch.cat([c11, self.reduce_layer_4(c3)], dim=1)
														
 
															+        c11 = self.reduce_layer_4(c3)
														
 
															+        c12 = torch.cat([F.interpolate(c10, scale_factor=2.0), c11], dim=1)
														
 
															         c13 = self.top_down_layer_2(c12)
														
 
															         # Bottom up
														
 
															-        ## p3 -> P4
														
 
															+        # P3 -> P4
														
 
															         c14 = self.downsample_layer_1(c13)
														
 
															-        c15 = torch.cat([c14, c9], dim=1)
														
 
															+        c15 = torch.cat([c14, c10], dim=1)
														
 
															         c16 = self.bottom_up_layer_1(c15)
														
 
															-        ## P4 -> P5
														
 
															+        # P4 -> P5
														
 
															         c17 = self.downsample_layer_2(c16)
														
 
															-        c18 = torch.cat([c17, c5], dim=1)
														
 
															+        c18 = torch.cat([c17, c6], dim=1)
														
 
															         c19 = self.bottom_up_layer_2(c18)
														
 
															-        c20 = self.head_conv_1(c13)
														
 
															-        c21 = self.head_conv_2(c16)
														
 
															-        c22 = self.head_conv_3(c19)
														
 
															-        out_feats = [c20, c21, c22] # [P3, P4, P5]
														
 
															+        out_feats = [c13, c16, c19] # [P3, P4, P5]
														
 
															         # output proj layers
														
 
															         if self.out_layers is not None: