gelan_config.py 6.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215
  1. # Gelan (proposed by yolov9) config
  2. def build_gelan_config(args):
  3. if args.model == 'gelan_s':
  4. return GElanSConfig()
  5. elif args.model == 'gelan_c':
  6. return GElanCConfig()
  7. else:
  8. raise NotImplementedError("No config for model: {}".format(args.model))
  9. # GELAN-Base config
  10. class GElanBaseConfig(object):
  11. def __init__(self) -> None:
  12. # ---------------- Model config ----------------
  13. self.reg_max = 16
  14. self.out_stride = [8, 16, 32]
  15. self.max_stride = 32
  16. self.num_levels = 3
  17. ## Backbone
  18. self.backbone = 'gelan'
  19. self.bk_act = 'silu'
  20. self.bk_norm = 'BN'
  21. self.bk_depthwise = False
  22. self.bk_down_pooling = True
  23. self.use_pretrained = True
  24. self.backbone_feats = {
  25. "c1": [64],
  26. "c2": [128, [128, 64], 256],
  27. "c3": [256, [256, 128], 512],
  28. "c4": [512, [512, 256], 512],
  29. "c5": [512, [512, 256], 512],
  30. }
  31. self.scale = "l"
  32. self.backbone_depth = 1
  33. ## Neck
  34. self.neck = 'spp_elan'
  35. self.neck_act = 'silu'
  36. self.neck_norm = 'BN'
  37. self.spp_pooling_size = 5
  38. self.spp_inter_dim = 256
  39. self.spp_out_dim = 512
  40. ## FPN
  41. self.fpn = 'gelan_pafpn'
  42. self.fpn_act = 'silu'
  43. self.fpn_norm = 'BN'
  44. self.fpn_depthwise = False
  45. self.fpn_down_pooling = True
  46. self.fpn_depth = 1
  47. self.fpn_feats_td = {
  48. "p4": [[512, 256], 512],
  49. "p3": [[256, 128], 256],
  50. }
  51. self.fpn_feats_bu = {
  52. "p4": [[512, 256], 512],
  53. "p5": [[512, 256], 512],
  54. }
  55. ## Head
  56. self.head = 'gelan_head'
  57. self.head_act = 'silu'
  58. self.head_norm = 'BN'
  59. self.head_depthwise = False
  60. self.num_cls_head = 2
  61. self.num_reg_head = 2
  62. # ---------------- Post-process config ----------------
  63. ## Post process
  64. self.val_topk = 1000
  65. self.val_conf_thresh = 0.001
  66. self.val_nms_thresh = 0.7
  67. self.test_topk = 100
  68. self.test_conf_thresh = 0.2
  69. self.test_nms_thresh = 0.5
  70. # ---------------- Assignment config ----------------
  71. ## Matcher
  72. self.tal_topk_candidates = 10
  73. self.tal_alpha = 0.5
  74. self.tal_beta = 6.0
  75. ## Loss weight
  76. self.loss_cls = 0.5
  77. self.loss_box = 7.5
  78. self.loss_dfl = 1.5
  79. # ---------------- ModelEMA config ----------------
  80. self.use_ema = True
  81. self.ema_decay = 0.9998
  82. self.ema_tau = 2000
  83. # ---------------- Optimizer config ----------------
  84. self.trainer = 'yolo'
  85. self.optimizer = 'adamw'
  86. self.per_image_lr = 0.001 / 64
  87. self.base_lr = None # base_lr = per_image_lr * batch_size
  88. self.min_lr_ratio = 0.01 # min_lr = base_lr * min_lr_ratio
  89. self.momentum = 0.9
  90. self.weight_decay = 0.05
  91. self.clip_max_norm = 35.0
  92. self.warmup_bias_lr = 0.1
  93. self.warmup_momentum = 0.8
  94. # ---------------- Lr Scheduler config ----------------
  95. self.warmup_epoch = 3
  96. self.lr_scheduler = "cosine"
  97. self.max_epoch = 300
  98. self.eval_epoch = 10
  99. self.no_aug_epoch = 20
  100. # ---------------- Data process config ----------------
  101. self.aug_type = 'yolo'
  102. self.box_format = 'xyxy'
  103. self.normalize_coords = False
  104. self.mosaic_prob = 0.0
  105. self.mixup_prob = 0.0
  106. self.copy_paste = 0.0 # approximated by the YOLOX's mixup
  107. self.multi_scale = [0.5, 1.25] # multi scale: [img_size * 0.5, img_size * 1.25]
  108. ## Pixel mean & std
  109. self.pixel_mean = [0., 0., 0.]
  110. self.pixel_std = [255., 255., 255.]
  111. ## Transforms
  112. self.train_img_size = 640
  113. self.test_img_size = 640
  114. self.use_ablu = True
  115. self.affine_params = {
  116. 'degrees': 0.0,
  117. 'translate': 0.2,
  118. 'scale': [0.1, 2.0],
  119. 'shear': 0.0,
  120. 'perspective': 0.0,
  121. 'hsv_h': 0.015,
  122. 'hsv_s': 0.7,
  123. 'hsv_v': 0.4,
  124. }
  125. def print_config(self):
  126. config_dict = {key: value for key, value in self.__dict__.items() if not key.startswith('__')}
  127. for k, v in config_dict.items():
  128. print("{} : {}".format(k, v))
  129. # GELAN-C
  130. class GElanCConfig(GElanBaseConfig):
  131. def __init__(self) -> None:
  132. super().__init__()
  133. self.backbone = 'gelan'
  134. self.use_pretrained = True
  135. self.scale = "l"
  136. # ---------------- Data process config ----------------
  137. self.mosaic_prob = 1.0
  138. self.mixup_prob = 0.1
  139. self.copy_paste = 0.5
  140. # GELAN-S
  141. class GElanSConfig(GElanBaseConfig):
  142. def __init__(self) -> None:
  143. super().__init__()
  144. # ---------------- Model config ----------------
  145. self.reg_max = 16
  146. self.out_stride = [8, 16, 32]
  147. self.max_stride = 32
  148. self.num_levels = 3
  149. ## Backbone
  150. self.backbone = 'gelan'
  151. self.bk_act = 'silu'
  152. self.bk_norm = 'BN'
  153. self.bk_depthwise = False
  154. self.use_pretrained = True
  155. self.backbone_feats = {
  156. "c1": [32],
  157. "c2": [64, [64, 32], 64],
  158. "c3": [64, [64, 32], 128],
  159. "c4": [128, [128, 64], 256],
  160. "c5": [256, [256, 128], 256],
  161. }
  162. self.scale = "l"
  163. self.backbone_depth = 3
  164. ## Neck
  165. self.neck = 'spp_elan'
  166. self.neck_act = 'silu'
  167. self.neck_norm = 'BN'
  168. self.spp_pooling_size = 5
  169. self.spp_inter_dim = 128
  170. self.spp_out_dim = 256
  171. ## FPN
  172. self.fpn = 'gelan_pafpn'
  173. self.fpn_act = 'silu'
  174. self.fpn_norm = 'BN'
  175. self.fpn_depthwise = False
  176. self.fpn_depth = 3
  177. self.fpn_feats_td = {
  178. "p4": [[256, 128], 256],
  179. "p3": [[128, 64], 128],
  180. }
  181. self.fpn_feats_bu = {
  182. "p4": [[256, 128], 256],
  183. "p5": [[256, 128], 256],
  184. }
  185. ## Head
  186. self.head = 'gelan_head'
  187. self.head_act = 'silu'
  188. self.head_norm = 'BN'
  189. self.head_depthwise = False
  190. self.num_cls_head = 2
  191. self.num_reg_head = 2
  192. # ---------------- Data process config ----------------
  193. self.mosaic_prob = 1.0
  194. self.mixup_prob = 0.0
  195. self.copy_paste = 0.5 # approximated by the YOLOX's mixup
  196. def print_config(self):
  197. config_dict = {key: value for key, value in self.__dict__.items() if not key.startswith('__')}
  198. for k, v in config_dict.items():
  199. print("{} : {}".format(k, v))