# rtpdetr_config.py (1.8 KB)
  1. # Real-time Transformer-based Object Detector
  2. # ------------------- Det task --------------------
  3. rtpdetr_cfg = {
  4. 'rtpdetr_r50':{
  5. # ---------------- Model config ----------------
  6. ## Model scale
  7. 'width': 1.0,
  8. 'depth': 1.0,
  9. 'max_stride': 32,
  10. 'out_stride': 16,
  11. # Image Encoder - Backbone
  12. 'backbone': 'resnet50',
  13. 'backbone_norm': 'FrozeBN',
  14. 'pretrained': True,
  15. 'freeze_at': 0,
  16. 'freeze_stem_only': False,
  17. 'hidden_dim': 256,
  18. 'en_num_heads': 8,
  19. 'en_num_layers': 6,
  20. 'en_ffn_dim': 2048,
  21. 'en_dropout': 0.0,
  22. 'en_act': 'gelu',
  23. # Transformer Decoder
  24. 'transformer': 'plain_detr_transformer',
  25. 'de_num_heads': 8,
  26. 'de_num_layers': 6,
  27. 'de_ffn_dim': 2048,
  28. 'de_dropout': 0.0,
  29. 'de_act': 'gelu',
  30. 'de_pre_norm': True,
  31. 'rpe_hidden_dim': 512,
  32. 'use_checkpoint': False,
  33. 'proposal_feature_levels': 3,
  34. 'proposal_tgt_strides': [8, 16, 32],
  35. 'num_queries_one2one': 300,
  36. 'num_queries_one2many': 1500,
  37. # ---------------- Assignment config ----------------
  38. 'matcher_hpy': {'cost_class': 2.0,
  39. 'cost_bbox': 1.0,
  40. 'cost_giou': 2.0,},
  41. # ---------------- Loss config ----------------
  42. 'k_one2many': 6,
  43. 'lambda_one2many': 1.0,
  44. 'loss_coeff': {'class': 2,
  45. 'bbox': 1,
  46. 'giou': 2,},
  47. # ---------------- Train config ----------------
  48. ## input
  49. 'multi_scale': [0.5, 1.25], # 320 -> 800
  50. 'trans_type': 'rtdetr_l',
  51. # ---------------- Train config ----------------
  52. 'trainer_type': 'rtdetr',
  53. },
  54. }