build.py 1.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263
  1. #!/usr/bin/env python3
  2. # -*- coding:utf-8 -*-
  3. import torch
  4. import torch.nn as nn
  5. from .loss import build_criterion
  6. from .yolox import YOLOX
  7. # build object detector
  8. def build_yolox(args, cfg, device, num_classes=80, trainable=False):
  9. print('==============================')
  10. print('Build {} ...'.format(args.model.upper()))
  11. print('==============================')
  12. print('Model Configuration: \n', cfg)
  13. # -------------- Build YOLO --------------
  14. model = YOLOX(
  15. cfg=cfg,
  16. device=device,
  17. num_classes=num_classes,
  18. trainable=trainable,
  19. conf_thresh=args.conf_thresh,
  20. nms_thresh=args.nms_thresh,
  21. topk=args.topk,
  22. )
  23. # -------------- Initialize YOLO --------------
  24. for m in model.modules():
  25. if isinstance(m, nn.BatchNorm2d):
  26. m.eps = 1e-3
  27. m.momentum = 0.03
  28. # Init bias
  29. init_prob = 0.01
  30. bias_value = -torch.log(torch.tensor((1. - init_prob) / init_prob))
  31. # obj pred
  32. for obj_pred in model.obj_preds:
  33. b = obj_pred.bias.view(1, -1)
  34. b.data.fill_(bias_value.item())
  35. obj_pred.bias = torch.nn.Parameter(b.view(-1), requires_grad=True)
  36. # cls pred
  37. for cls_pred in model.cls_preds:
  38. b = cls_pred.bias.view(1, -1)
  39. b.data.fill_(bias_value.item())
  40. cls_pred.bias = torch.nn.Parameter(b.view(-1), requires_grad=True)
  41. # reg pred
  42. for reg_pred in model.reg_preds:
  43. b = reg_pred.bias.view(-1, )
  44. b.data.fill_(1.0)
  45. reg_pred.bias = torch.nn.Parameter(b.view(-1), requires_grad=True)
  46. w = reg_pred.weight
  47. w.data.fill_(0.)
  48. reg_pred.weight = torch.nn.Parameter(w, requires_grad=True)
  49. # -------------- Build criterion --------------
  50. criterion = None
  51. if trainable:
  52. # build criterion for training
  53. criterion = build_criterion(cfg, device, num_classes)
  54. return model, criterion