# dino_r50.yml
#
# Model definition for a DETR-architecture detector. The top-level scalars
# select the architecture and the pretrained weights; the `DETR` mapping names
# the component used for each role, and every component named there has its
# own top-level section below holding that component's settings.
#
# NOTE(review): the nesting in this file was restored from a flattened copy
# (indentation lost). Section membership is unambiguous for the top-level
# components; the placement of `aux_loss` and `matcher` inside `loss` is the
# most likely reading - confirm against the upstream config.

architecture: DETR
pretrain_weights: https://paddledet.bj.bcebos.com/models/pretrained/ResNet50_cos_pretrained.pdparams
hidden_dim: 256
use_focal_loss: True

# Component wiring: each value is the name of a section defined further down.
DETR:
  backbone: ResNet
  transformer: DINOTransformer
  detr_head: DINOHead
  post_process: DETRBBoxPostProcess

ResNet:
  # index 0 stands for res2
  depth: 50
  norm_type: bn
  freeze_at: 0
  return_idx: [1, 2, 3]
  lr_mult_list: [0.0, 0.1, 0.1, 0.1]
  num_stages: 4

DINOTransformer:
  num_queries: 900
  position_embed_type: sine
  num_levels: 4
  nhead: 8
  num_encoder_layers: 6
  num_decoder_layers: 6
  dim_feedforward: 2048
  dropout: 0.0
  activation: relu
  pe_temperature: 20
  pe_offset: 0.0
  num_denoising: 100
  label_noise_ratio: 0.5
  box_noise_scale: 1.0
  learnt_init_query: True

DINOHead:
  loss:
    name: DINOLoss
    loss_coeff: {class: 1, bbox: 5, giou: 2}
    aux_loss: True
    # `matcher` must be its own mapping: it carries a second `name` key, which
    # would be a duplicate if it sat at the same level as `name: DINOLoss`.
    matcher:
      name: HungarianMatcher
      matcher_coeff: {class: 2, bbox: 5, giou: 2}

DETRBBoxPostProcess:
  num_top_queries: 300