# mask_rcnn_r50_fpn.yml (1.7 KB)

  # Model selection: the architecture name (configured by the section of the
  # same name in this file) and the URL of the pretrained weights.
  architecture: MaskRCNN
  pretrain_weights: https://paddledet.bj.bcebos.com/models/pretrained/ResNet50_cos_pretrained.pdparams
  # Component wiring for the MaskRCNN architecture. Each value is the name of
  # another top-level section in this file that configures that component.
  MaskRCNN:
    backbone: ResNet
    neck: FPN
    rpn_head: RPNHead
    bbox_head: BBoxHead
    mask_head: MaskHead
    # post process
    bbox_post_process: BBoxPostProcess
    mask_post_process: MaskPostProcess
  # Backbone settings (this section is named by MaskRCNN.backbone).
  ResNet:
    # index 0 stands for res2
    # NOTE(review): presumably this refers to the stage indices used by
    # freeze_at and return_idx below -- confirm against the backbone code.
    depth: 50
    norm_type: bn
    freeze_at: 0
    return_idx: [0, 1, 2, 3]
    num_stages: 4
  # Neck settings (this section is named by MaskRCNN.neck).
  FPN:
    out_channel: 256
  # RPN head settings (this section is named by MaskRCNN.rpn_head).
  RPNHead:
    # anchor_sizes and strides each list five entries.
    # NOTE(review): presumably one entry per feature level -- confirm.
    anchor_generator:
      aspect_ratios: [0.5, 1.0, 2.0]
      anchor_sizes: [[32], [64], [128], [256], [512]]
      strides: [4, 8, 16, 32, 64]
    rpn_target_assign:
      batch_size_per_im: 256
      fg_fraction: 0.5
      negative_overlap: 0.3
      positive_overlap: 0.7
      use_random: True
    # Training keeps more pre-NMS candidates (2000) than testing (1000) and
    # additionally sets topk_after_collect, which test_proposal does not.
    train_proposal:
      min_size: 0.0
      nms_thresh: 0.7
      pre_nms_top_n: 2000
      post_nms_top_n: 1000
      topk_after_collect: True
    test_proposal:
      min_size: 0.0
      nms_thresh: 0.7
      pre_nms_top_n: 1000
      post_nms_top_n: 1000
  # Box head settings (this section is named by MaskRCNN.bbox_head).
  # `head` and `bbox_assigner` name other top-level sections in this file.
  BBoxHead:
    head: TwoFCHead
    roi_extractor:
      resolution: 7
      sampling_ratio: 0
      aligned: True
    # NOTE(review): placed at BBoxHead level (not under roi_extractor) because
    # its value names the BBoxAssigner section -- confirm against the schema.
    bbox_assigner: BBoxAssigner
  # Assigner settings (this section is named by BBoxHead.bbox_assigner).
  # bg_thresh and fg_thresh are set to the same value here.
  BBoxAssigner:
    batch_size_per_im: 512
    bg_thresh: 0.5
    fg_thresh: 0.5
    fg_fraction: 0.25
    use_random: True
  # Settings for the head named by BBoxHead.head.
  TwoFCHead:
    out_channel: 1024
  # Box post-processing (this section is named by MaskRCNN.bbox_post_process).
  BBoxPostProcess:
    decode: RCNNBox
    # `name` selects the NMS implementation; the remaining keys are its
    # settings.
    nms:
      name: MultiClassNMS
      keep_top_k: 100
      score_threshold: 0.05
      nms_threshold: 0.5
  # Mask head settings (this section is named by MaskRCNN.mask_head).
  # `head` and `mask_assigner` name other top-level sections in this file.
  MaskHead:
    head: MaskFeat
    roi_extractor:
      resolution: 14
      sampling_ratio: 0
      aligned: True
    # NOTE(review): the two keys below are placed at MaskHead level (not under
    # roi_extractor), mirroring BBoxHead -- confirm against the schema.
    mask_assigner: MaskAssigner
    share_bbox_feat: False
  # Settings for the head named by MaskHead.head.
  MaskFeat:
    num_convs: 4
    out_channel: 256
  # Assigner settings (this section is named by MaskHead.mask_assigner).
  MaskAssigner:
    mask_resolution: 28
  # Mask post-processing (this section is named by
  # MaskRCNN.mask_post_process).
  MaskPostProcess:
    binary_thresh: 0.5