heavengate
diff --git a/‎configs/gfl/README.md‎
Lines changed: 37 additions & 0 deletions b/‎configs/gfl/README.md‎
Lines changed: 37 additions & 0 deletions
diff --git a/‎configs/gfl/_base_/gfl_r50_fpn.yml‎
Lines changed: 51 additions & 0 deletions b/‎configs/gfl/_base_/gfl_r50_fpn.yml‎
Lines changed: 51 additions & 0 deletions
diff --git a/‎configs/gfl/_base_/gfl_reader.yml‎
Lines changed: 40 additions & 0 deletions b/‎configs/gfl/_base_/gfl_reader.yml‎
Lines changed: 40 additions & 0 deletions
diff --git a/‎configs/gfl/_base_/gflv2_r50_fpn.yml‎
Lines changed: 56 additions & 0 deletions b/‎configs/gfl/_base_/gflv2_r50_fpn.yml‎
Lines changed: 56 additions & 0 deletions
diff --git a/‎configs/gfl/_base_/optimizer_1x.yml‎
Lines changed: 19 additions & 0 deletions b/‎configs/gfl/_base_/optimizer_1x.yml‎
Lines changed: 19 additions & 0 deletions
diff --git a/‎configs/gfl/gfl_r50_fpn_1x_coco.yml‎
Lines changed: 10 additions & 0 deletions b/‎configs/gfl/gfl_r50_fpn_1x_coco.yml‎
Lines changed: 10 additions & 0 deletions
diff --git a/‎configs/gfl/gflv2_r50_fpn_1x_coco.yml‎
Lines changed: 10 additions & 0 deletions b/‎configs/gfl/gflv2_r50_fpn_1x_coco.yml‎
Lines changed: 10 additions & 0 deletions
diff --git a/‎configs/picodet/README.md‎
Lines changed: 48 additions & 0 deletions b/‎configs/picodet/README.md‎
Lines changed: 48 additions & 0 deletions
diff --git a/‎configs/picodet/_base_/optimizer_280e.yml‎
Lines changed: 18 additions & 0 deletions b/‎configs/picodet/_base_/optimizer_280e.yml‎
Lines changed: 18 additions & 0 deletions
diff --git a/‎configs/picodet/_base_/picodet_320_reader.yml‎
Lines changed: 45 additions & 0 deletions b/‎configs/picodet/_base_/picodet_320_reader.yml‎
Lines changed: 45 additions & 0 deletions
@@ -0,0 +1,37 @@
+# Generalized Focal Loss Model(GFL)
+
+## Introduction
+
+[Generalized Focal Loss: Learning Qualified and Distributed Bounding Boxes for Dense Object Detection](https://arxiv.org/abs/2006.04388) and [Generalized Focal Loss V2](https://arxiv.org/pdf/2011.12885.pdf)
+
+
+
+## Model Zoo
+
+| Backbone        | Model      | images/GPU | lr schedule |FPS | Box AP |                           download                          | config |
+| :-------------- | :------------- | :-----: | :-----: | :------------: | :-----: | :-----------------------------------------------------: | :-----: |
+| ResNet50-FPN    | GFL           |    2    |   1x      |     ----     |  40.1  | [download](https://paddledet.bj.bcebos.com/models/gfl_r50_fpn_1x_coco.pdparams) | [config](https://github.com/PaddlePaddle/PaddleDetection/tree/develop/configs/gfl/gfl_r50_fpn_1x_coco.yml) |
+| ResNet50-FPN    | GFLv2       |    2    |   1x      |     ----     |  40.4  | [download](https://paddledet.bj.bcebos.com/models/gflv2_r50_fpn_1x_coco.pdparams) | [config](https://github.com/PaddlePaddle/PaddleDetection/tree/develop/configs/gfl/gflv2_r50_fpn_1x_coco.yml) |
+
+
+**Notes:**
+
+- GFL is trained on the COCO train2017 dataset and evaluated on val2017; results are reported as `mAP(IoU=0.5:0.95)`.
+
+## Citations
+```
+@article{li2020generalized,
+  title={Generalized Focal Loss: Learning Qualified and Distributed Bounding Boxes for Dense Object Detection},
+  author={Li, Xiang and Wang, Wenhai and Wu, Lijun and Chen, Shuo and Hu, Xiaolin and Li, Jun and Tang, Jinhui and Yang, Jian},
+  journal={arXiv preprint arXiv:2006.04388},
+  year={2020}
+}
+
+@article{li2020gflv2,
+  title={Generalized Focal Loss V2: Learning Reliable Localization Quality Estimation for Dense Object Detection},
+  author={Li, Xiang and Wang, Wenhai and Hu, Xiaolin and Li, Jun and Tang, Jinhui and Yang, Jian},
+  journal={arXiv preprint arXiv:2011.12885},
+  year={2020}
+}
+
+```
@@ -0,0 +1,51 @@
+# Top-level architecture name; the section of the same name below wires it up.
+architecture: GFL
+# URL of the pretrained weights (file name indicates a ResNet50 checkpoint).
+pretrain_weights: 'https://paddledet.bj.bcebos.com/models/pretrained/ResNet50_cos_pretrained.pdparams'
+
+# Each value names a component that is configured in its own section of this file.
+GFL:
+  backbone: ResNet
+  neck: FPN
+  head: GFLHead
+
+# Backbone settings (this section is referenced by `GFL.backbone`).
+ResNet:
+  depth: 50
+  variant: b
+  num_stages: 4
+  # Three entries, the same count as `FPN.spatial_scales`.
+  return_idx: [1, 2, 3]
+  norm_type: bn
+  freeze_at: 0
+
+# Neck settings (this section is referenced by `GFL.neck`).
+FPN:
+  out_channel: 256
+  # 1/8, 1/16 and 1/32; three entries, the same count as `ResNet.return_idx`.
+  spatial_scales: [0.125, 0.0625, 0.03125]
+  use_c5: false
+  has_extra_convs: true
+  # 3 scales + 2 extra stages = 5, the number of entries in `GFLHead.fpn_stride`
+  # (presumably not a coincidence — confirm against the FPN implementation).
+  extra_stage: 2
+
+# Detection head settings (this section is referenced by `GFL.head`).
+GFLHead:
+  # Feature sub-module; `feat_in` has the same value as `FPN.out_channel` (256).
+  conv_feat:
+    name: FCOSFeat
+    feat_in: 256
+    feat_out: 256
+    num_convs: 4
+    norm_type: gn
+    use_dcn: false
+  # Five strides, doubling from 8 to 128.
+  fpn_stride: [8, 16, 32, 64, 128]
+  prior_prob: 0.01
+  reg_max: 16
+  # Three loss terms, each carrying its own `loss_weight`.
+  loss_qfl:
+    name: QualityFocalLoss
+    use_sigmoid: true
+    beta: 2.0
+    loss_weight: 1.0
+  loss_dfl:
+    name: DistributionFocalLoss
+    loss_weight: 0.25
+  loss_bbox:
+    name: GIoULoss
+    loss_weight: 2.0
+  # Non-maximum-suppression settings.
+  nms:
+    name: MultiClassNMS
+    nms_top_k: 1000
+    keep_top_k: 100
+    score_threshold: 0.025
+    nms_threshold: 0.6
@@ -0,0 +1,40 @@
+# Top-level reader setting.
+worker_num: 2
+
+# Training reader: a list of per-sample transforms, a list of per-batch
+# transforms, then batching options. List order is preserved as written.
+TrainReader:
+  sample_transforms:
+  - Decode: {}
+  - RandomFlip:
+      prob: 0.5
+  - NormalizeImage:
+      is_scale: true
+      mean: [0.485, 0.456, 0.406]
+      std: [0.229, 0.224, 0.225]
+  - Resize:
+      target_size: [800, 1333]
+      keep_ratio: true
+      interp: 1
+  - Permute: {}
+  batch_transforms:
+  - PadBatch:
+      pad_to_stride: 32
+  # `downsample_ratios` has the same five values as `GFLHead.fpn_stride`
+  # in the GFL model configs.
+  - Gt2GFLTarget:
+      downsample_ratios: [8, 16, 32, 64, 128]
+      grid_cell_scale: 8
+  batch_size: 2
+  shuffle: true
+  drop_last: true
+
+
+# Evaluation reader: same normalisation and resize values as TrainReader,
+# without RandomFlip or Gt2GFLTarget, and with shuffling off.
+EvalReader:
+  sample_transforms:
+  - Decode: {}
+  - NormalizeImage:
+      is_scale: true
+      mean: [0.485, 0.456, 0.406]
+      std: [0.229, 0.224, 0.225]
+  - Resize:
+      interp: 1
+      target_size: [800, 1333]
+      keep_ratio: true
+  - Permute: {}
+  batch_transforms:
+  - PadBatch:
+      pad_to_stride: 32
+  batch_size: 2
+  shuffle: false
+
+
+# Test reader: same transforms as EvalReader, one image per batch.
+TestReader:
+  sample_transforms:
+  - Decode: {}
+  - NormalizeImage:
+      is_scale: true
+      mean: [0.485, 0.456, 0.406]
+      std: [0.229, 0.224, 0.225]
+  - Resize:
+      interp: 1
+      target_size: [800, 1333]
+      keep_ratio: true
+  - Permute: {}
+  batch_transforms:
+  - PadBatch:
+      pad_to_stride: 32
+  batch_size: 1
+  shuffle: false
@@ -0,0 +1,56 @@
+# Top-level architecture name; the section of the same name below wires it up.
+architecture: GFL
+# URL of the pretrained weights (file name indicates a ResNet50 checkpoint).
+pretrain_weights: 'https://paddledet.bj.bcebos.com/models/pretrained/ResNet50_cos_pretrained.pdparams'
+
+# Each value names a component that is configured in its own section of this file.
+GFL:
+  backbone: ResNet
+  neck: FPN
+  head: GFLHead
+
+# Backbone settings (this section is referenced by `GFL.backbone`).
+ResNet:
+  depth: 50
+  variant: b
+  num_stages: 4
+  # Three entries, the same count as `FPN.spatial_scales`.
+  return_idx: [1, 2, 3]
+  norm_type: bn
+  freeze_at: 0
+
+# Neck settings (this section is referenced by `GFL.neck`).
+FPN:
+  out_channel: 256
+  # 1/8, 1/16 and 1/32; three entries, the same count as `ResNet.return_idx`.
+  spatial_scales: [0.125, 0.0625, 0.03125]
+  use_c5: false
+  has_extra_convs: true
+  # 3 scales + 2 extra stages = 5, the number of entries in `GFLHead.fpn_stride`
+  # (presumably not a coincidence — confirm against the FPN implementation).
+  extra_stage: 2
+
+# Detection head settings (this section is referenced by `GFL.head`).
+GFLHead:
+  # Feature sub-module; `feat_in` has the same value as `FPN.out_channel` (256).
+  conv_feat:
+    name: FCOSFeat
+    feat_in: 256
+    feat_out: 256
+    num_convs: 4
+    norm_type: gn
+    use_dcn: false
+  # Five strides, doubling from 8 to 128.
+  fpn_stride: [8, 16, 32, 64, 128]
+  prior_prob: 0.01
+  reg_max: 16
+  # DGQP sub-module; this key is absent from the GFL (v1) base config.
+  dgqp_module:
+    name: DGQP
+    reg_topk: 4
+    reg_channels: 64
+    add_mean: true
+  # Three loss terms, each carrying its own `loss_weight`.
+  # `use_sigmoid` is false here, whereas the GFL (v1) base config sets it to true.
+  loss_qfl:
+    name: QualityFocalLoss
+    use_sigmoid: false
+    beta: 2.0
+    loss_weight: 1.0
+  loss_dfl:
+    name: DistributionFocalLoss
+    loss_weight: 0.25
+  loss_bbox:
+    name: GIoULoss
+    loss_weight: 2.0
+  # Non-maximum-suppression settings.
+  nms:
+    name: MultiClassNMS
+    nms_top_k: 1000
+    keep_top_k: 100
+    score_threshold: 0.025
+    nms_threshold: 0.6
@@ -0,0 +1,19 @@
+# Schedule length.
+epoch: 12
+
+# Learning rate: a base value plus a two-element list of schedulers, each
+# declared with a custom YAML tag. The list order is kept exactly as written.
+LearningRate:
+  base_lr: 0.01
+  schedulers:
+  - !PiecewiseDecay
+    # Presumably epoch indices (both are below `epoch: 12`) — confirm.
+    milestones: [8, 11]
+    gamma: 0.1
+  - !LinearWarmup
+    steps: 500
+    start_factor: 0.1
+
+# Optimizer of type Momentum (momentum 0.9) with an L2 regularizer (factor 0.0001).
+OptimizerBuilder:
+  optimizer:
+    type: Momentum
+    momentum: 0.9
+  regularizer:
+    type: L2
+    factor: 0.0001
@@ -0,0 +1,10 @@
+# GFL entry config: composed from the dataset, runtime, model, optimizer and
+# reader base files listed here.
+_BASE_:
+  - '../datasets/coco_detection.yml'
+  - '../runtime.yml'
+  - '_base_/gfl_r50_fpn.yml'
+  - '_base_/optimizer_1x.yml'
+  - '_base_/gfl_reader.yml'
+
+# Default weights path; the directory name matches this config's file name.
+weights: output/gfl_r50_fpn_1x_coco/model_final
+find_unused_parameters: true
@@ -0,0 +1,10 @@
+# GFLv2 entry config: identical to the GFL entry config except that the model
+# base file is `_base_/gflv2_r50_fpn.yml`.
+_BASE_: [
+  '../datasets/coco_detection.yml',
+  '../runtime.yml',
+  '_base_/gflv2_r50_fpn.yml',
+  '_base_/optimizer_1x.yml',
+  '_base_/gfl_reader.yml',
+]
+
+# Default weights path. It must use this config's own name (gflv2_...), not the
+# GFL v1 directory, otherwise the default points at the other model's output.
+weights: output/gflv2_r50_fpn_1x_coco/model_final
+find_unused_parameters: true
@@ -0,0 +1,48 @@
+# PicoDet
+
+## Introduction
+
+We developed a series of mobile models named `PicoDet`.
+Optimization methods we use:
+- [Generalized Focal Loss V2](https://arxiv.org/pdf/2011.12885.pdf)
+- Lr Cosine Decay
+
+
+
+## Model Zoo
+
+### PicoDet-S
+
+| Backbone                  | Input size | images/GPU | lr schedule |Box AP | FLOPS | Inference Time |                           download                          | config |
+| :------------------------ | :-------: | :-------: | :-----------: | :---: | :-----: | :-----: | :-------------------------------------------------: | :-----: |
+| ShuffleNetv2-1x    | 320*320   |    128    |   280e      |   21.9     |  -- | -- | [download](https://paddledet.bj.bcebos.com/models/picodet_s_shufflenetv2_320_coco.pdparams) | [config](https://github.com/PaddlePaddle/PaddleDetection/tree/develop/configs/picodet/picodet_s_shufflenetv2_320_coco.yml) |
+| MobileNetv3-large-0.5x    | 320*320   |    128    |   280e      |   20.4     |  -- | -- | [download](https://paddledet.bj.bcebos.com/models/picodet_s_mbv3_320_coco.pdparams) | [config](https://github.com/PaddlePaddle/PaddleDetection/tree/develop/configs/picodet/picodet_s_mbv3_320_coco.yml) |
+| ShuffleNetv2-1x    | 416*416   |    96    |   280e      |   24.0     |  -- | -- | [download](https://paddledet.bj.bcebos.com/models/picodet_s_shufflenetv2_416_coco.pdparams) | [config](https://github.com/PaddlePaddle/PaddleDetection/tree/develop/configs/picodet/picodet_s_shufflenetv2_416_coco.yml) |
+| MobileNetv3-large-0.5x    | 416*416   |    96    |   280e      |   23.3     |  -- | -- | [download](https://paddledet.bj.bcebos.com/models/picodet_s_mbv3_416_coco.pdparams) | [config](https://github.com/PaddlePaddle/PaddleDetection/tree/develop/configs/picodet/picodet_s_mbv3_416_coco.yml) |
+
+### PicoDet-M
+
+| Backbone                  | Input size | images/GPU | lr schedule |Box AP | FLOPS | Inference Time |                           download                          | config |
+| :------------------------ | :-------: | :-------: | :-----------: | :---: | :-----: | :-----: | :-------------------------------------------------: | :-----: |
+| ShuffleNetv2-1.5x    | 320*320   |    128    |   280e      |   24.9     |  -- | -- | [download](https://paddledet.bj.bcebos.com/models/picodet_m_shufflenetv2_320_coco.pdparams) | [config](https://github.com/PaddlePaddle/PaddleDetection/tree/develop/configs/picodet/picodet_m_shufflenetv2_320_coco.yml) |
+| MobileNetv3-large-1x    | 320*320   |    128    |   280e      |   26.4     |  -- | -- | [download](https://paddledet.bj.bcebos.com/models/picodet_m_mbv3_320_coco.pdparams) | [config](https://github.com/PaddlePaddle/PaddleDetection/tree/develop/configs/picodet/picodet_m_mbv3_320_coco.yml) |
+| ShuffleNetv2-1.5x    | 416*416   |    128    |   280e      |   27.4     |  -- | -- | [download](https://paddledet.bj.bcebos.com/models/picodet_m_shufflenetv2_416_coco.pdparams) | [config](https://github.com/PaddlePaddle/PaddleDetection/tree/develop/configs/picodet/picodet_m_shufflenetv2_416_coco.yml) |
+| MobileNetv3-large-1x    | 416*416   |    128    |   280e      |   29.2     |  -- | -- | [download](https://paddledet.bj.bcebos.com/models/picodet_m_mbv3_416_coco.pdparams) | [config](https://github.com/PaddlePaddle/PaddleDetection/tree/develop/configs/picodet/picodet_m_mbv3_416_coco.yml) |
+
+
+**Notes:**
+
+- PicoDet inference speed is tested on a Kirin 980 with 4 threads, on ARMv8 with FP16.
+- PicoDet is trained on the COCO train2017 dataset and evaluated on val2017; results are reported as `mAP(IoU=0.5:0.95)`.
+- PicoDet is trained on 4 GPUs with a mini-batch size of 128 or 96 per GPU.
+
+## Citations
+```
+@article{li2020gflv2,
+  title={Generalized Focal Loss V2: Learning Reliable Localization Quality Estimation for Dense Object Detection},
+  author={Li, Xiang and Wang, Wenhai and Hu, Xiaolin and Li, Jun and Tang, Jinhui and Yang, Jian},
+  journal={arXiv preprint arXiv:2011.12885},
+  year={2020}
+}
+
+```
@@ -0,0 +1,18 @@
+# Schedule length; same value as `CosineDecay.max_epochs` below.
+epoch: 280
+
+# Learning rate: a base value plus a two-element list of schedulers, each
+# declared with a custom YAML tag. The list order is kept exactly as written.
+LearningRate:
+  base_lr: 0.4
+  schedulers:
+  - !CosineDecay
+    max_epochs: 280
+  - !LinearWarmup
+    steps: 300
+    start_factor: 0.1
+
+# Optimizer of type Momentum (momentum 0.9) with an L2 regularizer (factor 0.0001).
+OptimizerBuilder:
+  optimizer:
+    type: Momentum
+    momentum: 0.9
+  regularizer:
+    type: L2
+    factor: 0.0001
@@ -0,0 +1,45 @@
+# Top-level reader setting.
+worker_num: 6
+
+# Training reader for 320x320 input: a list of per-sample transforms, a list of
+# per-batch transforms, then batching options. List order is preserved as written.
+TrainReader:
+  sample_transforms:
+  - Decode: {}
+  - RandomDistort: {}
+  - RandomCrop: {}
+  - RandomFlip:
+      prob: 0.5
+  - NormalizeImage:
+      is_scale: true
+      mean: [0.485, 0.456, 0.406]
+      std: [0.229, 0.224, 0.225]
+  # Fixed 320x320 target with keep_ratio off.
+  - Resize:
+      target_size: [320, 320]
+      keep_ratio: false
+      interp: 1
+  - Permute: {}
+  batch_transforms:
+  - PadBatch:
+      pad_to_stride: 32
+  - Gt2GFLTarget:
+      downsample_ratios: [8, 16, 32]
+      grid_cell_scale: 5
+      cell_offset: 0.5
+  batch_size: 128
+  shuffle: true
+  drop_last: true
+
+
+# Evaluation reader: same normalisation and 320x320 resize values as
+# TrainReader, without the random augmentations, and with shuffling off.
+EvalReader:
+  sample_transforms:
+  - Decode: {}
+  - NormalizeImage:
+      is_scale: true
+      mean: [0.485, 0.456, 0.406]
+      std: [0.229, 0.224, 0.225]
+  - Resize:
+      interp: 1
+      target_size: [320, 320]
+      keep_ratio: false
+  - Permute: {}
+  batch_transforms:
+  - PadBatch:
+      pad_to_stride: 32
+  batch_size: 8
+  shuffle: false
+
+
+# Test reader: same transforms as EvalReader, one image per batch, plus an
+# explicit input definition.
+TestReader:
+  inputs_def:
+    # 3 x 320 x 320; the last two values equal the Resize target_size below.
+    image_shape: [3, 320, 320]
+  sample_transforms:
+  - Decode: {}
+  - NormalizeImage:
+      is_scale: true
+      mean: [0.485, 0.456, 0.406]
+      std: [0.229, 0.224, 0.225]
+  - Resize:
+      interp: 1
+      target_size: [320, 320]
+      keep_ratio: false
+  - Permute: {}
+  batch_transforms:
+  - PadBatch:
+      pad_to_stride: 32
+  batch_size: 1
+  shuffle: false