PaddlePaddle
diff --git a/‎configs/datasets/coco_detection.yml
-1 b/‎configs/datasets/coco_detection.yml
-1
diff --git a/‎configs/datasets/coco_instance.yml
+20 b/‎configs/datasets/coco_instance.yml
+20
diff --git a/‎configs/ppyoloe_seg/README.md
+12 b/‎configs/ppyoloe_seg/README.md
+12
diff --git a/‎configs/ppyoloe_seg/_base_/optimizer_80e.yml
+18 b/‎configs/ppyoloe_seg/_base_/optimizer_80e.yml
+18
diff --git a/‎configs/ppyoloe_seg/_base_/ppyoloe_plus_crn_seg.yml
+49 b/‎configs/ppyoloe_seg/_base_/ppyoloe_plus_crn_seg.yml
+49
diff --git a/‎configs/ppyoloe_seg/_base_/ppyoloe_plus_seg_reader.yml
+43 b/‎configs/ppyoloe_seg/_base_/ppyoloe_plus_seg_reader.yml
+43
diff --git a/‎configs/ppyoloe_seg/ppyoloe_seg_l_80e_coco.yml
+14 b/‎configs/ppyoloe_seg/ppyoloe_seg_l_80e_coco.yml
+14
diff --git a/‎configs/ppyoloe_seg/ppyoloe_seg_m_80e_coco.yml
+14 b/‎configs/ppyoloe_seg/ppyoloe_seg_m_80e_coco.yml
+14
diff --git a/‎configs/ppyoloe_seg/ppyoloe_seg_s_80e_coco.yml
+14 b/‎configs/ppyoloe_seg/ppyoloe_seg_s_80e_coco.yml
+14
diff --git a/‎configs/ppyoloe_seg/ppyoloe_seg_x_80e_coco.yml
+14 b/‎configs/ppyoloe_seg/ppyoloe_seg_x_80e_coco.yml
+14
diff --git a/‎configs/rtmdet/README.md
+11-1 b/‎configs/rtmdet/README.md
+11-1
diff --git a/‎configs/rtmdet/_base_/rtmdet_ins_cspnext.yml
+37 b/‎configs/rtmdet/_base_/rtmdet_ins_cspnext.yml
+37
diff --git a/‎configs/rtmdet/_base_/rtmdet_reader.yml
+1-1 b/‎configs/rtmdet/_base_/rtmdet_reader.yml
+1-1
diff --git a/‎configs/rtmdet/rtmdet_ins_l_300e_coco.yml
+13 b/‎configs/rtmdet/rtmdet_ins_l_300e_coco.yml
+13
diff --git a/‎configs/rtmdet/rtmdet_ins_m_300e_coco.yml
+13 b/‎configs/rtmdet/rtmdet_ins_m_300e_coco.yml
+13
diff --git a/‎configs/rtmdet/rtmdet_ins_s_300e_coco.yml
+14 b/‎configs/rtmdet/rtmdet_ins_s_300e_coco.yml
+14
diff --git a/‎configs/rtmdet/rtmdet_ins_t_300e_coco.yml
+14 b/‎configs/rtmdet/rtmdet_ins_t_300e_coco.yml
+14
diff --git a/‎configs/rtmdet/rtmdet_ins_x_300e_coco.yml
+13 b/‎configs/rtmdet/rtmdet_ins_x_300e_coco.yml
+13
diff --git a/‎configs/yolov5_seg/README.md
+13 b/‎configs/yolov5_seg/README.md
+13
diff --git a/‎configs/yolov5_seg/_base_/optimizer_300e.yml
+19 b/‎configs/yolov5_seg/_base_/optimizer_300e.yml
+19
@@ -12,7 +12,6 @@ EvalDataset:
   name: COCODataSet
   image_dir: val2017
   anno_path: annotations/instances_val2017.json
-  #anno_path: annotations/instances_val2017_rand24.json
   dataset_dir: dataset/coco
 
 TestDataset:
 
@@ -0,0 +1,20 @@
+metric: COCO  # dataset config for COCO instance segmentation (train / eval / test sections below)
+num_classes: 80
+
+TrainDataset:
+  name: COCODataSet
+  image_dir: train2017
+  anno_path: annotations/instances_train2017.json
+  dataset_dir: dataset/coco
+  data_fields: ['image', 'gt_bbox', 'gt_class', 'gt_poly', 'is_crowd']  # gt_poly is requested in addition to the box/class fields — presumably the polygons masks are built from; confirm
+
+EvalDataset:  # no data_fields listed here, unlike TrainDataset
+  name: COCODataSet
+  image_dir: val2017
+  anno_path: annotations/instances_val2017.json
+  dataset_dir: dataset/coco
+
+TestDataset:
+  name: ImageFolder
+  anno_path: annotations/instances_val2017.json # also support txt (like VOC's label_list.txt)
+  dataset_dir: dataset/coco # if set, anno_path will be 'dataset_dir/anno_path'
@@ -0,0 +1,12 @@
+# PP-YOLOE Instance segmentation
+
+## 模型库
+
+### 实例分割模型
+
+| 网络模型        | 输入尺寸   | 图片数/GPU | 学习率策略 | TRT-FP16-Latency(ms) | box AP | mask AP | Params(M) | FLOPs(G) |    下载链接       | 配置文件 |
+| :------------- | :------- | :-------: | :------: | :------------: | :---------------------: | :----------------: |:---------: | :------: |:---------------: |:-----: |
+| PP-YOLOE_seg_s   |  640     |    8      |   80e   |    -   | 42.3 | 32.5 |  8.99   | - | [下载链接](https://paddledet.bj.bcebos.com/models/ppyoloe_seg_s_80e_coco.pdparams) | [配置文件](./ppyoloe_seg_s_80e_coco.yml) |
+| PP-YOLOE_seg_m   |  640     |    8      |   80e   |    -   |  -  | - |  26.03   | - | [下载链接]() | [配置文件](./ppyoloe_seg_m_80e_coco.yml) |
+| PP-YOLOE_seg_l   |  640     |    8      |   80e   |    -   |  -  | - |  57.32   | - | [下载链接]() | [配置文件](./ppyoloe_seg_l_80e_coco.yml) |
+| PP-YOLOE_seg_x   |  640     |    8      |   80e   |    -   |  -  | - |  107.27   | - | [下载链接]() | [配置文件](./ppyoloe_seg_x_80e_coco.yml) |
@@ -0,0 +1,18 @@
+epoch: 80  # optimizer / LR schedule shared by the ppyoloe_seg 80e configs
+
+LearningRate:
+  base_lr: 0.001
+  schedulers:
+    - name: CosineDecay
+      max_epochs: 96  # NOTE(review): larger than `epoch: 80` above — presumably intentional so the cosine curve is cut short; confirm
+    - name: LinearWarmup
+      start_factor: 0.
+      epochs: 5  # warmup length, in epochs
+
+OptimizerBuilder:
+  optimizer:
+    momentum: 0.9
+    type: Momentum
+  regularizer:
+    factor: 0.0005
+    type: L2
@@ -0,0 +1,49 @@
+architecture: PPYOLOE  # base model definition for the PP-YOLOE instance-segmentation configs
+norm_type: sync_bn
+use_ema: true
+ema_decay: 0.9998
+ema_black_list: ['proj_conv.weight']
+custom_black_list: ['reduce_mean']
+
+with_mask: True  # set here at top level and again under PPYOLOE below
+
+PPYOLOE:
+  backbone: CSPResNet
+  neck: CustomCSPPAN
+  yolo_head: PPYOLOEInsHead
+  post_process: ~  # YAML null: no post_process component is named here
+  with_mask: True
+
+CSPResNet:
+  layers: [3, 6, 6, 3]
+  channels: [64, 128, 256, 512, 1024]
+  return_idx: [1, 2, 3]
+  use_large_stem: True
+  use_alpha: True
+
+CustomCSPPAN:
+  out_channels: [768, 384, 192]
+  stage_num: 1
+  block_num: 3
+  act: 'swish'
+  spp: true
+
+PPYOLOEInsHead:
+  fpn_strides: [32, 16, 8]  # listed largest stride first
+  grid_cell_scale: 5.0
+  grid_cell_offset: 0.5
+  static_assigner_epoch: -1 # only use TaskAlignedAssigner
+  use_varifocal_loss: True
+  loss_weight: {class: 1.0, iou: 2.5, dfl: 0.5}
+  assigner:
+    name: TaskAlignedAssigner
+    topk: 13
+    alpha: 1.0
+    beta: 6.0
+  nms:
+    name: MultiClassNMS
+    nms_top_k: 1000
+    keep_top_k: 300
+    score_threshold: 0.01
+    nms_threshold: 0.7
+    return_index: True  # NOTE(review): presumably needed to pick the masks of the kept boxes — confirm against the head
@@ -0,0 +1,43 @@
+worker_num: 4  # reader (data pipeline) settings for the ppyoloe_seg configs
+eval_height: &eval_height 640
+eval_width: &eval_width 640
+eval_size: &eval_size [*eval_height, *eval_width]  # resolves to [640, 640] through the two anchors above
+
+TrainReader:
+  sample_transforms:
+    - Decode: {}
+    - RandomDistort: {}
+    - RandomExpand: {fill_value: [123.675, 116.28, 103.53]}
+    - RandomCrop: {is_mask_crop: True}
+    - RandomFlip: {}
+    - Resize: {target_size: *eval_size, keep_ratio: False, interp: 2}  # training also resizes to eval_size
+    - Poly2Mask: {del_poly: True}  # NOTE(review): presumably rasterizes gt_poly into masks and drops the polygons — confirm against the transform
+  batch_transforms:
+    - NormalizeImage: {mean: [0., 0., 0.], std: [1., 1., 1.], norm_type: none}  # same NormalizeImage arguments as EvalReader / TestReader
+    - Permute: {}
+    - PadGT: {}
+  batch_size: 8
+  shuffle: true
+  drop_last: true
+  use_shared_memory: true
+  collate_batch: False
+
+
+EvalReader:
+  sample_transforms:
+    - Decode: {}
+    - Resize: {target_size: *eval_size, keep_ratio: False, interp: 2}
+    - NormalizeImage: {mean: [0., 0., 0.], std: [1., 1., 1.], norm_type: none}
+    - Permute: {}
+  batch_size: 1
+
+
+TestReader:
+  inputs_def:
+    image_shape: [3, *eval_height, *eval_width]  # resolves to [3, 640, 640]
+  sample_transforms:
+    - Decode: {}
+    - Resize: {target_size: *eval_size, keep_ratio: False, interp: 2}
+    - NormalizeImage: {mean: [0., 0., 0.], std: [1., 1., 1.], norm_type: none}
+    - Permute: {}
+  batch_size: 1
@@ -0,0 +1,14 @@
+_BASE_: [  # dataset, runtime, optimizer, model and reader configs referenced by this file
+  '../datasets/coco_instance.yml',
+  '../runtime.yml',
+  './_base_/optimizer_80e.yml',
+  './_base_/ppyoloe_plus_crn_seg.yml',
+  './_base_/ppyoloe_plus_seg_reader.yml',
+]
+log_iter: 50
+snapshot_epoch: 5
+weights: output/ppyoloe_seg_l_80e_coco/model_final
+
+pretrain_weights: https://bj.bcebos.com/v1/paddledet/models/pretrained/ppyoloe_crn_l_obj365_pretrained.pdparams  # `l` checkpoint, same size letter as this config
+depth_mult: 1.0  # multipliers for the `l` variant
+width_mult: 1.0
@@ -0,0 +1,14 @@
+_BASE_: [  # dataset, runtime, optimizer, model and reader configs referenced by this file
+  '../datasets/coco_instance.yml',
+  '../runtime.yml',
+  './_base_/optimizer_80e.yml',
+  './_base_/ppyoloe_plus_crn_seg.yml',
+  './_base_/ppyoloe_plus_seg_reader.yml',
+]
+log_iter: 50
+snapshot_epoch: 5
+weights: output/ppyoloe_seg_m_80e_coco/model_final
+
+pretrain_weights: https://bj.bcebos.com/v1/paddledet/models/pretrained/ppyoloe_crn_m_obj365_pretrained.pdparams  # `m` checkpoint, to match the multipliers below
+depth_mult: 0.67  # multipliers for the `m` variant
+width_mult: 0.75
@@ -0,0 +1,14 @@
+_BASE_: [  # dataset, runtime, optimizer, model and reader configs referenced by this file
+  '../datasets/coco_instance.yml',
+  '../runtime.yml',
+  './_base_/optimizer_80e.yml',
+  './_base_/ppyoloe_plus_crn_seg.yml',
+  './_base_/ppyoloe_plus_seg_reader.yml',
+]
+log_iter: 50
+snapshot_epoch: 5
+weights: output/ppyoloe_seg_s_80e_coco/model_final
+
+pretrain_weights: https://bj.bcebos.com/v1/paddledet/models/pretrained/ppyoloe_crn_s_obj365_pretrained.pdparams  # `s` checkpoint, same size letter as this config
+depth_mult: 0.33  # multipliers for the `s` variant
+width_mult: 0.50
@@ -0,0 +1,14 @@
+_BASE_: [  # dataset, runtime, optimizer, model and reader configs referenced by this file
+  '../datasets/coco_instance.yml',
+  '../runtime.yml',
+  './_base_/optimizer_80e.yml',
+  './_base_/ppyoloe_plus_crn_seg.yml',
+  './_base_/ppyoloe_plus_seg_reader.yml',
+]
+log_iter: 50
+snapshot_epoch: 5
+weights: output/ppyoloe_seg_x_80e_coco/model_final
+
+pretrain_weights: https://bj.bcebos.com/v1/paddledet/models/pretrained/ppyoloe_crn_x_obj365_pretrained.pdparams  # `x` checkpoint, same size letter as this config
+depth_mult: 1.33  # multipliers for the `x` variant
+width_mult: 1.25
@@ -7,7 +7,8 @@
 - [引用](#引用)
 
 ## 模型库
-### RTMDet on COCO
+
+### 基础检测模型
 
 | 网络网络        | 输入尺寸   | 图片数/GPU | 学习率策略 | 模型推理耗时(ms) |   mAP  |   AP50  | Params(M) | FLOPs(G) |  下载链接       | 配置文件 |
 | :------------- | :------- | :-------: | :------: | :---------: | :-----: |:-----: | :-----: |:-----: | :-------------: | :-----: |
@@ -17,6 +18,15 @@
 | *RTMDet-l       |  640     |    32      |   300e    |    10.2  |  51.2 | 68.8 |  52.31  | 160.32 |[下载链接](https://paddledet.bj.bcebos.com/models/rtmdet_l_300e_coco.pdparams) | [配置文件](./rtmdet_l_300e_coco.yml) |
 | *RTMDet-x       |  640     |    32      |   300e    |    18.0  |  52.6 | 70.4 |  94.86  | 283.12 |[下载链接](https://paddledet.bj.bcebos.com/models/rtmdet_x_300e_coco.pdparams) | [配置文件](./rtmdet_x_300e_coco.yml) |
 
+### 实例分割模型
+
+| 网络模型        | 输入尺寸   | 图片数/GPU | 学习率策略 | 模型推理耗时(ms) |  box AP  |  mask AP  | Params(M) | FLOPs(G) |  下载链接       | 配置文件 |
+| :------------- | :------- | :-------: | :------: | :---------: | :-----: |:-----: | :-----: |:-----: | :-------------: | :-----: |
+| *RTMDet-t       |  640     |    32      |   300e    |    -   |  40.5 | - |  5.6  | 11.8 |[下载链接](https://paddledet.bj.bcebos.com/models/rtmdet_ins_t_300e_coco.pdparams) | [配置文件](./rtmdet_ins_t_300e_coco.yml) |
+| *RTMDet-s       |  640     |    32      |   300e    |    -   |  44.0 | - |  10.18  | 21.5 |[下载链接](https://paddledet.bj.bcebos.com/models/rtmdet_ins_s_300e_coco.pdparams) | [配置文件](./rtmdet_ins_s_300e_coco.yml) |
+| *RTMDet-m       |  640     |    32      |   300e    |    -   |  48.8 | - |  27.58  | 54.13 |[下载链接](https://paddledet.bj.bcebos.com/models/rtmdet_ins_m_300e_coco.pdparams) | [配置文件](./rtmdet_ins_m_300e_coco.yml) |
+| *RTMDet-l       |  640     |    32      |   300e    |    -  |  51.2 | - |  57.37  | 106.56 |[下载链接](https://paddledet.bj.bcebos.com/models/rtmdet_ins_l_300e_coco.pdparams) | [配置文件](./rtmdet_ins_l_300e_coco.yml) |
+| *RTMDet-x       |  640     |    32      |   300e    |    -  |  52.4 | - |  102.7  | 182.7 |[下载链接](https://paddledet.bj.bcebos.com/models/rtmdet_ins_x_300e_coco.pdparams) | [配置文件](./rtmdet_ins_x_300e_coco.yml) |
 
 **注意:**
   - RTMDet模型暂未支持完全训练，mAP为部署权重在COCO val2017上的`mAP(IoU=0.5:0.95)`结果，且评估未使用`multi_label`等trick；
 
@@ -0,0 +1,37 @@
+architecture: RTMDet  # base model definition for the RTMDet instance-segmentation configs
+norm_type: sync_bn
+use_ema: True
+ema_decay: 0.9998
+ema_decay_type: "exponential"
+act: silu
+find_unused_parameters: True
+with_mask: True  # set here at top level and again under RTMDet below
+
+depth_mult: 1.0  # values in this base file; the rtmdet_ins_{t,s,m,l,x} configs each set their own multipliers
+width_mult: 1.0
+
+RTMDet:
+  backbone: CSPNeXt
+  neck: CSPNeXtPAFPN
+  head: RTMDetInsHead
+  with_mask: True
+  post_process: ~  # YAML null: no post_process component is named here
+
+CSPNeXt:
+  arch: "P5"
+  return_idx: [2, 3, 4]
+
+# use default config
+# CSPNeXtPAFPN:
+
+RTMDetInsHead:
+  exp_on_reg: False
+  fpn_strides: [8, 16, 32]  # listed smallest stride first
+  grid_cell_offset: 0
+  nms:
+    name: MultiClassNMS
+    nms_top_k: 1000
+    keep_top_k: 100
+    score_threshold: 0.05
+    nms_threshold: 0.6
+    return_index: True  # NOTE(review): presumably needed to pick the masks of the kept boxes — confirm against the head
@@ -37,7 +37,7 @@ EvalReader:
     - Pad: {size: [640, 640], fill_value: [114., 114., 114.]}
     - NormalizeImage: {mean: [0.485, 0.456, 0.406], std: [0.229, 0.224, 0.225], is_scale: True}
     - Permute: {}
-  batch_size: 4
+  batch_size: 1
 
 
 TestReader:
 
@@ -0,0 +1,13 @@
+_BASE_: [  # dataset, runtime, optimizer, model and reader configs referenced by this file
+  '../datasets/coco_instance.yml',
+  '../runtime.yml',
+  './_base_/optimizer_300e.yml',
+  './_base_/rtmdet_ins_cspnext.yml',
+  './_base_/rtmdet_reader.yml',
+]
+depth_mult: 1.0  # multipliers for the `l` variant
+width_mult: 1.0
+
+log_iter: 100
+snapshot_epoch: 10
+weights: output/rtmdet_ins_l_300e_coco/model_final  # directory name follows this config's file name (rtmdet, not rtmnet)
@@ -0,0 +1,13 @@
+_BASE_: [  # dataset, runtime, optimizer, model and reader configs referenced by this file
+  '../datasets/coco_instance.yml',
+  '../runtime.yml',
+  './_base_/optimizer_300e.yml',
+  './_base_/rtmdet_ins_cspnext.yml',
+  './_base_/rtmdet_reader.yml',
+]
+depth_mult: 0.67  # multipliers for the `m` variant
+width_mult: 0.75
+
+log_iter: 100
+snapshot_epoch: 10
+weights: output/rtmdet_ins_m_300e_coco/model_final  # directory name follows this config's file name (rtmdet, not rtmnet)
@@ -0,0 +1,14 @@
+_BASE_: [  # dataset, runtime, optimizer, model and reader configs referenced by this file
+  '../datasets/coco_instance.yml',
+  '../runtime.yml',
+  './_base_/optimizer_300e.yml',
+  './_base_/rtmdet_ins_cspnext.yml',
+  './_base_/rtmdet_reader.yml',
+]
+depth_mult: 0.33  # multipliers for the `s` variant
+width_mult: 0.50
+
+log_iter: 100
+snapshot_epoch: 10
+weights: output/rtmdet_ins_s_300e_coco/model_final  # directory name follows this config's file name (rtmdet, not rtmnet)
+pretrain_weights: https://bj.bcebos.com/v1/paddledet/models/pretrained/cspnext_s_pretrained.pdparams
@@ -0,0 +1,14 @@
+_BASE_: [  # dataset, runtime, optimizer, model and reader configs referenced by this file
+  '../datasets/coco_instance.yml',
+  '../runtime.yml',
+  './_base_/optimizer_300e.yml',
+  './_base_/rtmdet_ins_cspnext.yml',
+  './_base_/rtmdet_reader.yml',
+]
+depth_mult: 0.167 # 0.33 in yolox-tiny
+width_mult: 0.375
+
+log_iter: 100
+snapshot_epoch: 10
+weights: output/rtmdet_ins_t_300e_coco/model_final  # directory name follows this config's file name (rtmdet, not rtmnet)
+pretrain_weights: https://bj.bcebos.com/v1/paddledet/models/pretrained/cspnext_t_pretrained.pdparams
@@ -0,0 +1,13 @@
+_BASE_: [  # dataset, runtime, optimizer, model and reader configs referenced by this file
+  '../datasets/coco_instance.yml',
+  '../runtime.yml',
+  './_base_/optimizer_300e.yml',
+  './_base_/rtmdet_ins_cspnext.yml',
+  './_base_/rtmdet_reader.yml',
+]
+depth_mult: 1.33  # multipliers for the `x` variant
+width_mult: 1.25
+
+log_iter: 100
+snapshot_epoch: 10
+weights: output/rtmdet_ins_x_300e_coco/model_final  # directory name follows this config's file name (rtmdet, not rtmnet)
@@ -0,0 +1,13 @@
+# YOLOv5 Instance segmentation
+
+## 模型库
+
+### 实例分割模型
+
+| 网络模型        | 输入尺寸   | 图片数/GPU | 学习率策略 | 模型推理耗时(ms) | box AP | mask AP | Params(M) | FLOPs(G) |    下载链接       | 配置文件 |
+| :------------- | :------- | :-------: | :------: | :------------: | :---------------------: | :----------------: |:---------: | :------: |:---------------: |:-----: |
+| *YOLOv5-n        |  640     |    16      |   300e   |     -    |  27.6  | - |  2.0  | 7.1 | [下载链接](https://paddledet.bj.bcebos.com/models/yolov5_seg_n_300e_coco.pdparams) | [配置文件](./yolov5_seg_n_300e_coco.yml) |
+| *YOLOv5-s        |  640     |    16      |   300e   |     -    |  37.6  | - |  7.8  | 26.4 | [下载链接](https://paddledet.bj.bcebos.com/models/yolov5_seg_s_300e_coco.pdparams) | [配置文件](./yolov5_seg_s_300e_coco.yml) |
+| *YOLOv5-m        |  640     |    16      |   300e   |     -    |  45.0  | - |  22.0  | 70.8 | [下载链接](https://paddledet.bj.bcebos.com/models/yolov5_seg_m_300e_coco.pdparams) | [配置文件](./yolov5_seg_m_300e_coco.yml) |
+| *YOLOv5-l        |  640     |    16      |   300e   |     -    |  48.9  | - |  47.9  | 147.7 | [下载链接](https://paddledet.bj.bcebos.com/models/yolov5_seg_l_300e_coco.pdparams) | [配置文件](./yolov5_seg_l_300e_coco.yml) |
+| *YOLOv5-x        |  640     |    16      |   300e   |     -    |  50.6  | - |  88.8  | 265.7 | [下载链接](https://paddledet.bj.bcebos.com/models/yolov5_seg_x_300e_coco.pdparams) | [配置文件](./yolov5_seg_x_300e_coco.yml) |
@@ -0,0 +1,19 @@
+epoch: 300  # optimizer / LR schedule for the yolov5_seg 300e configs
+
+LearningRate:
+  base_lr: 0.01
+  schedulers:
+  - !YOLOv5LRDecay
+    max_epochs: 300  # same value as `epoch` above
+    min_lr_ratio: 0.01
+  - !ExpWarmup
+    epochs: 3  # warmup length, in epochs
+
+OptimizerBuilder:
+  optimizer:
+    type: Momentum
+    momentum: 0.937
+    use_nesterov: True
+  regularizer:
+    factor: 0.0005
+    type: L2