Deci-AI/super-gradients

  
1

2

3

4

5

6

7

8

            layers: [3, 6, 6, 3]                # model's structure
channels: [64, 128, 256, 512, 1024] # number of output channels for stem and consecutive feature maps
activation: silu                    # activation function type
return_idx: [1,2,3]                 # Indexes of feature maps to output
use_large_stem: True                # If True, uses 3 conv+bn+act instead of 2 in stem blocks
width_mult:                         # scaling factor to number of channels; left empty here, set by the configs that inherit these params
depth_mult:                         # scaling factor to number of layers; left empty here, set by the configs that inherit these params
use_alpha: False                    # If True, enables additional learnable weighting parameter for 1x1 branch in RepVGGBlock

  
1

2

3

4

5

            defaults:
  - csp_resnet_arch_params    # inherit the shared CSPResNet architecture parameters
# Same multipliers as the PP-YOLOE config that loads CSPResNetb_l weights - presumably the "l" size; confirm against the file name.
depth_mult: 1.0               # scaling factor to number of layers
width_mult: 1.0               # scaling factor to number of channels

  
1

2

3

4

5

            defaults:
  - csp_resnet_arch_params    # inherit the shared CSPResNet architecture parameters
# Same multipliers as the PP-YOLOE config that loads CSPResNetb_m weights - presumably the "m" size; confirm against the file name.
depth_mult: 0.67              # scaling factor to number of layers
width_mult: 0.75              # scaling factor to number of channels

  
1

2

3

4

5

            defaults:
  - csp_resnet_arch_params    # inherit the shared CSPResNet architecture parameters
# Same multipliers as the PP-YOLOE config that loads CSPResNetb_s weights - presumably the "s" size; confirm against the file name.
depth_mult: 0.33              # scaling factor to number of layers
width_mult: 0.50              # scaling factor to number of channels

  
1

2

3

4

5

            defaults:
  - csp_resnet_arch_params    # inherit the shared CSPResNet architecture parameters
# Same multipliers as the PP-YOLOE config that loads CSPResNetb_x weights - presumably the "x" size; confirm against the file name.
depth_mult: 1.33              # scaling factor to number of layers
width_mult: 1.25              # scaling factor to number of channels

  
1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

24

25

26

27

28

29

30

31

            depth_mult:                           # left empty here; the size-specific configs that inherit these params set it
width_mult:                             # left empty here; the size-specific configs that inherit these params set it
num_classes: 80
backbone:
  layers: [ 3, 6, 6, 3 ]                # Backbone's structure
  channels: [ 64, 128, 256, 512, 1024 ] # Number of output channels for stem and consecutive feature maps
  activation: silu
  return_idx: [ 1, 2, 3 ]               # Indexes of feature maps to output, indices 1,2,3 correspond to feature maps of stride 8,16,32
  use_large_stem: True                  # If True, uses 3 conv+bn+act instead of 2 in stem blocks
  use_alpha: False                      # If True, enables additional learnable weighting parameter for 1x1 branch in RepVGGBlock
  pretrained_weights:                   # left empty here; the size-specific configs supply a checkpoint URL
neck:
  in_channels: [256, 512, 1024]         # matches the last three entries of backbone.channels
  out_channels: [768, 384, 192]
  activation: silu
  block_num: 3
  stage_num: 1
  spp: True
head:
  in_channels: [768, 384, 192]          # same values as neck.out_channels
  activation: silu
  fpn_strides: [32, 16, 8]              # presumably listed in the same order as in_channels - TODO confirm
  grid_cell_scale: 5.0
  grid_cell_offset: 0.5
  reg_max: 16 # Number of bins for size prediction
  eval_size:    # Size of the image for evaluation. Setting this value can be beneficial for inference speed since anchors will not be regenerated for each forward call.

  
1

2

3

4

5

6

7

8

9

            defaults:
  - ppyoloe_arch_params       # inherit the shared PP-YOLOE architecture parameters
  - _self_                    # listed last, so the values below are merged after (and override) ppyoloe_arch_params
depth_mult: 1.0               # fills the placeholder left empty in ppyoloe_arch_params
width_mult: 1.0               # fills the placeholder left empty in ppyoloe_arch_params
backbone:
  # Checkpoint URL for the backbone; the file name indicates the "l" CSPResNet variant.
  pretrained_weights: https://deci-pretrained-models.s3.amazonaws.com/ppyolo_e/CSPResNetb_l_pretrained.pth

  
1

2

3

4

5

6

7

8

9

            defaults:
  - ppyoloe_arch_params       # inherit the shared PP-YOLOE architecture parameters
  - _self_                    # listed last, so the values below are merged after (and override) ppyoloe_arch_params
depth_mult: 0.67              # fills the placeholder left empty in ppyoloe_arch_params
width_mult: 0.75              # fills the placeholder left empty in ppyoloe_arch_params
backbone:
  # Checkpoint URL for the backbone; the file name indicates the "m" CSPResNet variant.
  pretrained_weights: https://deci-pretrained-models.s3.amazonaws.com/ppyolo_e/CSPResNetb_m_pretrained.pth

  
1

2

3

4

5

6

7

8

9

            defaults:
  - ppyoloe_arch_params       # inherit the shared PP-YOLOE architecture parameters
  - _self_                    # listed last, so the values below are merged after (and override) ppyoloe_arch_params
depth_mult: 0.33              # fills the placeholder left empty in ppyoloe_arch_params
width_mult: 0.50              # fills the placeholder left empty in ppyoloe_arch_params
backbone:
  # Checkpoint URL for the backbone; the file name indicates the "s" CSPResNet variant.
  pretrained_weights: https://deci-pretrained-models.s3.amazonaws.com/ppyolo_e/CSPResNetb_s_pretrained.pth

  
1

2

3

4

5

6

7

8

9

            defaults:
  - ppyoloe_arch_params       # inherit the shared PP-YOLOE architecture parameters
  - _self_                    # listed last, so the values below are merged after (and override) ppyoloe_arch_params
depth_mult: 1.33              # fills the placeholder left empty in ppyoloe_arch_params
width_mult: 1.25              # fills the placeholder left empty in ppyoloe_arch_params
backbone:
  # Checkpoint URL for the backbone; the file name indicates the "x" CSPResNet variant.
  pretrained_weights: https://deci-pretrained-models.s3.amazonaws.com/ppyolo_e/CSPResNetb_x_pretrained.pth

  
    
        
          
1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

24

25

26

27

28

29

30

31

32

33

34

35

36

37

38

39

40

41

42

43

44

45

46

47

48

49

50

51

52

53

54

55

56

57

58

59

60

61

          
            # PP-Yolo-E Detection training on COCO2017 Dataset:
# PP-Yolo-E trained in 640x640
# Checkpoints + tensorboards: https://deci-pretrained-models.s3.amazonaws.com/ppyoloe_coco/
# Recipe runs with batch size = 20 X 8 gpus = 160.
# Instructions:
#   0. Make sure that the data is stored in dataset_params.dataset_dir or add "dataset_params.data_dir=<PATH-TO-DATASET>" at the end of the command below (feel free to check ReadMe)
#   1. Move to the project root (where you will find the ReadMe and src folder)
#   2. Run the command you want:
#         ppyoloe_s: python src/super_gradients/examples/train_from_recipe_example/train_from_recipe.py --config-name=coco2017_ppyoloe_s
#         ppyoloe_m: python src/super_gradients/examples/train_from_recipe_example/train_from_recipe.py --config-name=coco2017_ppyoloe_m
#         ppyoloe_l: python src/super_gradients/examples/train_from_recipe_example/train_from_recipe.py --config-name=coco2017_ppyoloe_l
#         ppyoloe_x: python src/super_gradients/examples/train_from_recipe_example/train_from_recipe.py --config-name=coco2017_ppyoloe_x
#
# Training times and accuracies (mAP@0.5-0.95, COCO API, confidence 0.001, IoU threshold 0.6, tested on 640x640 images):
#         ppyoloe_s: 37h on 8 NVIDIA GeForce RTX 3090, mAP: 42.52 (val)
#         ppyoloe_m: 58h on 8 NVIDIA GeForce RTX 3090, mAP: 47.11 (val)
#         ppyoloe_l: COMING SOON
#         ppyoloe_x: COMING SOON
#
# Hydra defaults list: each entry selects one config from the named group.
# _self_ is listed last, so the keys set in this file are merged after the defaults and override them.
defaults:
  - training_hyperparams: coco2017_ppyoloe_train_params
  - dataset_params: coco_detection_ppyoloe_dataset_params
  - arch_params: ppyoloe_l_arch_params
  - checkpoint_params: default_checkpoint_params
  - _self_
train_dataloader: coco2017_train_ppyoloe
val_dataloader: coco2017_val_ppyoloe
load_checkpoint: False
resume: False
# Overrides on top of the dataset_params defaults.
dataset_params:
  train_dataloader_params:
    batch_size: 20                # per-GPU batch size: 20 x 8 gpus (num_gpus below) = 160 in total
# Overrides on top of the training_hyperparams defaults.
training_hyperparams:
  resume: ${resume}               # interpolates the top-level `resume` key
  mixed_precision: True
  initial_lr:  1e-3               # recipe-specific learning rate; only the l and m recipes set this key
architecture: pp_yoloe_l
multi_gpu: DDP
num_gpus: 8
experiment_suffix: ""
experiment_name: coco2017_${architecture}${experiment_suffix}  # composed from `architecture` and `experiment_suffix`
ckpt_root_dir:                    # left empty (null) by default
# THE FOLLOWING PARAMS ARE DIRECTLY USED BY HYDRA
hydra:
  run:
    # Set the output directory (i.e. where .hydra folder that logs all the input params will be generated)
    # hydra_output_dir is a custom resolver that is not defined in this file; it receives ckpt_root_dir and experiment_name.
    dir: ${hydra_output_dir:${ckpt_root_dir}, ${experiment_name}}

          
        
      

  

  
    
        
          
1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

24

25

26

27

28

29

30

31

32

33

34

35

36

37

38

39

40

41

42

43

44

45

46

47

48

49

50

51

52

53

54

55

56

57

58

59

60

61

          
            # PP-Yolo-E Detection training on COCO2017 Dataset:
# PP-Yolo-E trained in 640x640
# Checkpoints + tensorboards: https://deci-pretrained-models.s3.amazonaws.com/ppyoloe_coco/
# Recipe runs with batch size = 24 X 8 gpus = 192.
# Instructions:
#   0. Make sure that the data is stored in dataset_params.dataset_dir or add "dataset_params.data_dir=<PATH-TO-DATASET>" at the end of the command below (feel free to check ReadMe)
#   1. Move to the project root (where you will find the ReadMe and src folder)
#   2. Run the command you want:
#         ppyoloe_s: python src/super_gradients/examples/train_from_recipe_example/train_from_recipe.py --config-name=coco2017_ppyoloe_s
#         ppyoloe_m: python src/super_gradients/examples/train_from_recipe_example/train_from_recipe.py --config-name=coco2017_ppyoloe_m
#         ppyoloe_l: python src/super_gradients/examples/train_from_recipe_example/train_from_recipe.py --config-name=coco2017_ppyoloe_l
#         ppyoloe_x: python src/super_gradients/examples/train_from_recipe_example/train_from_recipe.py --config-name=coco2017_ppyoloe_x
#
# Training times and accuracies (mAP@0.5-0.95, COCO API, confidence 0.001, IoU threshold 0.6, tested on 640x640 images):
#         ppyoloe_s: 37h on 8 NVIDIA GeForce RTX 3090, mAP: 42.52 (val)
#         ppyoloe_m: 58h on 8 NVIDIA GeForce RTX 3090, mAP: 47.11 (val)
#         ppyoloe_l: COMING SOON
#         ppyoloe_x: COMING SOON
#
# Hydra defaults list: each entry selects one config from the named group.
# _self_ is listed last, so the keys set in this file are merged after the defaults and override them.
defaults:
  - training_hyperparams: coco2017_ppyoloe_train_params
  - dataset_params: coco_detection_ppyoloe_dataset_params
  - arch_params: ppyoloe_m_arch_params
  - checkpoint_params: default_checkpoint_params
  - _self_
train_dataloader: coco2017_train_ppyoloe
val_dataloader: coco2017_val_ppyoloe
load_checkpoint: False
resume: False
# Overrides on top of the dataset_params defaults.
dataset_params:
  train_dataloader_params:
    batch_size: 24                # per-GPU batch size: 24 x 8 gpus (num_gpus below) = 192 in total
# Overrides on top of the training_hyperparams defaults.
training_hyperparams:
  resume: ${resume}               # interpolates the top-level `resume` key
  mixed_precision: True
  initial_lr:  1e-3               # recipe-specific learning rate; only the l and m recipes set this key
architecture: pp_yoloe_m
multi_gpu: DDP
num_gpus: 8
experiment_suffix: ""
experiment_name: coco2017_${architecture}${experiment_suffix}  # composed from `architecture` and `experiment_suffix`
ckpt_root_dir:                    # left empty (null) by default
# THE FOLLOWING PARAMS ARE DIRECTLY USED BY HYDRA
hydra:
  run:
    # Set the output directory (i.e. where .hydra folder that logs all the input params will be generated)
    # hydra_output_dir is a custom resolver that is not defined in this file; it receives ckpt_root_dir and experiment_name.
    dir: ${hydra_output_dir:${ckpt_root_dir}, ${experiment_name}}

          
        
      

  

  
    
        
          
1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

24

25

26

27

28

29

30

31

32

33

34

35

36

37

38

39

40

41

42

43

44

45

46

47

48

49

50

51

52

53

54

55

56

57

          
            # PP-Yolo-E Detection training on COCO2017 Dataset:
# PP-Yolo-E trained in 640x640
# Recipe runs with batch size = 32 X 8 gpus = 256.
# Instructions:
#   0. Make sure that the data is stored in dataset_params.dataset_dir or add "dataset_params.data_dir=<PATH-TO-DATASET>" at the end of the command below (feel free to check ReadMe)
#   1. Move to the project root (where you will find the ReadMe and src folder)
#   2. Run the command you want:
#         ppyoloe_s: python src/super_gradients/examples/train_from_recipe_example/train_from_recipe.py --config-name=coco2017_ppyoloe_s
#         ppyoloe_m: python src/super_gradients/examples/train_from_recipe_example/train_from_recipe.py --config-name=coco2017_ppyoloe_m
#         ppyoloe_l: python src/super_gradients/examples/train_from_recipe_example/train_from_recipe.py --config-name=coco2017_ppyoloe_l
#         ppyoloe_x: python src/super_gradients/examples/train_from_recipe_example/train_from_recipe.py --config-name=coco2017_ppyoloe_x
#
# Training times and accuracies (mAP@0.5-0.95, COCO API, confidence 0.001, IoU threshold 0.6, tested on 640x640 images):
#         ppyoloe_s: 37h on 8 NVIDIA GeForce RTX 3090, mAP: 42.52 (val)
#         ppyoloe_m: 58h on 8 NVIDIA GeForce RTX 3090, mAP: 47.11 (val)
#         ppyoloe_l: COMING SOON
#         ppyoloe_x: COMING SOON
#
# Hydra defaults list: each entry selects one config from the named group.
# _self_ is listed last, so the keys set in this file are merged after the defaults and override them.
defaults:
  - training_hyperparams: coco2017_ppyoloe_train_params
  - dataset_params: coco_detection_ppyoloe_dataset_params
  - arch_params: ppyoloe_s_arch_params
  - checkpoint_params: default_checkpoint_params
  - _self_
train_dataloader: coco2017_train_ppyoloe
val_dataloader: coco2017_val_ppyoloe
load_checkpoint: False
resume: False
# Overrides on top of the dataset_params defaults.
dataset_params:
  train_dataloader_params:
    batch_size: 32                # per-GPU batch size: 32 x 8 gpus (num_gpus below) = 256 in total
# Overrides on top of the training_hyperparams defaults (no initial_lr override in this recipe).
training_hyperparams:
  resume: ${resume}               # interpolates the top-level `resume` key
  mixed_precision: True
architecture: pp_yoloe_s
multi_gpu: DDP
num_gpus: 8
experiment_suffix: ""
experiment_name: coco2017_${architecture}${experiment_suffix}  # composed from `architecture` and `experiment_suffix`
ckpt_root_dir:                    # left empty (null) by default
# THE FOLLOWING PARAMS ARE DIRECTLY USED BY HYDRA
hydra:
  run:
    # Set the output directory (i.e. where .hydra folder that logs all the input params will be generated)
    # hydra_output_dir is a custom resolver that is not defined in this file; it receives ckpt_root_dir and experiment_name.
    dir: ${hydra_output_dir:${ckpt_root_dir}, ${experiment_name}}

          
        
      

  

  
    
        
          
1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

24

25

26

27

28

29

30

31

32

33

34

35

36

37

38

39

40

41

42

43

44

45

46

47

48

49

50

51

52

53

54

55

56

57

58

59

          
            # PP-Yolo-E Detection training on COCO2017 Dataset:
# PP-Yolo-E trained in 640x640
# Checkpoints + tensorboards: https://deci-pretrained-models.s3.amazonaws.com/ppyoloe_coco/
# Recipe runs with batch size = 16 X 8 gpus = 128.
# Instructions:
#   0. Make sure that the data is stored in dataset_params.dataset_dir or add "dataset_params.data_dir=<PATH-TO-DATASET>" at the end of the command below (feel free to check ReadMe)
#   1. Move to the project root (where you will find the ReadMe and src folder)
#   2. Run the command you want:
#         ppyoloe_s: python src/super_gradients/examples/train_from_recipe_example/train_from_recipe.py --config-name=coco2017_ppyoloe_s
#         ppyoloe_m: python src/super_gradients/examples/train_from_recipe_example/train_from_recipe.py --config-name=coco2017_ppyoloe_m
#         ppyoloe_l: python src/super_gradients/examples/train_from_recipe_example/train_from_recipe.py --config-name=coco2017_ppyoloe_l
#         ppyoloe_x: python src/super_gradients/examples/train_from_recipe_example/train_from_recipe.py --config-name=coco2017_ppyoloe_x
#
# Training times and accuracies (mAP@0.5-0.95, COCO API, confidence 0.001, IoU threshold 0.6, tested on 640x640 images):
#         ppyoloe_s: 37h on 8 NVIDIA GeForce RTX 3090, mAP: 42.52 (val)
#         ppyoloe_m: 58h on 8 NVIDIA GeForce RTX 3090, mAP: 47.11 (val)
#         ppyoloe_l: COMING SOON
#         ppyoloe_x: COMING SOON
#
# Hydra defaults list: each entry selects one config from the named group.
# _self_ is listed last, so the keys set in this file are merged after the defaults and override them.
defaults:
  - training_hyperparams: coco2017_ppyoloe_train_params
  - dataset_params: coco_detection_ppyoloe_dataset_params
  - arch_params: ppyoloe_x_arch_params
  - checkpoint_params: default_checkpoint_params
  - _self_
train_dataloader: coco2017_train_ppyoloe
val_dataloader: coco2017_val_ppyoloe
load_checkpoint: False
resume: False
# Overrides on top of the dataset_params defaults.
dataset_params:
  train_dataloader_params:
    batch_size: 16                # per-GPU batch size: 16 x 8 gpus (num_gpus below) = 128 in total
# Overrides on top of the training_hyperparams defaults (no initial_lr override in this recipe).
training_hyperparams:
  resume: ${resume}               # interpolates the top-level `resume` key
  mixed_precision: True
architecture: pp_yoloe_x
multi_gpu: DDP
num_gpus: 8
experiment_suffix: ""
experiment_name: coco2017_${architecture}${experiment_suffix}  # composed from `architecture` and `experiment_suffix`
ckpt_root_dir:                    # left empty (null) by default
# THE FOLLOWING PARAMS ARE DIRECTLY USED BY HYDRA
hydra:
  run:
    # Set the output directory (i.e. where .hydra folder that logs all the input params will be generated)
    # hydra_output_dir is a custom resolver that is not defined in this file; it receives ckpt_root_dir and experiment_name.
    dir: ${hydra_output_dir:${ckpt_root_dir}, ${experiment_name}}

          
        
      

  

  
    
        
          
1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

24

25

26

27

28

29

30

31

32

33

34

35

36

37

38

39

40

41

42

43

44

45

46

47

48

49

50

51

52

53

54

55

56

57

58

59

60

61

62

63

64

65

66

67

68

69

70

71

72

73

74

75

76

77

78

79

80

81

82

83

84

85

86

87

88

89

90

91

92

93

94

95

96

97

          
            train_dataset_params:
  data_dir: /data/coco # root path to coco data
  subdir: images/train2017 # sub directory path of data_dir containing the train data.
  json_file: instances_train2017.json # path to coco train json file, data_dir/annotations/train_json_file.
  input_dim: # None, do not resize dataset on load
  cache_dir:
  cache: False
  # Transforms are listed as a sequence; presumably applied in the order written - TODO confirm.
  transforms:
    - DetectionRandomAffine:
        degrees: 0                    # rotation degrees, randomly sampled from [-degrees, degrees]
        translate: 0.25               # image translation fraction
        scales: [ 0.5, 1.5 ]          # random rescale range (keeps size by padding/cropping) after mosaic transform.
        shear: 0.0                    # shear degrees, randomly sampled from [-degrees, degrees]
        target_size:
        filter_box_candidates: True   # whether to filter out transformed bboxes by edge size, area ratio, and aspect ratio.
        wh_thr: 2                     # edge size threshold when filter_box_candidates = True (pixels)
        area_thr: 0.1                 # threshold for area ratio between original image and the transformed one, when filter_box_candidates = True
        ar_thr: 20                    # aspect ratio threshold when filter_box_candidates = True
    - DetectionRandomRotate90:
        prob: 0.5                       # probability to apply the random 90-degree rotation
    - DetectionRGB2BGR:
        prob: 0.25                      # probability to apply the RGB-to-BGR channel swap
    - DetectionHSV:
        prob: 0.5                       # probability to apply HSV transform
        hgain: 18                       # HSV transform hue gain (randomly sampled from [-hgain, hgain])
        sgain: 30                       # HSV transform saturation gain (randomly sampled from [-sgain, sgain])
        vgain: 30                       # HSV transform value gain (randomly sampled from [-vgain, vgain])
    - DetectionHorizontalFlip:
        prob: 0.5                       # probability to apply horizontal flip
    - DetectionMixup:
        input_dim:
        mixup_scale: [ 0.5, 1.5 ]         # random rescale range for the additional sample in mixup
        prob: 0.5                       # probability to apply per-sample mixup
        flip_prob: 0.5                  # probability to apply horizontal flip
    - DetectionNormalize:
        # Per-channel statistics on the 0-255 pixel scale (equal to 255 x [0.485, 0.456, 0.406] and 255 x [0.229, 0.224, 0.225]).
        mean: [ 123.675, 116.28, 103.53 ]
        std: [ 58.395,  57.12,  57.375 ]
    - DetectionTargetsFormatTransform:
        max_targets: 256
        output_format: LABEL_CXCYWH
  tight_box_rotation: False
  class_inclusion_list:
  max_num_samples:
  with_crowd: False
# Dataloader settings for the training set.
train_dataloader_params:
  batch_size: 32
  num_workers: 8
  shuffle: True
  drop_last: True
  # Disable pin_memory due to presence of PPYoloECollateFN which uses random resize during training
  pin_memory: False
  worker_init_fn:
    # _target_ names load_func and dotpath names worker_init_reset_seed; presumably load_func resolves the dotpath to that function - TODO confirm.
    _target_: super_gradients.training.utils.utils.load_func
    dotpath: super_gradients.training.datasets.datasets_utils.worker_init_reset_seed
  collate_fn: # collate function for trainset
    _target_: super_gradients.training.utils.detection_utils.PPYoloECollateFN
    # Candidate sizes for the random resize: 320 to 768 in steps of 32.
    random_resize_sizes: [ 320, 352, 384, 416, 448, 480, 512, 544, 576, 608, 640, 672, 704, 736, 768 ]
    random_resize_modes:
      - 0 # cv::INTER_NEAREST
      - 1 # cv::INTER_LINEAR
      - 2 # cv::INTER_CUBIC
      - 3 # cv::INTER_AREA
      - 4 # cv::INTER_LANCZOS4
# Dataset settings for the validation set.
val_dataset_params:
  data_dir: /data/coco # root path to coco data
  subdir: images/val2017 # sub directory path of data_dir containing the validation data.
  json_file: instances_val2017.json # path to coco val json file, data_dir/annotations/val_json_file.
  input_dim:
  cache_dir:
  cache: False
  # No random augmentations are listed here: only rescale, normalize and target formatting.
  transforms:
    - DetectionRescale:
        output_shape: [640, 640]
    - DetectionNormalize:
        # Same mean/std values as in train_dataset_params.
        mean: [ 123.675, 116.28, 103.53 ]
        std: [ 58.395,  57.12,  57.375 ]
    - DetectionTargetsFormatTransform:
        max_targets: 256
        output_format: LABEL_CXCYWH
  tight_box_rotation: False
  class_inclusion_list:
  max_num_samples:
  with_crowd: False
# Dataloader settings for the validation set.
val_dataloader_params:
  batch_size: 64
  num_workers: 8
  drop_last: False
  shuffle: False
  pin_memory: False
  collate_fn: # collate function for valset
    # Unlike the train collate_fn, no random_resize_sizes / random_resize_modes are configured here.
    _target_: super_gradients.training.utils.detection_utils.PPYoloECollateFN
_convert_: all

          
        
      

  

  
    
        
          
1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

24

25

26

27

28

29

30

31

32

33

34

35

36

37

38

39

40

41

42

43

44

45

46

47

48

49

50

51

52

53

54

55

56

57

58

59

60

          
            defaults:
  - default_train_params          # base training hyperparameters; the keys below are set on top of them
max_epochs: 500
static_assigner_end_epoch: 150    # also passed to PPYoloETrainingStageSwitchCallback below via interpolation
warmup_mode: "linear_batch_step"
warmup_initial_lr:  1e-6
lr_warmup_steps: 1000
lr_warmup_epochs: 0               # presumably unused because warmup is configured in steps (lr_warmup_steps) - TODO confirm
initial_lr:  2e-3
lr_mode: cosine
cosine_final_lr_ratio: 0.1
zero_weight_decay_on_bias_and_bn: False
batch_accumulate: 1
save_ckpt_epoch_list: [200, 250, 300, 350, 400, 450]
loss:
  ppyoloe_loss:
    num_classes: ${arch_params.num_classes}   # kept in sync with the architecture config via interpolation
    reg_max: ${arch_params.head.reg_max}      # kept in sync with the architecture config via interpolation
optimizer: AdamW
optimizer_params:
  weight_decay: 0.0001
ema: True
ema_params:
  decay: 0.9997
  decay_type: threshold
mixed_precision: False            # default is off here; configs that include these params may override it
sync_bn: True
valid_metrics_list:
  - DetectionMetrics:
      # NOTE(review): score_thres here (0.1) differs from the callback's score_threshold (0.01) below - confirm this is intentional.
      score_thres: 0.1
      top_k_predictions: 300
      num_cls: ${arch_params.num_classes}
      normalize_targets: True
      post_prediction_callback:
        _target_: super_gradients.training.models.detection_models.pp_yolo_e.PPYoloEPostPredictionCallback
        score_threshold: 0.01
        nms_top_k: 1000
        max_predictions: 300
        nms_threshold: 0.7
pre_prediction_callback:          # left empty (null)
phase_callbacks:
  - PPYoloETrainingStageSwitchCallback:
      # Absolute interpolation path: assumes this config is mounted under the `training_hyperparams` key.
      static_assigner_end_epoch: ${training_hyperparams.static_assigner_end_epoch}
metric_to_watch: 'mAP@0.50:0.95'
greater_metric_to_watch_is_better: True
_convert_: all

          
        
      

  

Deci-AI / super-gradients connected to https://github.com/Deci-AI/super-gradients.git

#643 PPYolo-E

Deci-AI
/
super-gradients
connected to https://github.com/Deci-AI/super-gradients.git