@@ -9,18 +9,27 @@ train_dataset_params:
 
                               input_dim: [640, 640]
                
 
                               cache_dir:
                
 
                               cache: False
                
 
                            +  ignore_empty_annotations: False
                
 
                               transforms:
                
 
                            +    - DetectionMosaic:
                
 
                            +        input_dim: ${dataset_params.train_dataset_params.input_dim}
                
 
                            +        prob: 1.
                
 
                                 - DetectionRandomAffine:
                
 
                                     degrees: 0.                  # rotation degrees, randomly sampled from [-degrees, degrees]
                
 
                                     translate: 0.1                # image translation fraction
                
 
                                     scales: [ 0.5, 1.5 ]              # random rescale range (keeps size by padding/cropping) after mosaic transform.
                
 
                                     shear: 0.0                    # shear degrees, randomly sampled from [-degrees, degrees]
                
 
                                     target_size: ${dataset_params.train_dataset_params.input_dim}
                
 
                            -        filter_box_candidates: True   # whether to filter out transformed bboxes by edge size, area ratio, and aspect ratio.
                
 
                            +        filter_box_candidates: False  # whether to filter out transformed bboxes by edge size, area ratio, and aspect ratio.
                
 
                                     wh_thr: 2                     # edge size threshold when filter_box_candidates = True (pixels)
                
 
                                     area_thr: 0.1                 # threshold for area ratio between original image and the transformed one, when filter_box_candidates = True
                
 
                                     ar_thr: 20                    # aspect ratio threshold when filter_box_candidates = True
                
 
                                     border_value: 128
                
 
                            +#    - DetectionMixup:
                
 
                            +#        input_dim: ${dataset_params.train_dataset_params.input_dim}
                
 
                            +#        mixup_scale: [ 0.5, 1.5 ]         # random rescale range for the additional sample in mixup
                
 
                            +#        prob: 1.0                       # probability to apply per-sample mixup
                
 
                            +#        flip_prob: 0.5                  # probability to apply horizontal flip
                
 
                                 - DetectionHSV:
                
 
                                     prob: 1.0                       # probability to apply HSV transform
                
 
                                     hgain: 5                        # HSV transform hue gain (randomly sampled from [-hgain, hgain])
                
@@ -30,8 +39,11 @@ train_dataset_params:
 
                                     prob: 0.5                       # probability to apply horizontal flip
                
 
                                 - DetectionPaddedRescale:
                
 
                                     input_dim: ${dataset_params.train_dataset_params.input_dim}
                
 
                            -        max_targets: 120
                
 
                            +        max_targets: 300
                
 
                            +    - DetectionStandardize:
                
 
                            +        max_value: 255.
                
 
                                 - DetectionTargetsFormatTransform:
                
 
                            +        max_targets: 300
                
 
                                     input_dim: ${dataset_params.train_dataset_params.input_dim}
                
 
                                     output_format: LABEL_CXCYWH
                
 
                               tight_box_rotation: False
                
@@ -43,8 +55,8 @@ train_dataset_params:
 
                             train_dataloader_params:
                
 
                               shuffle: True
                
 
                               batch_size: 16
                
 
                            -  num_workers: 0
                
 
                            -  sampler:
                
 
                            +  min_samples: 512
                
 
                            +  num_workers: 4
                
 
                               drop_last: False
                
 
                               pin_memory: True
                
 
                               worker_init_fn:
                
@@ -60,11 +72,16 @@ val_dataset_params:
 
                               input_dim: [640, 640]
                
 
                               cache_dir:
                
 
                               cache: False
                
 
                            +  ignore_empty_annotations: False
                
 
                               transforms:
                
 
                               - DetectionPaddedRescale:
                
 
                                   input_dim: ${dataset_params.val_dataset_params.input_dim}
                
 
                            +      max_targets: 300
                
 
                            +      pad_value: 114
                
 
                            +  - DetectionStandardize:
                
 
                            +      max_value: 255.
                
 
                               - DetectionTargetsFormatTransform:
                
 
                            -      max_targets: 50
                
 
                            +      max_targets: 300
                
 
                                   input_dim: ${dataset_params.val_dataset_params.input_dim}
                
 
                                   output_format: LABEL_CXCYWH
                
 
                               tight_box_rotation: False
                
@@ -74,10 +91,10 @@ val_dataset_params:
 
                               verbose: 0
                
 
                             val_dataloader_params:
                
 
                            -  batch_size: 64
                
 
                            -  num_workers: 0
                
 
                            -  sampler:
                
 
                            +  batch_size: 32
                
 
                            +  num_workers: 4
                
 
                               drop_last: False
                
 
                            +  shuffle: False
                
 
                               pin_memory: True
                
 
                               collate_fn: # collate function for valset
                
 
                                 _target_: super_gradients.training.utils.detection_utils.CrowdDetectionCollateFN