Skip to content

Commit

Permalink
instance segmentation SOTA params
Browse files Browse the repository at this point in the history
  • Loading branch information
JSabadin committed Jan 29, 2025
1 parent f04678f commit 6d27f76
Show file tree
Hide file tree
Showing 6 changed files with 33 additions and 15 deletions.
1 change: 1 addition & 0 deletions configs/detection_heavy_model.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,7 @@ loader:
dataset_name: coco_test

trainer:
precision: "16-mixed"
preprocessing:
train_image_size: [384, 512]
keep_aspect_ratio: true
Expand Down
1 change: 1 addition & 0 deletions configs/detection_light_model.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,7 @@ loader:
dataset_name: coco_test

trainer:
precision: "16-mixed"
preprocessing:
train_image_size: [384, 512]
keep_aspect_ratio: true
Expand Down
16 changes: 12 additions & 4 deletions configs/instance_segmentation_heavy_model.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -16,6 +16,7 @@ loader:
dataset_name: coco_test

trainer:
precision: "16-mixed"
preprocessing:
train_image_size: [384, 512]
keep_aspect_ratio: true
Expand All @@ -27,10 +28,10 @@ trainer:

batch_size: 8
epochs: &epochs 300
accumulate_grad_batches: 8 # For best results, always accumulate gradients to reach an effective batch size of 64
n_workers: 8
n_workers: 4
validation_interval: 10
n_log_images: 8
gradient_clip_val: 10

callbacks:
- name: EMACallback
Expand All @@ -40,15 +41,22 @@ trainer:
decay_tau: 2000
- name: ExportOnTrainEnd
- name: TestOnTrainEnd
- name: GradientAccumulationScheduler
params:
scheduling: # warmup phase is 3 epochs
0: 1
1: 4
2: 8 # For best results, always accumulate gradients to reach an effective batch size of 64

training_strategy:
name: "TripleLRSGDStrategy"
params:
warmup_epochs: 3
warmup_bias_lr: 0.1
warmup_bias_lr: 0.0
warmup_momentum: 0.8
lr: 0.01
lre: 0.0001
momentum: 0.937
weight_decay: 0.0005
nesterov: True
nesterov: True
cosine_annealing: False
18 changes: 13 additions & 5 deletions configs/instance_segmentation_light_model.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -16,8 +16,9 @@ loader:
dataset_name: coco_test

trainer:
precision: "16-mixed"
preprocessing:
train_image_size: [384, 512]
train_image_size: [384, 384]
keep_aspect_ratio: true
normalize:
active: true
Expand All @@ -27,10 +28,10 @@ trainer:

batch_size: 8
epochs: &epochs 300
accumulate_grad_batches: 8 # For best results, always accumulate gradients to reach an effective batch size of 64
n_workers: 8
n_workers: 4
validation_interval: 10
n_log_images: 8
gradient_clip_val: 10

callbacks:
- name: EMACallback
Expand All @@ -40,15 +41,22 @@ trainer:
decay_tau: 2000
- name: ExportOnTrainEnd
- name: TestOnTrainEnd
- name: GradientAccumulationScheduler
params:
scheduling: # warmup phase is 3 epochs
0: 1
1: 4
2: 8 # For best results, always accumulate gradients to reach an effective batch size of 64

training_strategy:
name: "TripleLRSGDStrategy"
params:
warmup_epochs: 3
warmup_bias_lr: 0.1
warmup_bias_lr: 0.0
warmup_momentum: 0.8
lr: 0.01
lre: 0.0001
momentum: 0.937
weight_decay: 0.0005
nesterov: True
nesterov: True
cosine_annealing: False
6 changes: 3 additions & 3 deletions configs/keypoint_bbox_heavy_model.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -30,7 +30,7 @@ trainer:
std: [1, 1, 1]

batch_size: 8
epochs: &epochs 100
epochs: &epochs 300
n_workers: 4
validation_interval: 10
n_log_images: 8
Expand All @@ -46,10 +46,10 @@ trainer:
- name: TestOnTrainEnd
- name: GradientAccumulationScheduler
params:
scheduling:
scheduling: # warmup phase is 3 epochs
0: 1
1: 4
2: 8
2: 8 # For best results, always accumulate gradients to reach an effective batch size of 64

training_strategy:
name: "TripleLRSGDStrategy"
Expand Down
6 changes: 3 additions & 3 deletions configs/keypoint_bbox_light_model.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -30,7 +30,7 @@ trainer:
std: [1, 1, 1]

batch_size: 8
epochs: &epochs 100
epochs: &epochs 300
n_workers: 4
validation_interval: 10
n_log_images: 8
Expand All @@ -46,10 +46,10 @@ trainer:
- name: TestOnTrainEnd
- name: GradientAccumulationScheduler
params:
scheduling:
scheduling: # warmup phase is 3 epochs
0: 1
1: 4
2: 8
2: 8 # For best results, always accumulate gradients to reach an effective batch size of 64

training_strategy:
name: "TripleLRSGDStrategy"
Expand Down

0 comments on commit 6d27f76

Please sign in to comment.