This repository was archived by the owner on Jun 3, 2025. It is now read-only.

Commit 0f30713

markurtz, jeanniefinks, and bfineran authored
YOLOv5 recipes and apply a recipe tutorial (#334)
* YOLOv5 recipes and tutorials
* fix for reloading set lr modifier
* add model disk size info to yolov5 apply a recipe tutorial table
* update descriptions for recipes
* Update integrations/ultralytics-yolov5/tutorials/sparsifying_yolov5_using_recipes.md (×7, co-authored by Jeannie Finks)
* minor updates and remove transfer learning to break that out into a separate diff
* updates from review
* run make style
* fix export folder structure example
* Update integrations/ultralytics-yolov5/tutorials/sparsifying_yolov5_using_recipes.md (×2, co-authored by Benjamin Fineran)

Co-authored-by: Jeannie Finks <74554921+jeanniefinks@users.noreply.github.com>
Co-authored-by: Benjamin Fineran <bfineran@users.noreply.github.com>
1 parent d9385b0 commit 0f30713

File tree

10 files changed: +1209 −1 lines changed
Lines changed: 49 additions & 0 deletions

```yaml
# parameters
nc: 80 # number of classes
depth_multiple: 1.0 # model depth multiple
width_multiple: 1.0 # layer channel multiple
act: Hardswish

# anchors
anchors:
  - [10,13, 16,30, 33,23] # P3/8
  - [30,61, 62,45, 59,119] # P4/16
  - [116,90, 156,198, 373,326] # P5/32

# YOLOv5 backbone
backbone:
  # [from, number, module, args]
  [[-1, 1, Focus, [64, 3]], # 0-P1/2
   [-1, 1, Conv, [128, 3, 2]], # 1-P2/4
   [-1, 3, C3, [128]],
   [-1, 1, Conv, [256, 3, 2]], # 3-P3/8
   [-1, 9, C3, [256]],
   [-1, 1, Conv, [512, 3, 2]], # 5-P4/16
   [-1, 9, C3, [512]],
   [-1, 1, Conv, [1024, 3, 2]], # 7-P5/32
   [-1, 1, SPP, [1024, [5, 9, 13]]],
   [-1, 3, C3, [1024, False]], # 9
  ]

# YOLOv5 head
head:
  [[-1, 1, Conv, [512, 1, 1]],
   [-1, 1, nn.Upsample, [None, 2, 'nearest']],
   [[-1, 6], 1, Concat, [1]], # cat backbone P4
   [-1, 3, C3, [512, False]], # 13

   [-1, 1, Conv, [256, 1, 1]],
   [-1, 1, nn.Upsample, [None, 2, 'nearest']],
   [[-1, 4], 1, Concat, [1]], # cat backbone P3
   [-1, 3, C3, [256, False]], # 17 (P3/8-small)

   [-1, 1, Conv, [256, 3, 2]],
   [[-1, 14], 1, Concat, [1]], # cat head P4
   [-1, 3, C3, [512, False]], # 20 (P4/16-medium)

   [-1, 1, Conv, [512, 3, 2]],
   [[-1, 10], 1, Concat, [1]], # cat head P5
   [-1, 3, C3, [1024, False]], # 23 (P5/32-large)

   [[17, 20, 23], 1, Detect, [nc, anchors]], # Detect(P3, P4, P5)
  ]
```
Lines changed: 49 additions & 0 deletions

```yaml
# parameters
nc: 80 # number of classes
depth_multiple: 0.33 # model depth multiple
width_multiple: 0.50 # layer channel multiple
act: Hardswish

# anchors
anchors:
  - [10,13, 16,30, 33,23] # P3/8
  - [30,61, 62,45, 59,119] # P4/16
  - [116,90, 156,198, 373,326] # P5/32

# YOLOv5 backbone
backbone:
  # [from, number, module, args]
  [[-1, 1, Focus, [64, 3]], # 0-P1/2
   [-1, 1, Conv, [128, 3, 2]], # 1-P2/4
   [-1, 3, C3, [128]],
   [-1, 1, Conv, [256, 3, 2]], # 3-P3/8
   [-1, 9, C3, [256]],
   [-1, 1, Conv, [512, 3, 2]], # 5-P4/16
   [-1, 9, C3, [512]],
   [-1, 1, Conv, [1024, 3, 2]], # 7-P5/32
   [-1, 1, SPP, [1024, [5, 9, 13]]],
   [-1, 3, C3, [1024, False]], # 9
  ]

# YOLOv5 head
head:
  [[-1, 1, Conv, [512, 1, 1]],
   [-1, 1, nn.Upsample, [None, 2, 'nearest']],
   [[-1, 6], 1, Concat, [1]], # cat backbone P4
   [-1, 3, C3, [512, False]], # 13

   [-1, 1, Conv, [256, 1, 1]],
   [-1, 1, nn.Upsample, [None, 2, 'nearest']],
   [[-1, 4], 1, Concat, [1]], # cat backbone P3
   [-1, 3, C3, [256, False]], # 17 (P3/8-small)

   [-1, 1, Conv, [256, 3, 2]],
   [[-1, 14], 1, Concat, [1]], # cat head P4
   [-1, 3, C3, [512, False]], # 20 (P4/16-medium)

   [-1, 1, Conv, [512, 3, 2]],
   [[-1, 10], 1, Concat, [1]], # cat head P5
   [-1, 3, C3, [1024, False]], # 23 (P5/32-large)

   [[17, 20, 23], 1, Detect, [nc, anchors]], # Detect(P3, P4, P5)
  ]
```
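Both configurations share the same backbone and head layout; only `depth_multiple` and `width_multiple` differ. Roughly, those multiples scale how many times each block repeats and how many output channels it produces. The helper below is an illustrative sketch of that scaling (assuming repeats rounded to the nearest integer and channels rounded up to a multiple of 8), not the actual parser used by YOLOv5.

```python
import math


def scale_block(num_repeats: int, out_channels: int,
                depth_multiple: float, width_multiple: float) -> tuple:
    """Approximate how YOLOv5 scales a backbone/head entry by the model multiples."""
    # depth_multiple scales how many times a block (e.g. the C3 bottlenecks) repeats
    n = max(round(num_repeats * depth_multiple), 1) if num_repeats > 1 else num_repeats
    # width_multiple scales output channels, rounded up to a multiple of 8
    c = math.ceil(out_channels * width_multiple / 8) * 8
    return n, c


# the [-1, 9, C3, [512]] entry from the configs above:
print(scale_block(9, 512, 1.0, 1.0))    # larger config -> (9, 512)
print(scale_block(9, 512, 0.33, 0.50))  # smaller config -> (3, 256)
```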

integrations/ultralytics-yolov5/recipes/.gitkeep

Whitespace-only changes.
Lines changed: 229 additions & 0 deletions

<!--
Copyright (c) 2021 - present / Neuralmagic, Inc. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing,
software distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
-->

```yaml
---
# General Hyperparams
num_epochs: &num_epochs 180
init_lr: &init_lr 0.01
final_lr: &final_lr 0.002
weights_warmup_lr: &weights_warmup_lr 0
biases_warmup_lr: &biases_warmup_lr 0.1

# Pruning Hyperparams
init_sparsity: &init_sparsity 0.05
pruning_start_epoch: &pruning_start_epoch 4
pruning_end_epoch: &pruning_end_epoch 100
update_frequency: &pruning_update_frequency 1.0
prune_none_target_sparsity: &prune_none_target_sparsity 0.6
prune_low_target_sparsity: &prune_low_target_sparsity 0.75
prune_mid_target_sparsity: &prune_mid_target_sparsity 0.85
prune_high_target_sparsity: &prune_high_target_sparsity 0.9

training_modifiers:
  - !EpochRangeModifier
    start_epoch: 0
    end_epoch: *num_epochs

  - !LearningRateFunctionModifier
    start_epoch: 3
    end_epoch: *num_epochs
    lr_func: cosine
    init_lr: *init_lr
    final_lr: *final_lr

  - !LearningRateFunctionModifier
    start_epoch: 0
    end_epoch: 3
    lr_func: linear
    init_lr: *weights_warmup_lr
    final_lr: *init_lr
    param_groups: [0, 1]

  - !LearningRateFunctionModifier
    start_epoch: 0
    end_epoch: 3
    lr_func: linear
    init_lr: *biases_warmup_lr
    final_lr: *init_lr
    param_groups: [2]

pruning_modifiers:
  - !GMPruningModifier
    params:
      - model.2.cv3.conv.weight
      - model.2.cv1.conv.weight
      - model.2.m.2.cv1.conv.weight
      - model.2.m.1.cv1.conv.weight
      - model.2.m.0.cv1.conv.weight
      - model.24.m.0.weight
      - model.24.m.1.weight
      - model.24.m.2.weight
    init_sparsity: *init_sparsity
    final_sparsity: *prune_none_target_sparsity
    start_epoch: *pruning_start_epoch
    end_epoch: *pruning_end_epoch
    update_frequency: *pruning_update_frequency

  - !GMPruningModifier
    params:
      - model.2.cv2.conv.weight
      - model.6.m.7.cv1.conv.weight
      - model.6.cv1.conv.weight
      - model.6.cv3.conv.weight
      - model.1.conv.weight
      - model.13.m.0.cv1.conv.weight
      - model.17.cv1.conv.weight
      - model.4.m.0.cv1.conv.weight
      - model.17.m.2.cv1.conv.weight
      - model.4.cv2.conv.weight
      - model.2.m.0.cv2.conv.weight
      - model.2.m.2.cv2.conv.weight
      - model.2.m.1.cv2.conv.weight
      - model.4.m.1.cv1.conv.weight
      - model.4.m.2.cv1.conv.weight
      - model.4.m.3.cv1.conv.weight
      - model.4.m.7.cv1.conv.weight
      - model.4.m.8.cv1.conv.weight
      - model.4.m.5.cv1.conv.weight
      - model.4.m.6.cv1.conv.weight
      - model.4.m.4.cv1.conv.weight
      - model.17.m.1.cv1.conv.weight
      - model.23.m.1.cv1.conv.weight
      - model.9.m.1.cv1.conv.weight
      - model.23.m.0.cv1.conv.weight
      - model.23.m.2.cv1.conv.weight
      - model.4.cv3.conv.weight
      - model.4.cv1.conv.weight
      - model.17.m.0.cv1.conv.weight
      - model.23.cv1.conv.weight
      - model.9.m.0.cv1.conv.weight
      - model.13.m.1.cv1.conv.weight
      - model.6.m.8.cv1.conv.weight
      - model.9.m.2.cv1.conv.weight
      - model.6.m.2.cv1.conv.weight
      - model.9.cv1.conv.weight
      - model.20.cv1.conv.weight
      - model.13.cv1.conv.weight
      - model.6.m.4.cv1.conv.weight
      - model.6.m.5.cv1.conv.weight
      - model.13.m.2.cv1.conv.weight
      - model.6.m.6.cv1.conv.weight
      - model.6.m.1.cv1.conv.weight
      - model.6.m.3.cv1.conv.weight
      - model.20.m.1.cv1.conv.weight
      - model.20.m.0.cv1.conv.weight
      - model.6.m.0.cv1.conv.weight
      - model.8.cv1.conv.weight
    init_sparsity: *init_sparsity
    final_sparsity: *prune_low_target_sparsity
    start_epoch: *pruning_start_epoch
    end_epoch: *pruning_end_epoch
    update_frequency: *pruning_update_frequency

  - !GMPruningModifier
    params:
      - model.20.cv3.conv.weight
      - model.6.m.0.cv2.conv.weight
      - model.8.cv2.conv.weight
      - model.13.m.2.cv2.conv.weight
      - model.20.cv2.conv.weight
      - model.6.m.8.cv2.conv.weight
      - model.6.m.2.cv2.conv.weight
      - model.6.m.7.cv2.conv.weight
      - model.6.m.1.cv2.conv.weight
      - model.6.m.5.cv2.conv.weight
      - model.6.m.4.cv2.conv.weight
      - model.6.m.6.cv2.conv.weight
      - model.6.m.3.cv2.conv.weight
      - model.13.m.1.cv2.conv.weight
      - model.13.m.0.cv2.conv.weight
      - model.5.conv.weight
      - model.9.cv3.conv.weight
      - model.17.m.2.cv2.conv.weight
      - model.17.cv2.conv.weight
      - model.20.m.2.cv1.conv.weight
      - model.9.cv2.conv.weight
      - model.17.m.1.cv2.conv.weight
      - model.4.m.8.cv2.conv.weight
      - model.4.m.7.cv2.conv.weight
      - model.4.m.6.cv2.conv.weight
      - model.4.m.5.cv2.conv.weight
      - model.10.conv.weight
      - model.4.m.3.cv2.conv.weight
      - model.4.m.2.cv2.conv.weight
      - model.4.m.4.cv2.conv.weight
      - model.4.m.0.cv2.conv.weight
      - model.4.m.1.cv2.conv.weight
      - model.17.cv3.conv.weight
      - model.6.cv2.conv.weight
      - model.3.conv.weight
      - model.13.cv3.conv.weight
      - model.13.cv2.conv.weight
      - model.14.conv.weight
    init_sparsity: *init_sparsity
    final_sparsity: *prune_mid_target_sparsity
    start_epoch: *pruning_start_epoch
    end_epoch: *pruning_end_epoch
    update_frequency: *pruning_update_frequency

  - !GMPruningModifier
    params:
      - model.23.m.2.cv2.conv.weight
      - model.21.conv.weight
      - model.17.m.0.cv2.conv.weight
      - model.23.m.1.cv2.conv.weight
      - model.23.m.0.cv2.conv.weight
      - model.9.m.1.cv2.conv.weight
      - model.9.m.0.cv2.conv.weight
      - model.23.cv3.conv.weight
      - model.9.m.2.cv2.conv.weight
      - model.23.cv2.conv.weight
      - model.20.m.2.cv2.conv.weight
      - model.18.conv.weight
      - model.7.conv.weight
      - model.20.m.1.cv2.conv.weight
      - model.20.m.0.cv2.conv.weight
    init_sparsity: *init_sparsity
    final_sparsity: *prune_high_target_sparsity
    start_epoch: *pruning_start_epoch
    end_epoch: *pruning_end_epoch
    update_frequency: *pruning_update_frequency
---
```
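The `training_modifiers` above amount to a 3-epoch linear warmup (separate schedules for the weight and bias parameter groups) followed by a cosine decay from 0.01 down to 0.002 over the 180 epochs. The sketch below traces that trajectory under the conventional linear and cosine forms; the exact behavior is defined by SparseML's `LearningRateFunctionModifier`, so treat this as an approximation.

```python
import math


def recipe_lr(epoch: float, param_group: int) -> float:
    """Approximate LR trajectory encoded by the recipe's training_modifiers."""
    init_lr, final_lr, num_epochs, warmup = 0.01, 0.002, 180, 3
    if epoch < warmup:
        # param groups 0/1 (weights) warm up from 0; group 2 (biases) warms down from 0.1
        start = 0.0 if param_group in (0, 1) else 0.1
        return start + (init_lr - start) * (epoch / warmup)
    # cosine decay from init_lr to final_lr over the remaining epochs
    t = (epoch - warmup) / (num_epochs - warmup)
    return final_lr + (init_lr - final_lr) * (1 + math.cos(math.pi * t)) / 2


print(recipe_lr(0, 2), recipe_lr(3, 0), recipe_lr(180, 0))  # -> 0.1, 0.01, 0.002
```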

# YOLOv5l Pruned

This recipe creates a sparse [YOLOv5l](https://github.com/ultralytics/yolov5) model that achieves 98% recovery of its baseline accuracy on the COCO dataset (0.654 mAP@0.5 baseline vs. 0.643 mAP@0.5 for this recipe).
Training was done using 4 GPUs at half precision with a total batch size of 64 using the [SparseML integration with ultralytics/yolov5](https://github.com/neuralmagic/sparseml/tree/main/integrations/ultralytics-yolov5).

When running, adjust the hyperparameters based on your training environment and dataset.
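The pruning hyperparameters prune each layer group from 5% sparsity at epoch 4 up to its 60–90% target by epoch 100, updating once per epoch. A rough sketch of a single layer's trajectory, assuming SparseML's default cubic interpolation for `GMPruningModifier` (the exact interpolation may vary by version):

```python
def gm_sparsity(epoch: float, start: float = 4, end: float = 100,
                init: float = 0.05, final: float = 0.9) -> float:
    """Approximate sparsity schedule for a GMPruningModifier (cubic interpolation)."""
    if epoch <= start:
        return init
    if epoch >= end:
        return final
    t = (epoch - start) / (end - start)                 # progress through the pruning window
    return init + (final - init) * (1 - (1 - t) ** 3)   # prune quickly early, taper off late


for e in (4, 20, 50, 100):
    print(e, round(gm_sparsity(e), 3))  # 0.05 -> ~0.41 -> ~0.78 -> 0.9
```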
## Training

To set up the training environment, follow the instructions in the [integration README](https://github.com/neuralmagic/sparseml/blob/main/integrations/ultralytics-yolov5/README.md).
From the `yolov5` directory, the following command can be used to launch this recipe with the provided training script.
Adjust the script command for your GPU device setup.
Ultralytics supports both DataParallel and DDP.

*script command:*

```bash
python train.py \
  --cfg ../models/yolov5l.yaml \
  --weights PRETRAINED_WEIGHTS \
  --data coco.yaml \
  --hyp data/hyp.scratch.yaml \
  --recipe ../recipes/yolov5l.pruned.md
```
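The integration's `train.py` parses and applies the recipe internally. For a plain PyTorch training loop, a minimal sketch of applying a recipe like this with SparseML's `ScheduledModifierManager` could look as follows; `model`, `train_loader`, and `loss_fn` are assumed to exist, and the exact API surface may differ between SparseML versions.

```python
import torch

from sparseml.pytorch.optim import ScheduledModifierManager

# model, train_loader, and loss_fn are assumed to be defined elsewhere
optimizer = torch.optim.SGD(model.parameters(), lr=0.01, momentum=0.9)

# parse the recipe (the YAML front matter above) and wrap the optimizer so the
# pruning and learning-rate modifiers run as part of each optimizer step
manager = ScheduledModifierManager.from_yaml("recipes/yolov5l.pruned.md")
optimizer = manager.modify(model, optimizer, steps_per_epoch=len(train_loader))

for epoch in range(180):  # num_epochs from the recipe
    for images, targets in train_loader:
        optimizer.zero_grad()
        loss = loss_fn(model(images), targets)
        loss.backward()
        optimizer.step()

manager.finalize(model)  # clean up pruning hooks once training completes
```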
