This repository was archived by the owner on Jun 3, 2025. It is now read-only.

Commit 733bef1

Cherry pick amp refactor (#232)
* Ultralytics yolov3 (#224)
  * initial setup
  * update logger implementations with wandb and lambda
  * refactor for loggers and add SparsificationLoggers class
  * rename sparsification logger
  * latest updates for yolov3 integration
  * styling fixes and update recipes
  * fix issue with wandb import in pytorch logger
  * fix failing tests for removed code in pytorch logger
  * fix for quality
* Refactor to enable support for Amp in PyTorch and better support future phase2 work (#231)
  * Refactor to enable support for Amp in PyTorch and better support future phase2 work
  * replace modifiers sorting in BaseManager
  * test fixes
  * add finalize for pruning and quantization modifiers
  * fix for import in base manager
  * address comments from review
  * address comments from review
1 parent ee2ee13 commit 733bef1

32 files changed: +2630 −931 lines
Lines changed: 16 additions & 0 deletions

```html
<!--
Copyright (c) 2021 - present / Neuralmagic, Inc. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing,
software distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
-->
```
Lines changed: 27 additions & 0 deletions

```yaml
lr0: 0.005
lrf: 0.1
momentum: 0.843
weight_decay: 0.00036
warmup_epochs: 40.0
warmup_momentum: 0.5
warmup_bias_lr: 0.05
box: 0.0296
cls: 0.243
cls_pw: 0.631
obj: 0.301
obj_pw: 0.911
iou_t: 0.2
anchor_t: 2.91
fl_gamma: 0.0
hsv_h: 0.0138
hsv_s: 0.664
hsv_v: 0.464
degrees: 0.373
translate: 0.245
scale: 0.898
shear: 0.602
perspective: 0.0
flipud: 0.00856
fliplr: 0.5
mosaic: 1.0
mixup: 0.243
```
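In these hyperparameter files, `lr0` is the initial learning rate and `lrf` is the final-rate fraction; the trainer interpolates a per-epoch multiplier between them. A minimal sketch of that interpolation, assuming the linear decay form used by recent Ultralytics trainers (the exact schedule function is an assumption, not read from this diff):

```python
def linear_lr_lambda(epoch: int, epochs: int = 300, lrf: float = 0.1) -> float:
    """Linear decay of the LR multiplier from 1.0 at epoch 0 to lrf at the last epoch."""
    return (1 - epoch / (epochs - 1)) * (1.0 - lrf) + lrf

# With lr0=0.005 and lrf=0.1 from the file above, the effective LR for each epoch is:
lr0 = 0.005
lrs = [lr0 * linear_lr_lambda(e) for e in range(300)]
```

A schedule with `lr0: 0.0` and `lrf: 0.0` (as in the next file) disables the base learning-rate ramp entirely, which is useful when a recipe's modifiers drive the learning rate instead.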
Lines changed: 27 additions & 0 deletions

```yaml
lr0: 0.0
lrf: 0.0
momentum: 0.843
weight_decay: 0.00036
warmup_epochs: 40.0
warmup_momentum: 0.5
warmup_bias_lr: 0.05
box: 0.0296
cls: 0.243
cls_pw: 0.631
obj: 0.301
obj_pw: 0.911
iou_t: 0.2
anchor_t: 2.91
fl_gamma: 0.0
hsv_h: 0.0138
hsv_s: 0.664
hsv_v: 0.464
degrees: 0.373
translate: 0.245
scale: 0.898
shear: 0.602
perspective: 0.0
flipud: 0.00856
fliplr: 0.5
mosaic: 1.0
mixup: 0.243
```
Lines changed: 52 additions & 0 deletions

```yaml
# parameters
nc: 80  # number of classes
depth_multiple: 1.0  # model depth multiple
width_multiple: 1.0  # layer channel multiple
act: nn.LeakyReLU  # activations

# anchors
anchors:
  - [10,13, 16,30, 33,23]  # P3/8
  - [30,61, 62,45, 59,119]  # P4/16
  - [116,90, 156,198, 373,326]  # P5/32

# darknet53 backbone
backbone:
  # [from, number, module, args]
  [[-1, 1, Conv, [32, 3, 1]],  # 0
   [-1, 1, Conv, [64, 3, 2]],  # 1-P1/2
   [-1, 1, Bottleneck, [64]],
   [-1, 1, Conv, [128, 3, 2]],  # 3-P2/4
   [-1, 2, Bottleneck, [128]],
   [-1, 1, Conv, [256, 3, 2]],  # 5-P3/8
   [-1, 8, Bottleneck, [256]],
   [-1, 1, Conv, [512, 3, 2]],  # 7-P4/16
   [-1, 8, Bottleneck, [512]],
   [-1, 1, Conv, [1024, 3, 2]],  # 9-P5/32
   [-1, 4, Bottleneck, [1024]],  # 10
  ]

# YOLOv3-SPP head
head:
  [[-1, 1, Bottleneck, [1024, False]],
   [-1, 1, SPP, [512, [5, 9, 13]]],
   [-1, 1, Conv, [1024, 3, 1]],
   [-1, 1, Conv, [512, 1, 1]],
   [-1, 1, Conv, [1024, 3, 1]],  # 15 (P5/32-large)

   [-2, 1, Conv, [256, 1, 1]],
   [-1, 1, nn.Upsample, [None, 2, 'nearest']],
   [[-1, 8], 1, Concat, [1]],  # cat backbone P4
   [-1, 1, Bottleneck, [512, False]],
   [-1, 1, Bottleneck, [512, False]],
   [-1, 1, Conv, [256, 1, 1]],
   [-1, 1, Conv, [512, 3, 1]],  # 22 (P4/16-medium)

   [-2, 1, Conv, [128, 1, 1]],
   [-1, 1, nn.Upsample, [None, 2, 'nearest']],
   [[-1, 6], 1, Concat, [1]],  # cat backbone P3
   [-1, 1, Bottleneck, [256, False]],
   [-1, 2, Bottleneck, [256, False]],  # 27 (P3/8-small)

   [[27, 22, 15], 1, Detect, [nc, anchors]],  # Detect(P3, P4, P5)
  ]
```
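When a model YAML like this is parsed, `depth_multiple` scales each row's repeat count (`number`) and `width_multiple` scales its output channels, with channels rounded to a hardware-friendly multiple. A minimal sketch of that scaling rule, modeled on the `parse_model`/`make_divisible` convention in the Ultralytics codebase (the helper names and the divisor of 8 are assumptions, not taken from this diff):

```python
import math

def make_divisible(x: float, divisor: int = 8) -> int:
    """Round a channel count up to the nearest multiple of divisor."""
    return math.ceil(x / divisor) * divisor

def scale_layer(number: int, channels: int,
                depth_multiple: float = 1.0, width_multiple: float = 1.0):
    """Scale a [from, number, module, args] row's repeat count and output channels."""
    n = max(round(number * depth_multiple), 1) if number > 1 else number
    c2 = make_divisible(channels * width_multiple)
    return n, c2

# With the 1.0 multiples in this file, every layer passes through unchanged:
print(scale_layer(8, 256))  # the 8x Bottleneck[256] block at P3/8 -> (8, 256)
```

A smaller variant could set, say, `depth_multiple: 0.33` and `width_multiple: 0.5` to shrink the same architecture definition without editing the layer list.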
Lines changed: 202 additions & 0 deletions

<!--
Copyright (c) 2021 - present / Neuralmagic, Inc. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing,
software distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
-->

---
# General Epoch/LR variables
num_epochs: &num_epochs 300.0

# pruning hyperparameters
init_sparsity: &init_sparsity 0.05
pruning_start_epoch: &pruning_start_epoch 0.0
pruning_end_epoch: &pruning_end_epoch 80.0
update_frequency: &pruning_update_frequency 0.5


# modifiers
training_modifiers:
  - !EpochRangeModifier
    start_epoch: 0.0
    end_epoch: *num_epochs

pruning_modifiers:
  - !GMPruningModifier
    params:
      - model.16.conv.weight
      - model.19.cv1.conv.weight
      - model.26.cv2.conv.weight
    init_sparsity: *init_sparsity
    final_sparsity: 0.6
    start_epoch: *pruning_start_epoch
    end_epoch: *pruning_end_epoch
    update_frequency: *pruning_update_frequency

  - !GMPruningModifier
    params:
      - model.12.cv1.conv.weight
      - model.14.conv.weight
      - model.2.cv1.conv.weight
      - model.20.cv2.conv.weight
      - model.22.conv.weight
      - model.26.cv1.conv.weight
      - model.27.1.cv1.conv.weight
      - model.28.m.0.weight
      - model.28.m.2.weight
      - model.4.0.cv1.conv.weight
      - model.6.1.cv1.conv.weight
      - model.6.2.cv1.conv.weight
      - model.6.3.cv1.conv.weight
      - model.6.4.cv1.conv.weight
      - model.6.5.cv1.conv.weight
      - model.6.6.cv1.conv.weight
      - model.6.7.cv1.conv.weight
      - model.8.0.cv1.conv.weight
      - model.8.1.cv1.conv.weight
      - model.8.2.cv1.conv.weight
      - model.8.3.cv1.conv.weight
      - model.8.4.cv1.conv.weight
      - model.8.5.cv1.conv.weight
      - model.8.6.cv1.conv.weight
      - model.8.7.cv1.conv.weight
    init_sparsity: *init_sparsity
    final_sparsity: 0.75
    start_epoch: *pruning_start_epoch
    end_epoch: *pruning_end_epoch
    update_frequency: *pruning_update_frequency

  - !GMPruningModifier
    params:
      - model.1.conv.weight
      - model.10.0.cv1.conv.weight
      - model.10.1.cv1.conv.weight
      - model.10.2.cv1.conv.weight
      - model.10.3.cv1.conv.weight
      - model.11.cv1.conv.weight
      - model.12.cv2.conv.weight
      - model.19.cv2.conv.weight
      - model.2.cv2.conv.weight
      - model.27.0.cv1.conv.weight
      - model.27.0.cv2.conv.weight
      - model.27.1.cv2.conv.weight
      - model.28.m.1.weight
      - model.3.conv.weight
      - model.4.0.cv2.conv.weight
      - model.4.1.cv1.conv.weight
      - model.4.1.cv2.conv.weight
      - model.5.conv.weight
      - model.6.0.cv1.conv.weight
      - model.6.0.cv2.conv.weight
      - model.6.1.cv2.conv.weight
      - model.6.2.cv2.conv.weight
      - model.6.3.cv2.conv.weight
    init_sparsity: *init_sparsity
    final_sparsity: 0.8
    start_epoch: *pruning_start_epoch
    end_epoch: *pruning_end_epoch
    update_frequency: *pruning_update_frequency

  - !GMPruningModifier
    params:
      - model.10.0.cv2.conv.weight
      - model.10.1.cv2.conv.weight
      - model.10.2.cv2.conv.weight
      - model.10.3.cv2.conv.weight
      - model.11.cv2.conv.weight
      - model.13.conv.weight
      - model.15.conv.weight
      - model.20.cv1.conv.weight
      - model.21.conv.weight
      - model.23.conv.weight
      - model.6.4.cv2.conv.weight
      - model.6.5.cv2.conv.weight
      - model.6.6.cv2.conv.weight
      - model.6.7.cv2.conv.weight
      - model.7.conv.weight
      - model.8.0.cv2.conv.weight
      - model.8.1.cv2.conv.weight
      - model.8.2.cv2.conv.weight
      - model.8.3.cv2.conv.weight
      - model.8.4.cv2.conv.weight
      - model.8.5.cv2.conv.weight
      - model.8.6.cv2.conv.weight
      - model.8.7.cv2.conv.weight
      - model.9.conv.weight
    init_sparsity: *init_sparsity
    final_sparsity: 0.92
    start_epoch: *pruning_start_epoch
    end_epoch: *pruning_end_epoch
    update_frequency: *pruning_update_frequency
---

# YOLOv3-SPP Pruned

This recipe creates a sparse [YOLOv3-SPP](https://arxiv.org/abs/1804.02767) model that
achieves 97% recovery of its baseline accuracy on the COCO detection dataset.
Training was done on 4 GPUs at half precision with a total training batch size of 256,
using the
[SparseML integration with ultralytics/yolov3](https://github.com/neuralmagic/sparseml/tree/main/integrations/ultralytics-yolov3).

When running, adjust hyperparameters based on the training environment and dataset.

## Training
To set up the training environment, follow the instructions on the
[integration README](https://github.com/neuralmagic/sparseml/blob/main/integrations/ultralytics-yolov3/README.md).
Using the given training script from the `yolov3` directory, the following command can be used
to launch this recipe. The contents of the `hyp.pruned.yaml` hyperparameters file are given below.
Adjust the script command for your GPU device setup. Ultralytics supports both DataParallel and DDP.

*script command:*

```bash
python train.py \
  --recipe ../recipes/yolov3-spp.pruned.md \
  --weights PRETRAINED_WEIGHTS \
  --cfg ../models/yolov3-spp.lrelu.yaml \
  --data coco.yaml \
  --hyp ../data/hyp.pruned.yaml \
  --batch-size 256 \
  --name yolov3-spp-lrelu-pruned
```

hyp.pruned.yaml:
```yaml
lr0: 0.005
lrf: 0.1
momentum: 0.843
weight_decay: 0.00036
warmup_epochs: 40.0
warmup_momentum: 0.5
warmup_bias_lr: 0.05
box: 0.0296
cls: 0.243
cls_pw: 0.631
obj: 0.301
obj_pw: 0.911
iou_t: 0.2
anchor_t: 2.91
fl_gamma: 0.0
hsv_h: 0.0138
hsv_s: 0.664
hsv_v: 0.464
degrees: 0.373
translate: 0.245
scale: 0.898
shear: 0.602
perspective: 0.0
flipud: 0.00856
fliplr: 0.5
mosaic: 1.0
mixup: 0.243
```
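Each `!GMPruningModifier` in the recipe above ramps its layer group from `init_sparsity` (0.05) to its `final_sparsity` between `start_epoch` and `end_epoch`, re-applying the mask every `update_frequency` epochs. A minimal sketch of the commonly used cubic interpolation for that ramp (the exact curve SparseML applies is an assumption here; treat this as illustrative, not the library's implementation):

```python
def gm_sparsity(epoch: float, init_sparsity: float = 0.05,
                final_sparsity: float = 0.8,
                start_epoch: float = 0.0, end_epoch: float = 80.0) -> float:
    """Cubic ramp from init_sparsity to final_sparsity over [start_epoch, end_epoch]."""
    if epoch <= start_epoch:
        return init_sparsity
    if epoch >= end_epoch:
        return final_sparsity
    progress = (epoch - start_epoch) / (end_epoch - start_epoch)
    # Cubic schedule: prune aggressively early, taper off as sparsity rises.
    return final_sparsity + (init_sparsity - final_sparsity) * (1 - progress) ** 3

# Sparsity targets at every 0.5-epoch update step, as scheduled by update_frequency:
targets = [gm_sparsity(step * 0.5) for step in range(161)]
```

With the recipe's values, the 0.8-sparsity group reaches roughly 0.71 sparsity halfway through pruning (epoch 40), then creeps toward 0.8 by epoch 80, after which the schedule holds the final mask for the remaining fine-tuning epochs.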
