Преглед изворног кода

Fix missing multiproc in example training script

Andrzej Sulecki пре 5 година
родитељ
комит
b946389828
28 измењених фајлова са 28 додато и 28 уклоњено
  1. 1 1
      PyTorch/Classification/ConvNets/resnet50v1.5/training/AMP/DGX1V_resnet50_AMP_250E.sh
  2. 1 1
      PyTorch/Classification/ConvNets/resnet50v1.5/training/AMP/DGX1V_resnet50_AMP_90E.sh
  3. 1 1
      PyTorch/Classification/ConvNets/resnet50v1.5/training/AMP/DGX2V_resnet50_AMP_250E.sh
  4. 1 1
      PyTorch/Classification/ConvNets/resnet50v1.5/training/AMP/DGX2V_resnet50_AMP_90E.sh
  5. 1 1
      PyTorch/Classification/ConvNets/resnet50v1.5/training/AMP/DGXA100_resnet50_AMP_250E.sh
  6. 1 1
      PyTorch/Classification/ConvNets/resnet50v1.5/training/AMP/DGXA100_resnet50_AMP_90E.sh
  7. 1 1
      PyTorch/Classification/ConvNets/resnet50v1.5/training/FP32/DGX1V_resnet50_FP32_250E.sh
  8. 1 1
      PyTorch/Classification/ConvNets/resnet50v1.5/training/FP32/DGX1V_resnet50_FP32_90E.sh
  9. 1 1
      PyTorch/Classification/ConvNets/resnet50v1.5/training/FP32/DGX2V_resnet50_FP32_250E.sh
  10. 1 1
      PyTorch/Classification/ConvNets/resnet50v1.5/training/FP32/DGX2V_resnet50_FP32_90E.sh
  11. 1 1
      PyTorch/Classification/ConvNets/resnet50v1.5/training/TF32/DGXA100_resnet50_TF32_250E.sh
  12. 1 1
      PyTorch/Classification/ConvNets/resnet50v1.5/training/TF32/DGXA100_resnet50_TF32_90E.sh
  13. 1 1
      PyTorch/Classification/ConvNets/resnext101-32x4d/training/AMP/DGX1V_resnext101-32x4d_AMP_250E.sh
  14. 1 1
      PyTorch/Classification/ConvNets/resnext101-32x4d/training/AMP/DGX1V_resnext101-32x4d_AMP_90E.sh
  15. 1 1
      PyTorch/Classification/ConvNets/resnext101-32x4d/training/AMP/DGXA100_resnext101-32x4d_AMP_250E.sh
  16. 1 1
      PyTorch/Classification/ConvNets/resnext101-32x4d/training/AMP/DGXA100_resnext101-32x4d_AMP_90E.sh
  17. 1 1
      PyTorch/Classification/ConvNets/resnext101-32x4d/training/FP32/DGX1V_resnext101-32x4d_FP32_250E.sh
  18. 1 1
      PyTorch/Classification/ConvNets/resnext101-32x4d/training/FP32/DGX1V_resnext101-32x4d_FP32_90E.sh
  19. 1 1
      PyTorch/Classification/ConvNets/resnext101-32x4d/training/TF32/DGXA100_resnext101-32x4d_TF32_250E.sh
  20. 1 1
      PyTorch/Classification/ConvNets/resnext101-32x4d/training/TF32/DGXA100_resnext101-32x4d_TF32_90E.sh
  21. 1 1
      PyTorch/Classification/ConvNets/se-resnext101-32x4d/training/AMP/DGX1V_se-resnext101-32x4d_AMP_250E.sh
  22. 1 1
      PyTorch/Classification/ConvNets/se-resnext101-32x4d/training/AMP/DGX1V_se-resnext101-32x4d_AMP_90E.sh
  23. 1 1
      PyTorch/Classification/ConvNets/se-resnext101-32x4d/training/AMP/DGXA100_se-resnext101-32x4d_AMP_250E.sh
  24. 1 1
      PyTorch/Classification/ConvNets/se-resnext101-32x4d/training/AMP/DGXA100_se-resnext101-32x4d_AMP_90E.sh
  25. 1 1
      PyTorch/Classification/ConvNets/se-resnext101-32x4d/training/FP32/DGX1V_se-resnext101-32x4d_FP32_250E.sh
  26. 1 1
      PyTorch/Classification/ConvNets/se-resnext101-32x4d/training/FP32/DGX1V_se-resnext101-32x4d_FP32_90E.sh
  27. 1 1
      PyTorch/Classification/ConvNets/se-resnext101-32x4d/training/TF32/DGXA100_se-resnext101-32x4d_TF32_250E.sh
  28. 1 1
      PyTorch/Classification/ConvNets/se-resnext101-32x4d/training/TF32/DGXA100_se-resnext101-32x4d_TF32_90E.sh

+ 1 - 1
PyTorch/Classification/ConvNets/resnet50v1.5/training/AMP/DGX1V_resnet50_AMP_250E.sh

@@ -1 +1 @@
-python ./launch.py --model resnet50 --precision AMP --mode convergence --platform DGX1V /imagenet --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnet50 --precision AMP --mode convergence --platform DGX1V /imagenet --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnet50v1.5/training/AMP/DGX1V_resnet50_AMP_90E.sh

@@ -1 +1 @@
-python ./launch.py --model resnet50 --precision AMP --mode convergence --platform DGX1V /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnet50 --precision AMP --mode convergence --platform DGX1V /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnet50v1.5/training/AMP/DGX2V_resnet50_AMP_250E.sh

@@ -1 +1 @@
-python ./launch.py --model resnet50 --precision AMP --mode convergence --platform DGX2V /imagenet --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnet50 --precision AMP --mode convergence --platform DGX2V /imagenet --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnet50v1.5/training/AMP/DGX2V_resnet50_AMP_90E.sh

@@ -1 +1 @@
-python ./launch.py --model resnet50 --precision AMP --mode convergence --platform DGX2V /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnet50 --precision AMP --mode convergence --platform DGX2V /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnet50v1.5/training/AMP/DGXA100_resnet50_AMP_250E.sh

@@ -1 +1 @@
-python ./launch.py --model resnet50 --precision AMP --mode convergence --platform DGXA100 /imagenet --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnet50 --precision AMP --mode convergence --platform DGXA100 /imagenet --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnet50v1.5/training/AMP/DGXA100_resnet50_AMP_90E.sh

@@ -1 +1 @@
-python ./launch.py --model resnet50 --precision AMP --mode convergence --platform DGXA100 /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnet50 --precision AMP --mode convergence --platform DGXA100 /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnet50v1.5/training/FP32/DGX1V_resnet50_FP32_250E.sh

@@ -1 +1 @@
-python ./launch.py --model resnet50 --precision FP32 --mode convergence --platform DGX1V /imagenet --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnet50 --precision FP32 --mode convergence --platform DGX1V /imagenet --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnet50v1.5/training/FP32/DGX1V_resnet50_FP32_90E.sh

@@ -1 +1 @@
-python ./launch.py --model resnet50 --precision FP32 --mode convergence --platform DGX1V /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnet50 --precision FP32 --mode convergence --platform DGX1V /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnet50v1.5/training/FP32/DGX2V_resnet50_FP32_250E.sh

@@ -1 +1 @@
-python ./launch.py --model resnet50 --precision FP32 --mode convergence --platform DGX2V /imagenet --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnet50 --precision FP32 --mode convergence --platform DGX2V /imagenet --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnet50v1.5/training/FP32/DGX2V_resnet50_FP32_90E.sh

@@ -1 +1 @@
-python ./launch.py --model resnet50 --precision FP32 --mode convergence --platform DGX2V /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnet50 --precision FP32 --mode convergence --platform DGX2V /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnet50v1.5/training/TF32/DGXA100_resnet50_TF32_250E.sh

@@ -1 +1 @@
-python ./launch.py --model resnet50 --precision TF32 --mode convergence --platform DGXA100 /imagenet --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnet50 --precision TF32 --mode convergence --platform DGXA100 /imagenet --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnet50v1.5/training/TF32/DGXA100_resnet50_TF32_90E.sh

@@ -1 +1 @@
-python ./launch.py --model resnet50 --precision TF32 --mode convergence --platform DGXA100 /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnet50 --precision TF32 --mode convergence --platform DGXA100 /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnext101-32x4d/training/AMP/DGX1V_resnext101-32x4d_AMP_250E.sh

@@ -1 +1 @@
-python ./launch.py --model resnext101-32x4d --precision AMP --mode convergence --platform DGX1V /imagenet --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnext101-32x4d --precision AMP --mode convergence --platform DGX1V /imagenet --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnext101-32x4d/training/AMP/DGX1V_resnext101-32x4d_AMP_90E.sh

@@ -1 +1 @@
-python ./launch.py --model resnext101-32x4d --precision AMP --mode convergence --platform DGX1V /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnext101-32x4d --precision AMP --mode convergence --platform DGX1V /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnext101-32x4d/training/AMP/DGXA100_resnext101-32x4d_AMP_250E.sh

@@ -1 +1 @@
-python ./launch.py --model resnext101-32x4d --precision AMP --mode convergence --platform DGXA100 /imagenet --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnext101-32x4d --precision AMP --mode convergence --platform DGXA100 /imagenet --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnext101-32x4d/training/AMP/DGXA100_resnext101-32x4d_AMP_90E.sh

@@ -1 +1 @@
-python ./launch.py --model resnext101-32x4d --precision AMP --mode convergence --platform DGXA100 /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnext101-32x4d --precision AMP --mode convergence --platform DGXA100 /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnext101-32x4d/training/FP32/DGX1V_resnext101-32x4d_FP32_250E.sh

@@ -1 +1 @@
-python ./launch.py --model resnext101-32x4d --precision FP32 --mode convergence --platform DGX1V /imagenet --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnext101-32x4d --precision FP32 --mode convergence --platform DGX1V /imagenet --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnext101-32x4d/training/FP32/DGX1V_resnext101-32x4d_FP32_90E.sh

@@ -1 +1 @@
-python ./launch.py --model resnext101-32x4d --precision FP32 --mode convergence --platform DGX1V /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnext101-32x4d --precision FP32 --mode convergence --platform DGX1V /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnext101-32x4d/training/TF32/DGXA100_resnext101-32x4d_TF32_250E.sh

@@ -1 +1 @@
-python ./launch.py --model resnext101-32x4d --precision TF32 --mode convergence --platform DGXA100 /imagenet --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnext101-32x4d --precision TF32 --mode convergence --platform DGXA100 /imagenet --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/resnext101-32x4d/training/TF32/DGXA100_resnext101-32x4d_TF32_90E.sh

@@ -1 +1 @@
-python ./launch.py --model resnext101-32x4d --precision TF32 --mode convergence --platform DGXA100 /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model resnext101-32x4d --precision TF32 --mode convergence --platform DGXA100 /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/se-resnext101-32x4d/training/AMP/DGX1V_se-resnext101-32x4d_AMP_250E.sh

@@ -1 +1 @@
-python ./launch.py --model se-resnext101-32x4d --precision AMP --mode convergence --platform DGX1V /imagenet --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model se-resnext101-32x4d --precision AMP --mode convergence --platform DGX1V /imagenet --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/se-resnext101-32x4d/training/AMP/DGX1V_se-resnext101-32x4d_AMP_90E.sh

@@ -1 +1 @@
-python ./launch.py --model se-resnext101-32x4d --precision AMP --mode convergence --platform DGX1V /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model se-resnext101-32x4d --precision AMP --mode convergence --platform DGX1V /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/se-resnext101-32x4d/training/AMP/DGXA100_se-resnext101-32x4d_AMP_250E.sh

@@ -1 +1 @@
-python ./launch.py --model se-resnext101-32x4d --precision AMP --mode convergence --platform DGXA100 /imagenet --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model se-resnext101-32x4d --precision AMP --mode convergence --platform DGXA100 /imagenet --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/se-resnext101-32x4d/training/AMP/DGXA100_se-resnext101-32x4d_AMP_90E.sh

@@ -1 +1 @@
-python ./launch.py --model se-resnext101-32x4d --precision AMP --mode convergence --platform DGXA100 /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model se-resnext101-32x4d --precision AMP --mode convergence --platform DGXA100 /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/se-resnext101-32x4d/training/FP32/DGX1V_se-resnext101-32x4d_FP32_250E.sh

@@ -1 +1 @@
-python ./launch.py --model se-resnext101-32x4d --precision FP32 --mode convergence --platform DGX1V /imagenet --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model se-resnext101-32x4d --precision FP32 --mode convergence --platform DGX1V /imagenet --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/se-resnext101-32x4d/training/FP32/DGX1V_se-resnext101-32x4d_FP32_90E.sh

@@ -1 +1 @@
-python ./launch.py --model se-resnext101-32x4d --precision FP32 --mode convergence --platform DGX1V /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model se-resnext101-32x4d --precision FP32 --mode convergence --platform DGX1V /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/se-resnext101-32x4d/training/TF32/DGXA100_se-resnext101-32x4d_TF32_250E.sh

@@ -1 +1 @@
-python ./launch.py --model se-resnext101-32x4d --precision TF32 --mode convergence --platform DGXA100 /imagenet --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model se-resnext101-32x4d --precision TF32 --mode convergence --platform DGXA100 /imagenet --workspace ${1:-./} --raport-file raport.json

+ 1 - 1
PyTorch/Classification/ConvNets/se-resnext101-32x4d/training/TF32/DGXA100_se-resnext101-32x4d_TF32_90E.sh

@@ -1 +1 @@
-python ./launch.py --model se-resnext101-32x4d --precision TF32 --mode convergence --platform DGXA100 /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json
+python ./multiproc.py --nproc_per_node 8 ./launch.py --model se-resnext101-32x4d --precision TF32 --mode convergence --platform DGXA100 /imagenet --epochs 90 --mixup 0.0 --workspace ${1:-./} --raport-file raport.json