We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 89026ae commit 73bee9aCopy full SHA for 73bee9a
qa/TL3_SSD_convergence/test_pytorch.sh
@@ -42,7 +42,7 @@ export NCCL_NVLS_ENABLE=0
42
43
# Prevent OOM due to fragmentation on 16G machines
44
export PYTORCH_CUDA_ALLOC_CONF=max_split_size_mb:4096
45
-torchrun --nproc_per_node=${NUM_GPUS} main.py --backbone resnet50 --warmup 300 --bs 256 --eval-batch-size 8 --data /coco --data ${DATA_DIR} --data_pipeline dali --target 0.25 2>&1 | tee $LOG
+torchrun --nproc_per_node=${NUM_GPUS} main.py --backbone resnet50 --warmup 300 --bs 64 --eval-batch-size 8 --data /coco --data ${DATA_DIR} --data_pipeline dali --target 0.25 2>&1 | tee $LOG
46
((IS_TMP_DIR)) && rm -rf ${DATA_DIR}
47
48
RET=${PIPESTATUS[0]}
0 commit comments