Commit 5a104e99 authored by Aristeidis Tsaris's avatar Aristeidis Tsaris
Browse files

adding more plots

parent be5d1f2a
This source diff could not be displayed because it is too large. You can view the blob instead.
#!/bin/bash
# Begin LSF directives
#BSUB -P gen166
#BSUB -J sc21
#BSUB -o logs/sc21.o%J
#BSUB -W 0:30
#BSUB -nnodes 1
#BSUB -alloc_flags "nvme smt4"
####BSUB -N
# End LSF directives and begin shell commands
nnodes=$(cat ${LSB_DJOB_HOSTFILE} | sort | uniq | grep -v login | grep -v batch | wc -l)
DATA_DIR=/gpfs/wolf/gen166/proj-shared/atsaris/imagenet/data/
LOG_DIR=/gpfs/wolf/gen166/proj-shared/atsaris/pytorch_tutorial/ascent/ascent_logs/
source /gpfs/wolf/gen166/proj-shared/atsaris/env/activate.sh
jsrun --smpiargs="-disable_gpu_hooks" -n${nnodes} -a1 -c42 -g1 -r1 \
--bind=proportional-packed:7 --launch_distribution=packed \
bash -c "\
source export_DDP_envvars.sh && \
python -u ../imagenet/main.py \
--arch resnet50 \
-j 1 \
-p 10 \
-b 128\
--training-only \
--raport-file ${LOG_DIR}/benchmark.dataload.opt.1GPU.json \
--epochs 1 \
--prof 100 \
--no-checkpoints \
--data-backend pytorch \
--amp \
--memory-format nhwc \
--dtLdTime \
${DATA_DIR}
"
......@@ -21,11 +21,11 @@ jsrun --smpiargs="-disable_gpu_hooks" -n${nnodes} -a5 -c42 -g5 -r1 \
source export_DDP_envvars.sh && \
python -u ../imagenet/main.py \
--arch resnet50 \
-j 1 \
-j 28 \
-p 10 \
-b 128\
--training-only \
--raport-file ${LOG_DIR}/benchmark.dataload.opt.5GPU.json \
--raport-file ${LOG_DIR}/benchmark.dataload.opt.1N.json \
--epochs 1 \
--prof 100 \
--no-checkpoints \
......@@ -35,3 +35,44 @@ jsrun --smpiargs="-disable_gpu_hooks" -n${nnodes} -a5 -c42 -g5 -r1 \
--dtLdTime \
${DATA_DIR}
"
jsrun --smpiargs="-disable_gpu_hooks" -n${nnodes} -a5 -c42 -g5 -r1 \
--bind=proportional-packed:7 --launch_distribution=packed \
bash -c "\
source export_DDP_envvars.sh && \
python -u ../imagenet/main.py \
--arch resnet50 \
-j 28 \
-p 10 \
-b 128\
--training-only \
--raport-file ${LOG_DIR}/benchmark.syntetic.opt.1N.json \
--epochs 1 \
--prof 100 \
--no-checkpoints \
--data-backend syntetic \
--amp \
--memory-format nhwc \
${DATA_DIR}
"
jsrun --smpiargs="-disable_gpu_hooks" -n${nnodes} -a5 -c42 -g5 -r1 \
--bind=proportional-packed:7 --launch_distribution=packed \
bash -c "\
source export_DDP_envvars.sh && \
python -u ../imagenet/main.py \
--arch resnet50 \
-j 28 \
-p 10 \
-b 128\
--training-only \
--raport-file ${LOG_DIR}/benchmark.syntetic.noddp.opt.1N.json \
--epochs 1 \
--prof 100 \
--no-checkpoints \
--data-backend syntetic \
--amp \
--memory-format nhwc \
--noDDP \
${DATA_DIR}
"
......@@ -21,11 +21,11 @@ jsrun --smpiargs="-disable_gpu_hooks" -n${nnodes} -a5 -c42 -g5 -r1 \
source export_DDP_envvars.sh && \
python -u ../imagenet/main.py \
--arch resnet50 \
-j 1 \
-j 28 \
-p 10 \
-b 128\
--training-only \
--raport-file ${LOG_DIR}/benchmark.dataload.opt.10GPU.json \
--raport-file ${LOG_DIR}/benchmark.dataload.opt.2N.json \
--epochs 1 \
--prof 100 \
--no-checkpoints \
......@@ -35,3 +35,44 @@ jsrun --smpiargs="-disable_gpu_hooks" -n${nnodes} -a5 -c42 -g5 -r1 \
--dtLdTime \
${DATA_DIR}
"
jsrun --smpiargs="-disable_gpu_hooks" -n${nnodes} -a5 -c42 -g5 -r1 \
--bind=proportional-packed:7 --launch_distribution=packed \
bash -c "\
source export_DDP_envvars.sh && \
python -u ../imagenet/main.py \
--arch resnet50 \
-j 28 \
-p 10 \
-b 128\
--training-only \
--raport-file ${LOG_DIR}/benchmark.syntetic.opt.2N.json \
--epochs 1 \
--prof 100 \
--no-checkpoints \
--data-backend syntetic \
--amp \
--memory-format nhwc \
${DATA_DIR}
"
jsrun --smpiargs="-disable_gpu_hooks" -n${nnodes} -a5 -c42 -g5 -r1 \
--bind=proportional-packed:7 --launch_distribution=packed \
bash -c "\
source export_DDP_envvars.sh && \
python -u ../imagenet/main.py \
--arch resnet50 \
-j 28 \
-p 10 \
-b 128\
--training-only \
--raport-file ${LOG_DIR}/benchmark.syntetic.noddp.opt.2N.json \
--epochs 1 \
--prof 100 \
--no-checkpoints \
--data-backend syntetic \
--amp \
--memory-format nhwc \
--noDDP \
${DATA_DIR}
"
......@@ -21,11 +21,11 @@ jsrun --smpiargs="-disable_gpu_hooks" -n${nnodes} -a5 -c42 -g5 -r1 \
source export_DDP_envvars.sh && \
python -u ../imagenet/main.py \
--arch resnet50 \
-j 1 \
-j 28 \
-p 10 \
-b 128\
--training-only \
--raport-file ${LOG_DIR}/benchmark.dataload.opt.15GPU.json \
--raport-file ${LOG_DIR}/benchmark.dataload.opt.3N.json \
--epochs 1 \
--prof 100 \
--no-checkpoints \
......@@ -35,3 +35,44 @@ jsrun --smpiargs="-disable_gpu_hooks" -n${nnodes} -a5 -c42 -g5 -r1 \
--dtLdTime \
${DATA_DIR}
"
jsrun --smpiargs="-disable_gpu_hooks" -n${nnodes} -a5 -c42 -g5 -r1 \
--bind=proportional-packed:7 --launch_distribution=packed \
bash -c "\
source export_DDP_envvars.sh && \
python -u ../imagenet/main.py \
--arch resnet50 \
-j 28 \
-p 10 \
-b 128\
--training-only \
--raport-file ${LOG_DIR}/benchmark.syntetic.opt.3N.json \
--epochs 1 \
--prof 100 \
--no-checkpoints \
--data-backend syntetic \
--amp \
--memory-format nhwc \
${DATA_DIR}
"
jsrun --smpiargs="-disable_gpu_hooks" -n${nnodes} -a5 -c42 -g5 -r1 \
--bind=proportional-packed:7 --launch_distribution=packed \
bash -c "\
source export_DDP_envvars.sh && \
python -u ../imagenet/main.py \
--arch resnet50 \
-j 28 \
-p 10 \
-b 128\
--training-only \
--raport-file ${LOG_DIR}/benchmark.syntetic.noddp.opt.3N.json \
--epochs 1 \
--prof 100 \
--no-checkpoints \
--data-backend syntetic \
--amp \
--memory-format nhwc \
--noDDP \
${DATA_DIR}
"
......@@ -21,11 +21,11 @@ jsrun --smpiargs="-disable_gpu_hooks" -n${nnodes} -a5 -c42 -g5 -r1 \
source export_DDP_envvars.sh && \
python -u ../imagenet/main.py \
--arch resnet50 \
-j 1 \
-j 28 \
-p 10 \
-b 128\
--training-only \
--raport-file ${LOG_DIR}/benchmark.dataload.opt.20GPU.json \
--raport-file ${LOG_DIR}/benchmark.dataload.opt.4N.json \
--epochs 1 \
--prof 100 \
--no-checkpoints \
......@@ -35,3 +35,44 @@ jsrun --smpiargs="-disable_gpu_hooks" -n${nnodes} -a5 -c42 -g5 -r1 \
--dtLdTime \
${DATA_DIR}
"
jsrun --smpiargs="-disable_gpu_hooks" -n${nnodes} -a5 -c42 -g5 -r1 \
--bind=proportional-packed:7 --launch_distribution=packed \
bash -c "\
source export_DDP_envvars.sh && \
python -u ../imagenet/main.py \
--arch resnet50 \
-j 28 \
-p 10 \
-b 128\
--training-only \
--raport-file ${LOG_DIR}/benchmark.syntetic.opt.4N.json \
--epochs 1 \
--prof 100 \
--no-checkpoints \
--data-backend syntetic \
--amp \
--memory-format nhwc \
${DATA_DIR}
"
jsrun --smpiargs="-disable_gpu_hooks" -n${nnodes} -a5 -c42 -g5 -r1 \
--bind=proportional-packed:7 --launch_distribution=packed \
bash -c "\
source export_DDP_envvars.sh && \
python -u ../imagenet/main.py \
--arch resnet50 \
-j 28 \
-p 10 \
-b 128\
--training-only \
--raport-file ${LOG_DIR}/benchmark.syntetic.noddp.opt.4N.json \
--epochs 1 \
--prof 100 \
--no-checkpoints \
--data-backend syntetic \
--amp \
--memory-format nhwc \
--noDDP \
${DATA_DIR}
"
Supports Markdown
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment