Skip to content

Commit 08b32cc

Browse files
committed
fix slurm scripts
1 parent bad5387 commit 08b32cc

File tree

3 files changed

+5
-4
lines changed

3 files changed

+5
-4
lines changed

multimodal/vl2l/scripts/slurm/benchmark.sh

Lines changed: 0 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -25,8 +25,6 @@ srun \
2525
--vllm.model.repo_id=${MODEL_REPO_ID} \
2626
--vllm.cli=--async-scheduling \
2727
--vllm.cli=--max-model-len=32768 \
28-
--vllm.cli=--max-num-seqs=1024 \
29-
--vllm.cli=--mm-encoder-tp-mode=data \
3028
--vllm.cli=--limit-mm-per-prompt.video=0 \
3129
--vllm.cli=--tensor-parallel-size=8 \
3230
--settings.logging.log_output.outdir=${OUTPUT_CONTAINER_DIR}/${SLURM_JOB_ID}

multimodal/vl2l/scripts/slurm/evaluate.sh

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -9,10 +9,13 @@
99
#SBATCH --output=evaluate-slurm-output-%j.txt
1010
#SBATCH --error=evaluate-slurm-error-%j.txt
1111

12+
export NVIDIA_VISIBLE_DEVICES=void
13+
1214
srun \
1315
--container-image=${CONTAINER_IMAGE} \
1416
--container-mounts=${CACHE_HOST_DIR}:${CACHE_CONTAINER_DIR},${OUTPUT_HOST_DIR}:${OUTPUT_CONTAINER_DIR} \
1517
--no-container-mount-home \
18+
--container-env=NVIDIA_VISIBLE_DEVICES \
1619
mlperf-inf-mm-vl2l evaluate \
1720
--dataset.token=${DATASET_TOKEN} \
18-
--filename=${OUTPUT_CONTAINER_DIR}/${SLURM_JOB_ID}/mlperf_log_accuracy.json
21+
--filename=${OUTPUT_CONTAINER_DIR}/${BENCHMARK_JOB_ID}/mlperf_log_accuracy.json

multimodal/vl2l/scripts/slurm/submit.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -197,7 +197,7 @@ benchmark_job_id=$(
197197
if [[ "${mode}" == "accuracy_only" ]]; then
198198
sbatch \
199199
--dependency=afterok:"${benchmark_job_id}" \
200-
--export=CACHE_HOST_DIR="${cache_host_dir}",CACHE_CONTAINER_DIR="${cache_container_dir}",OUTPUT_HOST_DIR="${output_host_dir}",OUTPUT_CONTAINER_DIR="${output_container_dir}",CONTAINER_IMAGE="${container_image}",DATASET_TOKEN="${dataset_token}" \
200+
--export=CACHE_HOST_DIR="${cache_host_dir}",CACHE_CONTAINER_DIR="${cache_container_dir}",OUTPUT_HOST_DIR="${output_host_dir}",OUTPUT_CONTAINER_DIR="${output_container_dir}",CONTAINER_IMAGE="${container_image}",DATASET_TOKEN="${dataset_token}",BENCHMARK_JOB_ID="${benchmark_job_id}" \
201201
--account="${slurm_account}" \
202202
--partition="${evaluate_slurm_partition}" \
203203
evaluate.sh

0 commit comments

Comments
 (0)