From a6b889d6d13664f2998fbe5c58d801396882fc5c Mon Sep 17 00:00:00 2001 From: zhewenli Date: Sat, 16 Aug 2025 14:50:04 -0700 Subject: [PATCH 1/2] update checks --- vllm/benchmarks/throughput.py | 8 ++++++++ 1 file changed, 8 insertions(+) diff --git a/vllm/benchmarks/throughput.py b/vllm/benchmarks/throughput.py index fdf6548ada5b..42a0d60c9461 100644 --- a/vllm/benchmarks/throughput.py +++ b/vllm/benchmarks/throughput.py @@ -422,6 +422,14 @@ def validate_args(args): if args.backend == "mii" and args.tokenizer != args.model: raise ValueError( "Tokenizer must be the same as the model for MII backend.") + + # --data-parallel is not supported currently. + # https://github.com/vllm-project/vllm/issues/16222 + if args.data_parallel_size > 1: + raise ValueError( + "Data parallel is not supported in offline benchmark, \ + please use benchmark serving instead" + ) def add_cli_args(parser: argparse.ArgumentParser): From c7e84b57bfa8ab2a75e5dbefca00572d7791ea2f Mon Sep 17 00:00:00 2001 From: zhewenli Date: Sat, 16 Aug 2025 15:03:39 -0700 Subject: [PATCH 2/2] format --- benchmarks/benchmark_throughput.py | 4 ++-- vllm/benchmarks/throughput.py | 4 ++-- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/benchmarks/benchmark_throughput.py b/benchmarks/benchmark_throughput.py index c51b57968652..c7f290e1eb88 100644 --- a/benchmarks/benchmark_throughput.py +++ b/benchmarks/benchmark_throughput.py @@ -597,8 +597,8 @@ def validate_args(args): # https://github.com/vllm-project/vllm/issues/16222 if args.data_parallel_size > 1: raise ValueError( - "Data parallel is not supported in offline benchmark, \ - please use benchmark serving instead" + "Data parallel is not supported in offline benchmark, " + "please use benchmark serving instead" ) diff --git a/vllm/benchmarks/throughput.py b/vllm/benchmarks/throughput.py index 42a0d60c9461..e12cfd896424 100644 --- a/vllm/benchmarks/throughput.py +++ b/vllm/benchmarks/throughput.py @@ -427,8 +427,8 @@ def validate_args(args): # https://github.com/vllm-project/vllm/issues/16222 if args.data_parallel_size > 1: raise ValueError( - "Data parallel is not supported in offline benchmark, \ - please use benchmark serving instead" + "Data parallel is not supported in offline benchmark, " + "please use benchmark serving instead" )