Skip to content

Commit 6ffc098

Browse files
krishung5 authored and nv-anants committed
test: Add deepep test for vllm (#2534)
1 parent 3ba93a0 commit 6ffc098

File tree

3 files changed

+33
-1
lines changed

3 files changed

+33
-1
lines changed

components/backends/vllm/launch/dsr1_dep.sh

Lines changed: 8 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -10,6 +10,7 @@ NODE_RANK=""
1010
GPUS_PER_NODE=""
1111
MASTER_ADDR="localhost"
1212
LOG_DIR="./logs"
13+
MODEL="deepseek-ai/DeepSeek-R1"
1314

1415
# Parse command line arguments
1516
while [[ $# -gt 0 ]]; do
@@ -34,6 +35,10 @@ while [[ $# -gt 0 ]]; do
3435
LOG_DIR="$2"
3536
shift 2
3637
;;
38+
--model)
39+
MODEL="$2"
40+
shift 2
41+
;;
3742
-h|--help)
3843
echo "Usage: $0 [OPTIONS]"
3944
echo "Options:"
@@ -42,6 +47,7 @@ while [[ $# -gt 0 ]]; do
4247
echo " --gpus-per-node L Number of GPUs per node (required, int)"
4348
echo " --master-addr ADDR Master node address (default: localhost)"
4449
echo " --log-dir DIR Directory for log files (default: ./logs)"
50+
echo " --model MODEL Model name to use (default: deepseek-ai/DeepSeek-R1)"
4551
echo " -h, --help Show this help message"
4652
exit 0
4753
;;
@@ -71,6 +77,7 @@ echo " GPUs per node: $GPUS_PER_NODE"
7177
echo " Data parallel size: $DATA_PARALLEL_SIZE"
7278
echo " Master address: $MASTER_ADDR"
7379
echo " Log directory: $LOG_DIR"
80+
echo " Model name: $MODEL"
7481

7582
trap 'echo Cleaning up...; kill 0' EXIT
7683

@@ -90,7 +97,7 @@ for ((i=0; i<GPUS_PER_NODE; i++)); do
9097
VLLM_USE_DEEP_GEMM=1 \
9198
VLLM_RANDOMIZE_DP_DUMMY_INPUTS=1 \
9299
python3 -m dynamo.vllm \
93-
--model deepseek-ai/DeepSeek-R1 \
100+
--model $MODEL \
94101
--data_parallel_size $DATA_PARALLEL_SIZE \
95102
--data-parallel-rank $dp_rank \
96103
--enable-expert-parallel \

pyproject.toml

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -175,6 +175,7 @@ markers = [
175175
"trtllm_marker: marks tests as requiring trtllm",
176176
"sglang: marks tests as requiring sglang",
177177
"slow: marks tests as known to be slow",
178+
"h100: marks tests to run on H100",
178179
"kvbm: marks tests for KV behavior and model determinism"
179180
]
180181

tests/serve/test_vllm.py

Lines changed: 24 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -260,6 +260,30 @@ def wait_for_ready(self, payload, logger=logging.getLogger()):
260260
model="Qwen/Qwen3-0.6B",
261261
delayed_start=45,
262262
),
263+
"deepep": VLLMConfig(
264+
name="deepep",
265+
directory="/workspace/components/backends/vllm",
266+
script_name="dsr1_dep.sh",
267+
marks=[pytest.mark.gpu_2, pytest.mark.vllm, pytest.mark.h100],
268+
endpoints=["v1/chat/completions", "v1/completions"],
269+
response_handlers=[
270+
chat_completions_response_handler,
271+
completions_response_handler,
272+
],
273+
model="deepseek-ai/DeepSeek-V2-Lite",
274+
delayed_start=45,
275+
args=[
276+
"--model",
277+
"deepseek-ai/DeepSeek-V2-Lite",
278+
"--num-nodes",
279+
"1",
280+
"--node-rank",
281+
"0",
282+
"--gpus-per-node",
283+
"2",
284+
],
285+
timeout=300,
286+
),
263287
"multimodal_agg": VLLMConfig(
264288
name="multimodal_agg",
265289
directory="/workspace/examples/multimodal",

0 commit comments

Comments
 (0)