Skip to content

Commit f1d24eb

Browse files
NickLucche authored and 0xrushi committed
[CI] Nixl integration tests DP-EP (vllm-project#27199)
Signed-off-by: NickLucche <nlucches@redhat.com>
Signed-off-by: 0xrushi <6279035+0xrushi@users.noreply.github.com>
1 parent 2fb57bf commit f1d24eb

File tree

2 files changed

+10
-1
lines changed

2 files changed

+10
-1
lines changed

tests/v1/kv_connector/nixl_integration/run_accuracy_test.sh

Lines changed: 9 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -178,8 +178,16 @@ run_tests_for_model() {
178178
--port $PORT \
179179
--enforce-eager \
180180
--gpu-memory-utilization $GPU_MEMORY_UTILIZATION \
181-
--tensor-parallel-size $DECODER_TP_SIZE \
182181
--kv-transfer-config '$KV_CONFIG'"
182+
183+
# DP-EP attention mode
184+
if [[ -z "$DP_EP" ]]; then
185+
BASE_CMD="${BASE_CMD} --tensor-parallel-size $DECODER_TP_SIZE"
186+
else
187+
echo "DP-EP Attention enabled, deploying with dp=DECODER_TP_SIZE and tp=1"
188+
BASE_CMD="${BASE_CMD} --data-parallel-size $DECODER_TP_SIZE \
189+
--tensor-parallel-size 1 --enable-expert-parallel"
190+
fi
183191

184192
if [ -n "$model_args" ]; then
185193
FULL_CMD="$BASE_CMD $model_args"

tests/v1/kv_connector/nixl_integration/tp_config_sweep_accuracy_test.sh

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -10,6 +10,7 @@ configs=(
1010
"GPU_MEMORY_UTILIZATION=0.6 PREFILLER_TP_SIZE=1 DECODER_TP_SIZE=2"
1111
"GPU_MEMORY_UTILIZATION=0.8 MODEL_NAMES=deepseek-ai/deepseek-vl2-tiny" # MLA case
1212
"GPU_MEMORY_UTILIZATION=0.8 PREFILLER_TP_SIZE=1 DECODER_TP_SIZE=2 MODEL_NAMES=deepseek-ai/deepseek-vl2-tiny"
13+
"DP_EP=1 GPU_MEMORY_UTILIZATION=0.8 PREFILLER_TP_SIZE=1 DECODER_TP_SIZE=2 MODEL_NAMES=deepseek-ai/deepseek-vl2-tiny" # MLA+P-TP1, D-DPEP=2 (TP=1)
1314
)
1415

1516
run_tests() {

0 commit comments

Comments
 (0)