Skip to content

Commit c0134d2

Browse files
committed
revert ds e2e
Signed-off-by: MengqingCao <cmq0113@163.com>
1 parent c7f3b7d commit c0134d2

File tree

1 file changed

+15
-0
lines changed

1 file changed

+15
-0
lines changed

tests/e2e/multicard/test_offline_inference_distributed.py

Lines changed: 15 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -50,6 +50,21 @@ def test_models_distributed_QwQ():
5050
vllm_model.generate_greedy(example_prompts, max_tokens)
5151

5252

53+
def test_models_distributed_DeepSeek():
    """Smoke-test greedy generation with DeepSeek-V2-Lite.

    Builds a ``VllmRunner`` for ``deepseek-ai/DeepSeek-V2-Lite`` in half
    precision with ``tensor_parallel_size=4`` and the ``"mp"`` distributed
    executor backend, then greedily generates 5 tokens for a single prompt.
    The generated output is not inspected by this test.
    """
    prompts = ["Hello, my name is"]
    runner_options = {
        "dtype": "half",
        "tensor_parallel_size": 4,
        "distributed_executor_backend": "mp",
    }
    token_budget = 5

    with VllmRunner("deepseek-ai/DeepSeek-V2-Lite",
                    **runner_options) as vllm_model:
        vllm_model.generate_greedy(prompts, token_budget)
66+
67+
5368
@patch.dict(os.environ, {"VLLM_ASCEND_ENABLE_TOPK_OPTIMIZE": "1"})
5469
def test_models_distributed_topk() -> None:
5570
example_prompts = [

0 commit comments

Comments
 (0)