|
94 | 94 | @pytest.mark.parametrize("batch_size", [1, 32]) |
95 | 95 | @pytest.mark.parametrize("seed", [1]) |
96 | 96 | def test_mtp_e2e_greedy_correctness( |
97 | | - enable_model_scope_env, |
| 97 | + enable_modelscope_env, |
98 | 98 | vllm_runner, |
99 | 99 | common_llm_kwargs, |
100 | 100 | per_test_common_llm_kwargs, |
@@ -145,7 +145,7 @@ def test_mtp_e2e_greedy_correctness( |
145 | 145 | @pytest.mark.parametrize("batch_size", [1, 32]) |
146 | 146 | @pytest.mark.parametrize("seed", [1]) |
147 | 147 | def test_mtp_e2e_quant_greedy_correctness( |
148 | | - enable_model_scope_env, |
| 148 | + enable_modelscope_env, |
149 | 149 | vllm_runner, |
150 | 150 | common_llm_kwargs, |
151 | 151 | per_test_common_llm_kwargs, |
@@ -204,7 +204,7 @@ def test_mtp_e2e_quant_greedy_correctness( |
204 | 204 | @pytest.mark.parametrize("seed", [1]) |
205 | 205 | @pytest.mark.parametrize("logprobs", [1, 6]) |
206 | 206 | def test_mtp_e2e_greedy_logprobs( |
207 | | - enable_model_scope_env, |
| 207 | + enable_modelscope_env, |
208 | 208 | vllm_runner, |
209 | 209 | common_llm_kwargs, |
210 | 210 | per_test_common_llm_kwargs, |
@@ -263,7 +263,7 @@ def test_mtp_e2e_greedy_logprobs( |
263 | 263 | @pytest.mark.parametrize("batch_size", [1, 32]) |
264 | 264 | @pytest.mark.parametrize("seed", [1]) |
265 | 265 | def test_mtp_e2e_greedy_correctness_torchair_graph( |
266 | | - enable_model_scope_env, |
| 266 | + enable_modelscope_env, |
267 | 267 | vllm_runner, |
268 | 268 | common_llm_kwargs, |
269 | 269 | per_test_common_llm_kwargs, |
@@ -314,7 +314,7 @@ def test_mtp_e2e_greedy_correctness_torchair_graph( |
314 | 314 | @pytest.mark.parametrize("batch_size", [1, 32]) |
315 | 315 | @pytest.mark.parametrize("seed", [1]) |
316 | 316 | def test_mtp_e2e_quant_greedy_correctness_torchair_graph( |
317 | | - enable_model_scope_env, |
| 317 | + enable_modelscope_env, |
318 | 318 | vllm_runner, |
319 | 319 | common_llm_kwargs, |
320 | 320 | per_test_common_llm_kwargs, |
@@ -372,7 +372,7 @@ def test_mtp_e2e_quant_greedy_correctness_torchair_graph( |
372 | 372 | @pytest.mark.parametrize("batch_size", [4]) |
373 | 373 | @pytest.mark.parametrize("seed", [1]) |
374 | 374 | def test_mtp_e2e_greedy_correctness_with_preemption( |
375 | | - enable_model_scope_env, |
| 375 | + enable_modelscope_env, |
376 | 376 | vllm_runner, |
377 | 377 | common_llm_kwargs, |
378 | 378 | per_test_common_llm_kwargs, |
@@ -430,7 +430,7 @@ def test_mtp_e2e_greedy_correctness_with_preemption( |
430 | 430 | ]) |
431 | 431 | @pytest.mark.parametrize("seed", [1]) |
432 | 432 | def test_mtp_different_k( |
433 | | - enable_model_scope_env, |
| 433 | + enable_modelscope_env, |
434 | 434 | vllm_runner, |
435 | 435 | common_llm_kwargs, |
436 | 436 | per_test_common_llm_kwargs, |
@@ -483,7 +483,7 @@ def test_mtp_different_k( |
483 | 483 | ]) |
484 | 484 | @pytest.mark.parametrize("seed", [1]) |
485 | 485 | def test_mtp_disable_queue( |
486 | | - enable_model_scope_env, |
| 486 | + enable_modelscope_env, |
487 | 487 | vllm_runner, |
488 | 488 | common_llm_kwargs, |
489 | 489 | per_test_common_llm_kwargs, |
|
0 commit comments