9292 - VLLM_ATTENTION_BACKEND=FLASH_ATTN pytest -v -s basic_correctness/test_chunked_prefill.py
9393
9494- label : Core Test # 10min
95+ working_dir : " /vllm-workspace/tests"
9596 mirror_hardwares : [amd]
97+ amd_gpus : 4 # Just for the sake of queue testing
9698 fast_check : true
9799 source_file_dependencies :
98100 - vllm/core
@@ -105,6 +107,7 @@ steps:
105107 working_dir : " /vllm-workspace/tests"
106108 fast_check : true
107109 mirror_hardwares : [amd]
110+ amd_gpus : 2 # Just for the sake of queue testing
108111 source_file_dependencies :
109112 - vllm/
110113 - tests/entrypoints/llm
@@ -186,6 +189,7 @@ steps:
186189 - pytest -v -s engine test_sequence.py test_config.py test_logger.py
187190 # OOM in the CI unless we run this separately
188191 - pytest -v -s tokenization
192+ working_dir : " /vllm-workspace/tests" # optional
189193
190194- label : V1 Test
191195 # mirror_hardwares: [amd]
@@ -230,6 +234,7 @@ steps:
230234 - python3 offline_inference/profiling.py --model facebook/opt-125m run_num_steps --num-steps 2
231235
232236- label : Prefix Caching Test # 9min
237+ working_dir : " /vllm-workspace/tests"
233238 mirror_hardwares : [amd]
234239 source_file_dependencies :
235240 - vllm/
@@ -248,6 +253,7 @@ steps:
248253 - VLLM_USE_FLASHINFER_SAMPLER=1 pytest -v -s samplers
249254
250255- label : LogitsProcessor Test # 5min
256+ working_dir : " /vllm-workspace/tests"
251257 mirror_hardwares : [amd]
252258 source_file_dependencies :
253259 - vllm/model_executor/layers
@@ -269,7 +275,9 @@ steps:
269275 - pytest -v -s spec_decode/e2e/test_eagle_correctness.py
270276
271277- label : LoRA Test %N # 15min each
278+ working_dir : " /vllm-workspace/tests"
272279 mirror_hardwares : [amd]
280+ amd_gpus : 8
273281 source_file_dependencies :
274282 - vllm/lora
275283 - tests/lora
@@ -295,7 +303,9 @@ steps:
295303 - pytest -v -s compile/test_full_graph.py
296304
297305- label : Kernels Test %N # 1h each
306+ working_dir : " /vllm-workspace/tests"
298307 mirror_hardwares : [amd]
308+ amd_gpus : 8
299309 source_file_dependencies :
300310 - csrc/
301311 - vllm/attention
@@ -305,6 +315,7 @@ steps:
305315 parallelism : 4
306316
307317- label : Tensorizer Test # 11min
318+ working_dir : " /vllm-workspace/tests"
308319 mirror_hardwares : [amd]
309320 soft_fail : true
310321 source_file_dependencies :
@@ -355,6 +366,7 @@ steps:
355366 - pytest -v -s encoder_decoder
356367
357368- label : OpenAI-Compatible Tool Use # 20 min
369+ working_dir : " /vllm-workspace/tests"
358370 fast_check : false
359371 mirror_hardwares : [ amd ]
360372 source_file_dependencies :
0 commit comments