@@ -225,7 +225,7 @@ steps:
225225# #### 1 GPU test #####
226226
227227- label : Regression Test # 5min
228- mirror_hardwares : [amdexperimental]
228+ mirror_hardwares : [amdexperimental, amdproduction ]
229229 source_file_dependencies :
230230 - vllm/
231231 - tests/test_regression
@@ -277,7 +277,7 @@ steps:
277277 - pytest -v -s entrypoints/openai/correctness/test_lmeval.py::test_lm_eval_accuracy_v1_engine
278278
279279- label : Examples Test # 25min
280- mirror_hardwares : [amdexperimental]
280+ mirror_hardwares : [amdexperimental, amdproduction ]
281281 working_dir : " /vllm-workspace/examples"
282282 source_file_dependencies :
283283 - vllm/entrypoints
@@ -311,7 +311,7 @@ steps:
311311
312312
313313- label : Platform Tests (CUDA)
314- mirror_hardwares : [amdexperimental]
314+ mirror_hardwares : [amdexperimental, amdproduction ]
315315 source_file_dependencies :
316316 - vllm/
317317 - tests/cuda
@@ -330,7 +330,7 @@ steps:
330330 - VLLM_USE_FLASHINFER_SAMPLER=1 pytest -v -s samplers
331331
332332- label : LoRA Test %N # 15min each
333- mirror_hardwares : [amdexperimental, amdproduction ]
333+ mirror_hardwares : [amdexperimental]
334334 source_file_dependencies :
335335 - vllm/lora
336336 - tests/lora
@@ -382,7 +382,7 @@ steps:
382382 - pytest -v -s kernels/core
383383
384384- label : Kernels Attention Test %N
385- mirror_hardwares : [amdexperimental, amdproduction ]
385+ mirror_hardwares : [amdexperimental]
386386 source_file_dependencies :
387387 - csrc/attention/
388388 - vllm/attention
@@ -393,7 +393,7 @@ steps:
393393 parallelism : 2
394394
395395- label : Kernels Quantization Test %N
396- mirror_hardwares : [amdexperimental, amdproduction ]
396+ mirror_hardwares : [amdexperimental]
397397 source_file_dependencies :
398398 - csrc/quantization/
399399 - vllm/model_executor/layers/quantization
@@ -412,15 +412,15 @@ steps:
412412 - pytest -v -s kernels/moe
413413
414414- label : Kernels Mamba Test
415- mirror_hardwares : [amdexperimental]
415+ mirror_hardwares : [amdexperimental, amdproduction ]
416416 source_file_dependencies :
417417 - csrc/mamba/
418418 - tests/kernels/mamba
419419 commands :
420420 - pytest -v -s kernels/mamba
421421
422422- label : Tensorizer Test # 11min
423- mirror_hardwares : [amdexperimental]
423+ mirror_hardwares : [amdexperimental, amdproduction ]
424424 soft_fail : true
425425 source_file_dependencies :
426426 - vllm/model_executor/model_loader
@@ -490,15 +490,15 @@ steps:
490490 - pytest -s entrypoints/openai/correctness/
491491
492492- label : Encoder Decoder tests # 5min
493- mirror_hardwares : [amdexperimental]
493+ mirror_hardwares : [amdexperimental, amdproduction ]
494494 source_file_dependencies :
495495 - vllm/
496496 - tests/encoder_decoder
497497 commands :
498498 - pytest -v -s encoder_decoder
499499
500500- label : OpenAI-Compatible Tool Use # 20 min
501- mirror_hardwares : [amdexperimental]
501+ mirror_hardwares : [amdexperimental, amdproduction ]
502502 fast_check : false
503503 source_file_dependencies :
504504 - vllm/
@@ -610,7 +610,7 @@ steps:
610610 - pytest -v -s models/multimodal/generation/test_common.py -m 'split(group=1) and not core_model'
611611
612612- label : Quantized Models Test
613- mirror_hardwares : [amdexperimental, amdproduction ]
613+ mirror_hardwares : [amdexperimental]
614614 source_file_dependencies :
615615 - vllm/model_executor/layers/quantization
616616 - tests/models/quantization
0 commit comments