Skip to content

Commit 17b26bd

Browse files
Enabling the ROCm-vLLM CI on MI250 machines (#432)
* Enabling ROCm CI on MI250 machines:
  - correct build target
  - correct queue

  Signed-off-by: Alexei V. Ivanov <alexei.ivanov@amd.com>

---------

Signed-off-by: Alexei V. Ivanov <alexei.ivanov@amd.com>
1 parent 4fd2f5b commit 17b26bd

File tree

2 files changed

+13
-1
lines changed

2 files changed

+13
-1
lines changed

.buildkite/test-pipeline.yaml

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -92,7 +92,9 @@ steps:
9292
- VLLM_ATTENTION_BACKEND=FLASH_ATTN pytest -v -s basic_correctness/test_chunked_prefill.py
9393

9494
- label: Core Test # 10min
95+
working_dir: "/vllm-workspace/tests"
9596
mirror_hardwares: [amd]
97+
amd_gpus: 4 # Just for the sake of queue testing
9698
fast_check: true
9799
source_file_dependencies:
98100
- vllm/core
@@ -105,6 +107,7 @@ steps:
105107
working_dir: "/vllm-workspace/tests"
106108
fast_check: true
107109
mirror_hardwares: [amd]
110+
amd_gpus: 2 # Just for the sake of queue testing
108111
source_file_dependencies:
109112
- vllm/
110113
- tests/entrypoints/llm
@@ -186,6 +189,7 @@ steps:
186189
- pytest -v -s engine test_sequence.py test_config.py test_logger.py
187190
# OOM in the CI unless we run this separately
188191
- pytest -v -s tokenization
192+
working_dir: "/vllm-workspace/tests" # optional
189193

190194
- label: V1 Test
191195
#mirror_hardwares: [amd]
@@ -230,6 +234,7 @@ steps:
230234
- python3 offline_inference/profiling.py --model facebook/opt-125m run_num_steps --num-steps 2
231235

232236
- label: Prefix Caching Test # 9min
237+
working_dir: "/vllm-workspace/tests"
233238
mirror_hardwares: [amd]
234239
source_file_dependencies:
235240
- vllm/
@@ -248,6 +253,7 @@ steps:
248253
- VLLM_USE_FLASHINFER_SAMPLER=1 pytest -v -s samplers
249254

250255
- label: LogitsProcessor Test # 5min
256+
working_dir: "/vllm-workspace/tests"
251257
mirror_hardwares: [amd]
252258
source_file_dependencies:
253259
- vllm/model_executor/layers
@@ -269,7 +275,9 @@ steps:
269275
- pytest -v -s spec_decode/e2e/test_eagle_correctness.py
270276

271277
- label: LoRA Test %N # 15min each
278+
working_dir: "/vllm-workspace/tests"
272279
mirror_hardwares: [amd]
280+
amd_gpus: 8
273281
source_file_dependencies:
274282
- vllm/lora
275283
- tests/lora
@@ -295,7 +303,9 @@ steps:
295303
- pytest -v -s compile/test_full_graph.py
296304

297305
- label: Kernels Test %N # 1h each
306+
working_dir: "/vllm-workspace/tests"
298307
mirror_hardwares: [amd]
308+
amd_gpus: 8
299309
source_file_dependencies:
300310
- csrc/
301311
- vllm/attention
@@ -305,6 +315,7 @@ steps:
305315
parallelism: 4
306316

307317
- label: Tensorizer Test # 11min
318+
working_dir: "/vllm-workspace/tests"
308319
mirror_hardwares: [amd]
309320
soft_fail: true
310321
source_file_dependencies:
@@ -355,6 +366,7 @@ steps:
355366
- pytest -v -s encoder_decoder
356367

357368
- label: OpenAI-Compatible Tool Use # 20 min
369+
working_dir: "/vllm-workspace/tests"
358370
fast_check: false
359371
mirror_hardwares: [ amd ]
360372
source_file_dependencies:

.buildkite/test-template.j2

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@ steps:
77
- label: ":docker: build image"
88
depends_on: ~
99
commands:
10-
- "docker build --build-arg max_jobs=16 --tag {{ docker_image_amd }} -f Dockerfile.rocm --progress plain ."
10+
- "docker build --build-arg max_jobs=16 --tag {{ docker_image_amd }} -f Dockerfile.rocm --target test --progress plain ."
1111
- "docker push {{ docker_image_amd }}"
1212
key: "amd-build"
1313
env:

0 commit comments

Comments
 (0)