Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
62 commits
Select commit Hold shift + click to select a range
45ab9f5
launch pd disagg
cyber-pioneer Apr 15, 2025
7a7076e
merge main
cyber-pioneer Apr 28, 2025
87a0936
fix code
cyber-pioneer Apr 16, 2025
384f92d
fix code
cyber-pioneer Apr 16, 2025
8b647cd
fix conflict
cyber-pioneer Apr 28, 2025
6ebfadd
fix code
cyber-pioneer Apr 16, 2025
c3c55d9
fix code
cyber-pioneer Apr 16, 2025
45f6d7f
fix code
cyber-pioneer Apr 16, 2025
dee02b2
fix code
cyber-pioneer Apr 16, 2025
ca48ee0
fix code
cyber-pioneer Apr 16, 2025
314d41c
fix code
cyber-pioneer Apr 16, 2025
3ea878a
fix code
cyber-pioneer Apr 16, 2025
3e3b7e0
fix code
cyber-pioneer Apr 16, 2025
29dcdd7
fix code
cyber-pioneer Apr 16, 2025
85e6bb1
fix code
cyber-pioneer Apr 16, 2025
cf25c80
fix code
cyber-pioneer Apr 16, 2025
aab9e5a
fix code
cyber-pioneer Apr 16, 2025
ec8f6fd
fix code
cyber-pioneer Apr 16, 2025
1e1bcb8
fix code
cyber-pioneer Apr 16, 2025
987a37c
fix code
cyber-pioneer Apr 17, 2025
b617ac2
fix code
cyber-pioneer Apr 17, 2025
ea0832b
fix code
cyber-pioneer Apr 17, 2025
eea51d2
fix code
cyber-pioneer Apr 17, 2025
8540109
fix code
cyber-pioneer Apr 17, 2025
f3e00a6
fix code
cyber-pioneer Apr 17, 2025
19ba091
fix code
cyber-pioneer Apr 17, 2025
2e8708f
fix code
cyber-pioneer Apr 17, 2025
0bc464a
fix code
cyber-pioneer Apr 17, 2025
abb6e93
fix code
cyber-pioneer Apr 17, 2025
28d385d
v1
cyber-pioneer Apr 17, 2025
f6ad7aa
v2: dev robin
cyber-pioneer Apr 17, 2025
4f8025d
v2: dev robin
cyber-pioneer Apr 17, 2025
5b46227
v2: dev robin
cyber-pioneer Apr 17, 2025
14dd136
v2: dev load
cyber-pioneer Apr 18, 2025
9aaa50b
v2: dev load
cyber-pioneer Apr 18, 2025
c9acd71
v2: dev load
cyber-pioneer Apr 18, 2025
4e60387
polish code
cyber-pioneer Apr 18, 2025
3f6f18e
polish code
cyber-pioneer Apr 18, 2025
bcd23d7
polish code
cyber-pioneer Apr 18, 2025
9dfd44a
polish code
cyber-pioneer Apr 18, 2025
514ceb9
polish code
cyber-pioneer Apr 18, 2025
d44b1fc
polish code
cyber-pioneer Apr 18, 2025
a4fe733
polish code
cyber-pioneer Apr 18, 2025
6337fe1
remove debug code
cyber-pioneer Apr 18, 2025
42543a8
code
cyber-pioneer Apr 28, 2025
4d48282
fix code
cyber-pioneer Apr 28, 2025
2a0d12a
fix code
cyber-pioneer Apr 28, 2025
e7dca53
add pd of vllm support flagcx
cyber-pioneer Apr 29, 2025
f497249
polish code
cyber-pioneer Apr 29, 2025
89cbc65
polish copyright
cyber-pioneer Apr 29, 2025
5c65a78
polish code
cyber-pioneer Apr 29, 2025
adc03c3
fix code
cyber-pioneer Apr 29, 2025
0df9f75
polish code
cyber-pioneer Apr 29, 2025
47ac748
polish code
cyber-pioneer Apr 29, 2025
01680c5
polish code
cyber-pioneer Apr 29, 2025
058cf50
fix code
cyber-pioneer Apr 29, 2025
23a4318
fix code
cyber-pioneer Apr 29, 2025
38d2b73
polish code
cyber-pioneer Apr 29, 2025
12a8154
fix code
cyber-pioneer Apr 29, 2025
f070e96
polish code
cyber-pioneer Apr 29, 2025
b061d00
polish code
cyber-pioneer Apr 29, 2025
cd70188
polish name
cyber-pioneer Apr 29, 2025
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
36 changes: 36 additions & 0 deletions examples/qwen/conf/config_qwen2.5_7b_disagg_xpyd.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,36 @@
# Hydra-style experiment config: serve task with prefill/decode
# disaggregation enabled (2 prefill + 2 decode instances configured below).
# NOTE(review): the nesting of task/deploy/runner/envs/cmds under
# `experiment` is reconstructed from a flattened copy; exp_name/exp_dir must
# live under `experiment` because of the ${experiment.*} interpolations.
# Confirm the remaining placement against the consumer's schema.
defaults:
  - _self_
  - serve: serve_qwen2.5_7b

experiment:
  exp_name: qwen2.5_7b
  # Output directory is derived from the experiment name.
  exp_dir: outputs/${experiment.exp_name}
  task:
    type: serve
  deploy:
    port: 10001
    use_fs_serve: false
    prefill_decode_disaggregation: true
    prefill_num: 2
    prefill_address: x.x.x.x  # optional, default "auto"
    decode_num: 2
    decode_address: x.x.x.x  # optional, default "auto"
  runner:
    hostfile: examples/qwen/conf/hostfile.txt
    docker: fr-v2
  envs:
    # Values are unquoted, so a YAML loader yields int/bool here, not strings.
    # NOTE(review): quote them if the launcher needs exact string values.
    CUDA_DEVICE_MAX_CONNECTIONS: 1
    VLLM_USE_V1: 0
    FLAGCX_SOCKET_IFNAME: bond0
    # Placeholder path; replace with the local FlagCX location.
    FLAGCX_PATH: /path/to/FlagCX/
    FLAGCX_DEBUG: TRACE
    FLAGCX_DEBUG_SUBSYS: ALL
    USE_FLAGCX: true
  cmds:
    before_start: source /root/miniconda3/bin/activate flagscale-inference

action: run

hydra:
  run:
    # Hydra's per-run working directory, placed inside the experiment dir.
    dir: ${experiment.exp_dir}/hydra
5 changes: 5 additions & 0 deletions examples/qwen/conf/hostfile.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
# Format: <ip> slots=<n> type=<xxx>   (the type field is optional)
# master node
x.x.x.x slots=8 type=gpu
# worker nodes
x.x.x.x slots=8 type=gpu
1 change: 1 addition & 0 deletions examples/qwen/conf/serve/serve_qwen2.5_7b.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -2,6 +2,7 @@
engine: vllm
engine_args:
model: /models/Qwen2.5-7B-Instruct
host: 0.0.0.0
tensor_parallel_size: 1
pipeline_parallel_size: 1
gpu_memory_utilization: 0.9
Expand Down
Loading
Loading