File tree Expand file tree Collapse file tree 4 files changed +10
-10
lines changed
bindings/python/rust/llm/block_manager/distributed
llm/src/block_manager/storage Expand file tree Collapse file tree 4 files changed +10
-10
lines changed Original file line number Diff line number Diff line change @@ -36,15 +36,15 @@ docker compose -f deploy/metrics/docker-compose.yml up -d
3636./container/run.sh --framework kvbm -it --mount-workspace --use-nixl-gds
3737
3838# enable using kvbm instead of vllm's own kv cache manager
39- export DYNAMO_KVBM_MANAGER=kvbm
39+ export DYN_KVBM_MANAGER=kvbm
4040
4141# enable kv offloading to CPU memory
4242# 4 means 4GB of CPU memory would be used
43- export DYNAMO_KVBM_CPU_CACHE_GB=4
43+ export DYN_KVBM_CPU_CACHE_GB=4
4444
4545# enable kv offloading to disk
4646# 8 means 8GB of disk would be used
47- export DYNAMO_KVBM_DISK_CACHE_GB=8
47+ export DYN_KVBM_DISK_CACHE_GB=8
4848
4949# serve an example LLM model
5050vllm serve deepseek-ai/DeepSeek-R1-Distill-Llama-8B
Original file line number Diff line number Diff line change @@ -7,13 +7,13 @@ use utils::get_barrier_id;
77use derive_getters:: Dissolve ;
88use llm_rs:: block_manager:: distributed:: { KvbmLeader as KvbmLeaderImpl , KvbmLeaderConfig } ;
99
10- const CPU_CACHE: &str = "DYNAMO_KVBM_CPU_CACHE_GB";
11- const CPU_CACHE_OVERRIDE: &str = "DYNAMO_KVBM_CPU_CACHE_OVERRIDE_NUM_BLOCKS";
10+ const CPU_CACHE: &str = "DYN_KVBM_CPU_CACHE_GB";
11+ const CPU_CACHE_OVERRIDE: &str = "DYN_KVBM_CPU_CACHE_OVERRIDE_NUM_BLOCKS";
1212
13- const DISK_CACHE: &str = "DYNAMO_KVBM_DISK_CACHE_GB";
14- const DISK_CACHE_OVERRIDE: &str = "DYNAMO_KVBM_DISK_CACHE_OVERRIDE_NUM_BLOCKS";
13+ const DISK_CACHE: &str = "DYN_KVBM_DISK_CACHE_GB";
14+ const DISK_CACHE_OVERRIDE: &str = "DYN_KVBM_DISK_CACHE_OVERRIDE_NUM_BLOCKS";
1515
16- const LEADER_WORKER_INIT_TIMEOUT_SECS: &str = "DYNAMO_KVBM_LEADER_WORKER_INIT_TIMEOUT_SECS";
16+ const LEADER_WORKER_INIT_TIMEOUT_SECS: &str = "DYN_KVBM_LEADER_WORKER_INIT_TIMEOUT_SECS";
1717const DEFAULT_INIT_TIMEOUT_SECS : u64 = 120 ;
1818
1919fn compute_num_blocks ( cache_size_key : & str , override_key : & str , bytes_per_block : usize ) -> usize {
Original file line number Diff line number Diff line change 22// SPDX-License-Identifier: Apache-2.0
33
44pub fn get_barrier_id ( ) -> String {
5- std::env::var("DYNAMO_KVBM_BARRIER_ID").unwrap_or("kvbm".to_string())
5+ std::env::var("DYN_KVBM_BARRIER_ID").unwrap_or("kvbm".to_string())
66}
Original file line number Diff line number Diff line change @@ -22,7 +22,7 @@ use std::ffi::CStr;
2222use std:: ffi:: CString ;
2323use std:: path:: Path ;
2424
25- const DISK_CACHE_KEY: &str = "DYNAMO_KVBM_DISK_CACHE_DIR";
25+ const DISK_CACHE_KEY: &str = "DYN_KVBM_DISK_CACHE_DIR";
2626const DEFAULT_DISK_CACHE_DIR : & str = "/tmp/" ;
2727
2828#[ derive( Debug ) ]
You can’t perform that action at this time.
0 commit comments