From 9bdd726f2b43f31e0bb2959a2f48253edf896b85 Mon Sep 17 00:00:00 2001 From: Liren Tu Date: Wed, 11 Dec 2024 01:31:04 -0800 Subject: [PATCH 1/2] Adjust launch arguments for 1b 6gb --- docker-compose.yaml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/docker-compose.yaml b/docker-compose.yaml index 24d7e38..27a596c 100644 --- a/docker-compose.yaml +++ b/docker-compose.yaml @@ -26,11 +26,11 @@ services: - --gpu-memory-utilization - "0.70" - --max-model-len - - "32768" + - "2048" - --max-num-seqs - - "750" + - "100" - --max-seq-len-to-capture - - "32768" + - "2048" depends_on: - liquid-labs-model-volume # This is equivalent to "runtime: nvidia", but does not require From 50899dbf5889f1a97c45afa39a158610470a0513 Mon Sep 17 00:00:00 2001 From: Liren Tu Date: Wed, 11 Dec 2024 01:32:04 -0800 Subject: [PATCH 2/2] Update stack and model image --- launch.sh | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/launch.sh b/launch.sh index dab147b..f4cb5ff 100755 --- a/launch.sh +++ b/launch.sh @@ -50,8 +50,8 @@ set_and_export_env_var "JWT_SECRET" "$(generate_random_string 64)" set_and_export_env_var "API_SECRET" "$(generate_random_string 64)" set_and_export_env_var "AUTH_SECRET" "$(generate_random_string 64)" -set_and_export_env_var "STACK_VERSION" "2b3f969864" -set_and_export_env_var "MODEL_IMAGE" "liquidai/lfm-3be:0.0.6" +set_and_export_env_var "STACK_VERSION" "2685ff757d" +set_and_export_env_var "MODEL_IMAGE" "liquidai/lfm-1be:0.0.1" MODEL_NAME=Liquid-$(extract_model_name "$MODEL_IMAGE") set_and_export_env_var "MODEL_NAME" "$MODEL_NAME" true