diff --git a/docker-compose.yaml b/docker-compose.yaml index 24d7e38..27a596c 100644 --- a/docker-compose.yaml +++ b/docker-compose.yaml @@ -26,11 +26,11 @@ services: - --gpu-memory-utilization - "0.70" - --max-model-len - - "32768" + - "2048" - --max-num-seqs - - "750" + - "100" - --max-seq-len-to-capture - - "32768" + - "2048" depends_on: - liquid-labs-model-volume # This is equivalent to "runtime: nvidia", but does not require diff --git a/launch.sh b/launch.sh index dab147b..f4cb5ff 100755 --- a/launch.sh +++ b/launch.sh @@ -50,8 +50,8 @@ set_and_export_env_var "JWT_SECRET" "$(generate_random_string 64)" set_and_export_env_var "API_SECRET" "$(generate_random_string 64)" set_and_export_env_var "AUTH_SECRET" "$(generate_random_string 64)" -set_and_export_env_var "STACK_VERSION" "2b3f969864" -set_and_export_env_var "MODEL_IMAGE" "liquidai/lfm-3be:0.0.6" +set_and_export_env_var "STACK_VERSION" "2685ff757d" +set_and_export_env_var "MODEL_IMAGE" "liquidai/lfm-1be:0.0.1" MODEL_NAME=Liquid-$(extract_model_name "$MODEL_IMAGE") set_and_export_env_var "MODEL_NAME" "$MODEL_NAME" true