Reduce ray job cold time #825

Open · wants to merge 27 commits into main from agpituk/694-reduce-ray-job-cold-time
Changes from 19 commits (27 commits total)

Commits
0ea7a00
Initial push to reduce loading time for bart
agpituk Feb 7, 2025
2100cfc
Improved model download
agpituk Feb 7, 2025
cac5994
merged main
agpituk Feb 7, 2025
cf4aad0
merged main
agpituk Feb 10, 2025
bc691ad
Merge branch 'main' into agpituk/694-reduce-ray-job-cold-time
agpituk Feb 11, 2025
c52b25c
Multiplatform build for cache image - added readme info
agpituk Feb 13, 2025
047193b
Merged main
agpituk Feb 13, 2025
0373e5c
Merge branch 'main' into agpituk/694-reduce-ray-job-cold-time
agpituk Feb 13, 2025
edb2899
Increase lumigator runner size
agpituk Feb 14, 2025
dad7db7
Fixed missing s
agpituk Feb 14, 2025
dc77037
Merge branch 'main' into agpituk/694-reduce-ray-job-cold-time
agpituk Feb 14, 2025
640f7df
Merged Main
agpituk Feb 14, 2025
93fbe69
Merge branch 'main' into agpituk/694-reduce-ray-job-cold-time
agpituk Feb 14, 2025
c201dcb
Adding removed label to the redis volume
agpituk Feb 14, 2025
dddf260
Merge branch 'main' into agpituk/694-reduce-ray-job-cold-time
agpituk Feb 14, 2025
8ed4552
Removing docker-compose volume for ray to check if it's introducing t…
agpituk Feb 17, 2025
62ba702
Deleting volume in Dockerfile + adding cache volume to Ray
macaab26 Feb 17, 2025
eff24b9
Merge branch 'main' into agpituk/694-reduce-ray-job-cold-time
agpituk Feb 17, 2025
018b808
Merge branch 'main' into agpituk/694-reduce-ray-job-cold-time
agpituk Feb 17, 2025
c74bb1e
precommit fixes
agpituk Feb 19, 2025
5601431
Merge branch 'main' into agpituk/694-reduce-ray-job-cold-time
agpituk Feb 19, 2025
24a37f2
Moved new vars into the new build system, out of docker-compose
agpituk Feb 19, 2025
a1794d9
Reduce unnecesary comments
agpituk Feb 19, 2025
e5de144
Merged main
agpituk Feb 19, 2025
535d4eb
Fix some comments
agpituk Feb 19, 2025
4bf78ff
Merge branch 'main' into agpituk/694-reduce-ray-job-cold-time
agpituk Feb 21, 2025
3b1c63c
Fixes to enable model preloading (#973)
aittalam Feb 21, 2025
6 changes: 3 additions & 3 deletions .github/workflows/lumigator_pipeline.yaml
@@ -58,7 +58,7 @@ jobs:

integration-tests:
name: Integration tests (SQLite)
- runs-on: ubuntu-latest
+ runs-on: lumigator-integration-tests-runner
needs: lint
if: ${{ needs.lint.result == 'success' }}
strategy:
@@ -105,7 +105,7 @@ jobs:

integration-tests-postgres:
name: Integration tests (PostgreSQL)
- runs-on: ubuntu-latest
+ runs-on: lumigator-integration-tests-runner
needs: lint
if: ${{ needs.lint.result == 'success' }}
strategy:
@@ -153,7 +153,7 @@ jobs:

notebook-integration-test:
name: Notebook integration tests
- runs-on: ubuntu-latest
+ runs-on: lumigator-integration-tests-runner
needs: lint
if: ${{ needs.lint.result == 'success' }}
steps:
10 changes: 5 additions & 5 deletions Makefile
@@ -111,7 +111,7 @@ endef
# Launches Lumigator in 'development' mode (all services running locally, code mounted in)
local-up: config-generate-env
uv run pre-commit install
- RAY_ARCH_SUFFIX=$(RAY_ARCH_SUFFIX) COMPUTE_TYPE=$(COMPUTE_TYPE) docker compose --env-file "$(CONFIG_BUILD_DIR)/.env" --profile local $(GPU_COMPOSE) -f $(LOCAL_DOCKERCOMPOSE_FILE) -f $(DEV_DOCKER_COMPOSE_FILE) up --watch --build
+ RAY_ARCH_SUFFIX=$(RAY_ARCH_SUFFIX) ARCH=${ARCH} COMPUTE_TYPE=$(COMPUTE_TYPE) docker compose --env-file "$(CONFIG_BUILD_DIR)/.env" --profile local $(GPU_COMPOSE) -f $(LOCAL_DOCKERCOMPOSE_FILE) -f $(DEV_DOCKER_COMPOSE_FILE) up --watch --build

local-down: config-generate-env
docker compose --env-file "$(CONFIG_BUILD_DIR)/.env" --profile local $(GPU_COMPOSE) -f $(LOCAL_DOCKERCOMPOSE_FILE) -f ${DEV_DOCKER_COMPOSE_FILE} down
@@ -130,18 +130,18 @@ start-lumigator: config-generate-env

# Launches lumigator with no code mounted in, and forces build of containers (used in CI for integration tests)
start-lumigator-build: config-generate-env
- RAY_ARCH_SUFFIX=$(RAY_ARCH_SUFFIX) COMPUTE_TYPE=$(COMPUTE_TYPE) docker compose --env-file "$(CONFIG_BUILD_DIR)/.env" --profile local $(GPU_COMPOSE) -f $(LOCAL_DOCKERCOMPOSE_FILE) up -d --build
+ RAY_ARCH_SUFFIX=$(RAY_ARCH_SUFFIX) ARCH=${ARCH} COMPUTE_TYPE=$(COMPUTE_TYPE) docker compose --env-file "$(CONFIG_BUILD_DIR)/.env" --profile local $(GPU_COMPOSE) -f $(LOCAL_DOCKERCOMPOSE_FILE) up -d --build

# Launches lumigator with no code mounted in, and forces build of containers (used in CI for integration tests)
start-lumigator-build-postgres: config-generate-env
- RAY_ARCH_SUFFIX=$(RAY_ARCH_SUFFIX) COMPUTE_TYPE=$(COMPUTE_TYPE) docker compose --env-file "$(CONFIG_BUILD_DIR)/.env" --profile local $(GPU_COMPOSE) -f $(LOCAL_DOCKERCOMPOSE_FILE) -f $(POSTGRES_DOCKER_COMPOSE_FILE) up -d --build
+ RAY_ARCH_SUFFIX=$(RAY_ARCH_SUFFIX) ARCH=${ARCH} COMPUTE_TYPE=$(COMPUTE_TYPE) docker compose --env-file "$(CONFIG_BUILD_DIR)/.env" --profile local $(GPU_COMPOSE) -f $(LOCAL_DOCKERCOMPOSE_FILE) -f $(POSTGRES_DOCKER_COMPOSE_FILE) up -d --build

# Launches lumigator without local dependencies (ray, S3)
start-lumigator-external-services: config-generate-env
- docker compose --env-file "$(CONFIG_BUILD_DIR)/.env"$(GPU_COMPOSE) -f $(LOCAL_DOCKERCOMPOSE_FILE) up -d
+ ARCH=${ARCH} docker compose --env-file "$(CONFIG_BUILD_DIR)/.env"$(GPU_COMPOSE) -f $(LOCAL_DOCKERCOMPOSE_FILE) up -d

stop-lumigator: config-generate-env
- RAY_ARCH_SUFFIX=$(RAY_ARCH_SUFFIX) COMPUTE_TYPE=$(COMPUTE_TYPE) docker compose --env-file "$(CONFIG_BUILD_DIR)/.env" --profile local $(GPU_COMPOSE) -f $(LOCAL_DOCKERCOMPOSE_FILE) -f $(POSTGRES_DOCKER_COMPOSE_FILE) down
+ ARCH=${ARCH} RAY_ARCH_SUFFIX=$(RAY_ARCH_SUFFIX) COMPUTE_TYPE=$(COMPUTE_TYPE) docker compose --env-file "$(CONFIG_BUILD_DIR)/.env" --profile local $(GPU_COMPOSE) -f $(LOCAL_DOCKERCOMPOSE_FILE) -f $(POSTGRES_DOCKER_COMPOSE_FILE) down
$(call remove_config_dir)

clean-docker-buildcache:
1 change: 1 addition & 0 deletions README.md
@@ -45,6 +45,7 @@ need to have the following prerequisites installed on your machine:
- On Linux, you need to follow the
[post-installation steps](https://docs.docker.com/engine/install/linux-postinstall/).
- The system Python (version managers such as uv should be deactivated)
+ - At least 10 GB available on disk and allocated for Docker, since some small language models will be pre-downloaded
Member:

I think it'd be great if we added in the docs (1) what models are downloaded (right now it's bart alone, right? I'd suggest roberta-large too for the bertscore metric), (2) their exact size (bart+roberta are less than 3GB), and (3) how this can be disabled if e.g. someone has no intention of ever running bart. WDYT?

Contributor Author:

Bart has to run right now to generate GT, which is why I added it as a kind of mandatory model. As it is, we can't disable it (apart from manually removing the service from docker-compose, which is not very user-friendly, I'd say).
We could maybe add a variable listing the models you want to pre-download into Ray's cache. Would that work?

Member:

Yes, I think that'd be great! For instance, right now we are using roberta-large for bertscore evaluations, so the models are already two, and having a list we could point users to makes it easy for them to customise it. Thank you!


You can run and develop Lumigator locally using Docker Compose. This creates four container
services networked together to make up all the components of the Lumigator application:
19 changes: 19 additions & 0 deletions cache/Dockerfile.model-inference
@@ -0,0 +1,19 @@
# Dockerfile.huggingface-cache
FROM python:3.11-slim

# Install required packages: transformers and huggingface_hub
RUN pip install --no-cache-dir transformers huggingface_hub

# Ensure the cache directory exists (snapshot_download will create its own subfolders)
RUN mkdir -p /home/ray/.cache/huggingface/hub

# Use the huggingface_hub API to download the model exactly as the Hub does.
# This will create a folder with the proper structure (e.g. blobs, refs, snapshots).
RUN python -c "\
from huggingface_hub import snapshot_download; \
model_path = snapshot_download('facebook/bart-large-cnn', cache_dir='/home/ray/.cache/huggingface/hub'); \
print('Model downloaded to:', model_path)\
"

Member:

If we want to have more than one model, perhaps we could have something like

model_names = ["model/1", "model/2", ...]
for model_name in model_names:
    model_path = ...
    print(f"Model {model_name} downloaded to: {model_path}")

WDYT?
(also, I think model_path is relative to the container and might be misleading as the actual path is different)

Contributor Author:

Definitely happy with the addition to have more than 1 model (look at my comment above). Not sure I follow about the path.
In the docker-compose, in this line
- huggingface_cache_vol:/home/ray/.cache/huggingface
we use the same path inside Ray (I did a few tests around this to get it right)

Member:

My bad, sorry, I did not explain it properly!
What I meant is that we are printing "Model downloaded to " with that Python code, and that will be the directory inside the container... which makes no sense to the user, because it is not where they will look for the model if they need it (that is, the volume or the local path, not the container one).
As an example, let's say that we are storing this in the classical HF_HOME path. The user will see a message "Model blahblah downloaded to /home/ray/.cache/huggingface", but that is the folder in the container, not on their host.

# Exit immediately (this container’s only job is to populate the cache)
CMD ["/bin/true"]
23 changes: 19 additions & 4 deletions docker-compose.yaml
@@ -2,6 +2,16 @@ name: lumigator

services:

+  inference-model:
+    build:
+      context: .
+      dockerfile: cache/Dockerfile.model-inference
+    platform: linux/${ARCH}
+    command: /bin/true
+    volumes:
+      - huggingface_cache_vol:/home/ray/.cache/huggingface
+    profiles:
+      - local
minio:
labels:
ai.mozilla.product_name: lumigator
@@ -68,6 +78,8 @@ services:
depends_on:
redis:
condition: service_healthy
+      inference-model:
+        condition: service_completed_successfully
Member:

As this will take a while, what are we planning to do with the other services in the meantime? Options:

  • make all of them depend on ray (might not be needed, we can e.g. still upload datasets or directly check previous experiment results)
  • have something to prevent us from running ray-dependent workflows until ray is up (see the sketch below)
  • none of the above, but clearly communicate to the users that they'll have to wait a bit before running anything that requires ray (not ideal for beginners IMO)
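A minimal sketch of the second option, purely illustrative: poll the Ray dashboard over HTTP and only submit ray-dependent workflows once it answers. It assumes the dashboard is reachable from the caller at `http://localhost:8265` (in this compose file the published port is `${RAY_DASHBOARD_PORT}`), and treats any HTTP 200 as "Ray is up".

```python
# ray_readiness.py (hypothetical) -- block until the Ray dashboard responds.
import time
import urllib.error
import urllib.request

RAY_DASHBOARD_URL = "http://localhost:8265"  # assumption: ${RAY_DASHBOARD_PORT} published as 8265


def wait_for_ray(url: str = RAY_DASHBOARD_URL, timeout_s: float = 300.0, poll_s: float = 5.0) -> bool:
    """Poll the dashboard URL until it returns 200, or give up after timeout_s seconds."""
    deadline = time.monotonic() + timeout_s
    while time.monotonic() < deadline:
        try:
            with urllib.request.urlopen(url, timeout=5) as resp:
                if resp.status == 200:
                    return True
        except (urllib.error.URLError, OSError):
            pass  # dashboard not up yet; keep polling
        time.sleep(poll_s)
    return False


if __name__ == "__main__":
    if not wait_for_ray():
        raise SystemExit("Timed out waiting for Ray to come up")
    print("Ray is up; ray-dependent workflows can be submitted")
```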

ports:
- "6379:6379"
- "${RAY_DASHBOARD_PORT}:${RAY_DASHBOARD_PORT}"
@@ -83,18 +95,18 @@
- -c
- |
set -eaux
- mkdir -p /tmp/ray_pip_cache
+ mkdir -p /home/ray/.cache/ && mkdir -p /tmp/ray_pip_cache
+ sudo chmod -R 777 /home/ray/.cache/ && sudo chmod -R 777 /tmp/ray_pip_cache/ || true
+ RAY_JOB_ALLOW_DRIVER_ON_WORKER_NODES=1 RAY_REDIS_ADDRESS=redis:6379 ray start --head --dashboard-port=${RAY_DASHBOARD_PORT} --port=6379 --dashboard-host=0.0.0.0 --ray-client-server-port 10001
- # If the file was mounted in a volume instead of
- # a shared dir, permissions need to be setup
- # ... || true allows this to fail (-e is set)
- sudo chmod -R 777 /tmp/ray_pip_cache/ || true
- RAY_JOB_ALLOW_DRIVER_ON_WORKER_NODES=1 RAY_REDIS_ADDRESS=redis:6379 ray start --head --dashboard-port=${RAY_DASHBOARD_PORT} --port=6379 --dashboard-host=0.0.0.0 --ray-client-server-port 10001
mkdir -p /tmp/ray/session_latest/runtime_resources/pip
rmdir /tmp/ray/session_latest/runtime_resources/pip/ && ln -s /tmp/ray_pip_cache /tmp/ray/session_latest/runtime_resources/pip
sleep infinity
shm_size: 2g
volumes:
- - ${HOME}/.cache/huggingface:/home/ray/.cache/huggingface
+ - huggingface_cache_vol:/home/ray/.cache/huggingface
Member:

Is there any strong reason for moving this to a volume? This makes lumigator's cache not interoperable with the HF cache (that might already reside on users' machines).

Contributor Author:

This is definitely one of the problems this PR may introduce (on top of slower CI times). I moved this to a volume because we create that volume beforehand, so we ensure the bart model is already there (reducing the time to the first experiment). Without it being a volume, I'm not sure how I could add this to Ray's cache.
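Whichever location wins, the cache contents can be inspected from inside the ray container with `huggingface_hub`'s cache scanner; a small sketch, assuming `huggingface_hub` is importable in that container and the cache is mounted at the path used in this compose file:

```python
# Run inside the ray container (e.g. via `docker compose exec ray python`).
from huggingface_hub import scan_cache_dir

# Path follows the compose mount huggingface_cache_vol:/home/ray/.cache/huggingface
cache = scan_cache_dir(cache_dir="/home/ray/.cache/huggingface/hub")
for repo in cache.repos:
    print(f"{repo.repo_id}: {repo.size_on_disk / 1e9:.2f} GB on disk")
```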

- ray-pip-cache:/tmp/ray_pip_cache
deploy:
resources:
@@ -242,6 +254,9 @@ volumes:
redis-data:
labels:
ai.mozilla.product_name: lumigator
+  huggingface_cache_vol:
+    labels:
+      ai.mozilla.product_name: lumigator
ray-pip-cache:
labels:
ai.mozilla.product_name: lumigator