Skip to content

Commit c3945df

Browse files
committed
Enable Prometheus and Grafana in the Docker Compose telemetry.yaml files
Signed-off-by: Tsai, Louie <louie.tsai@intel.com>
1 parent 12657ac commit c3945df

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

41 files changed

+106217
-8
lines changed

ChatQnA/README.md

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -70,11 +70,11 @@ To set up environment variables for deploying ChatQnA services, follow these ste
7070
# on Gaudi
7171
cd GenAIExamples/ChatQnA/docker_compose/intel/hpu/gaudi/
7272
source ./set_env.sh
73-
export no_proxy="Your_No_Proxy",chatqna-gaudi-ui-server,chatqna-gaudi-backend-server,dataprep-redis-service,tei-embedding-service,retriever,tei-reranking-service,tgi-service,vllm-service,guardrails
73+
export no_proxy="Your_No_Proxy",chatqna-gaudi-ui-server,chatqna-gaudi-backend-server,dataprep-redis-service,tei-embedding-service,retriever,tei-reranking-service,tgi-service,vllm-service,guardrails,jaeger,prometheus,grafana,gaudi-node-exporter-1
7474
# on Xeon
7575
cd GenAIExamples/ChatQnA/docker_compose/intel/cpu/xeon/
7676
source ./set_env.sh
77-
export no_proxy="Your_No_Proxy",chatqna-xeon-ui-server,chatqna-xeon-backend-server,dataprep-redis-service,tei-embedding-service,retriever,tei-reranking-service,tgi-service,vllm-service
77+
export no_proxy="Your_No_Proxy",chatqna-xeon-ui-server,chatqna-xeon-backend-server,dataprep-redis-service,tei-embedding-service,retriever,tei-reranking-service,tgi-service,vllm-service,jaeger,prometheus,grafana,xeon-node-exporter-1
7878
# on Nvidia GPU
7979
cd GenAIExamples/ChatQnA/docker_compose/nvidia/gpu
8080
source ./set_env.sh

ChatQnA/docker_compose/intel/cpu/xeon/compose.telemetry.yaml

Lines changed: 56 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -4,8 +4,17 @@
44
services:
55
tei-embedding-service:
66
command: --model-id ${EMBEDDING_MODEL_ID} --auto-truncate --otlp-endpoint $OTEL_EXPORTER_OTLP_TRACES_ENDPOINT
7+
environment:
8+
- TELEMETRY_ENDPOINT=${TELEMETRY_ENDPOINT}
79
tei-reranking-service:
810
command: --model-id ${RERANK_MODEL_ID} --auto-truncate --otlp-endpoint $OTEL_EXPORTER_OTLP_TRACES_ENDPOINT
11+
environment:
12+
- TELEMETRY_ENDPOINT=${TELEMETRY_ENDPOINT}
13+
# vllm-service:
14+
# command: --model $LLM_MODEL_ID --host 0.0.0.0 --port 80 --otlp-traces-endpoint $OTEL_EXPORTER_OTLP_TRACES_ENDPOINT
15+
chatqna-xeon-backend-server:
16+
environment:
17+
- TELEMETRY_ENDPOINT=${TELEMETRY_ENDPOINT}
918
jaeger:
1019
image: jaegertracing/all-in-one:latest
1120
container_name: jaeger
@@ -21,7 +30,51 @@ services:
2130
https_proxy: ${https_proxy}
2231
COLLECTOR_ZIPKIN_HOST_PORT: 9411
2332
restart: unless-stopped
24-
chatqna-xeon-backend-server:
33+
prometheus:
34+
image: prom/prometheus:v2.52.0
35+
container_name: prometheus
36+
user: root
37+
volumes:
38+
- ./prometheus.yaml:/etc/prometheus/prometheus.yaml
39+
- ./prometheus_data:/prometheus
40+
command:
41+
- '--config.file=/etc/prometheus/prometheus.yaml'
42+
ports:
43+
- '9090:9090'
44+
ipc: host
45+
restart: unless-stopped
46+
grafana:
47+
image: grafana/grafana:11.0.0
48+
container_name: grafana
49+
volumes:
50+
- ./grafana_data:/var/lib/grafana
51+
- ./grafana/dashboards:/var/lib/grafana/dashboards
52+
- ./grafana/provisioning:/etc/grafana/provisioning
53+
user: root
2554
environment:
26-
- ENABLE_OPEA_TELEMETRY=true
27-
- TELEMETRY_ENDPOINT=${TELEMETRY_ENDPOINT}
55+
GF_SECURITY_ADMIN_PASSWORD: admin
56+
GF_RENDERING_CALLBACK_URL: http://grafana:3000/
57+
GF_LOG_FILTERS: rendering:debug
58+
depends_on:
59+
- prometheus
60+
ports:
61+
- '3000:3000'
62+
ipc: host
63+
restart: unless-stopped
64+
node-exporter:
65+
image: prom/node-exporter
66+
container_name: node-exporter
67+
volumes:
68+
- /proc:/host/proc:ro
69+
- /sys:/host/sys:ro
70+
- /:/rootfs:ro
71+
command:
72+
- '--path.procfs=/host/proc'
73+
- '--path.sysfs=/host/sys'
74+
- --collector.filesystem.ignored-mount-points
75+
- "^/(sys|proc|dev|host|etc|rootfs/var/lib/docker/containers|rootfs/var/lib/docker/overlay2|rootfs/run/docker/netns|rootfs/var/lib/docker/aufs)($$|/)"
76+
ports:
77+
- 9100:9100
78+
restart: always
79+
deploy:
80+
mode: global

ChatQnA/docker_compose/intel/cpu/xeon/compose_tgi.telemetry.yaml

Lines changed: 56 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -4,10 +4,19 @@
44
services:
55
tei-embedding-service:
66
command: --model-id ${EMBEDDING_MODEL_ID} --auto-truncate --otlp-endpoint $OTEL_EXPORTER_OTLP_TRACES_ENDPOINT
7+
environment:
8+
- TELEMETRY_ENDPOINT=${TELEMETRY_ENDPOINT}
79
tei-reranking-service:
810
command: --model-id ${RERANK_MODEL_ID} --auto-truncate --otlp-endpoint $OTEL_EXPORTER_OTLP_TRACES_ENDPOINT
11+
environment:
12+
- TELEMETRY_ENDPOINT=${TELEMETRY_ENDPOINT}
913
tgi-service:
1014
command: --model-id ${LLM_MODEL_ID} --cuda-graphs 0 --otlp-endpoint $OTEL_EXPORTER_OTLP_TRACES_ENDPOINT
15+
environment:
16+
- TELEMETRY_ENDPOINT=${TELEMETRY_ENDPOINT}
17+
chatqna-xeon-backend-server:
18+
environment:
19+
- TELEMETRY_ENDPOINT=${TELEMETRY_ENDPOINT}
1120
jaeger:
1221
image: jaegertracing/all-in-one:latest
1322
container_name: jaeger
@@ -23,7 +32,51 @@ services:
2332
https_proxy: ${https_proxy}
2433
COLLECTOR_ZIPKIN_HOST_PORT: 9411
2534
restart: unless-stopped
26-
chatqna-xeon-backend-server:
35+
prometheus:
36+
image: prom/prometheus:v2.52.0
37+
container_name: prometheus
38+
user: root
39+
volumes:
40+
- ./prometheus.yaml:/etc/prometheus/prometheus.yaml
41+
- ./prometheus_data:/prometheus
42+
command:
43+
- '--config.file=/etc/prometheus/prometheus.yaml'
44+
ports:
45+
- '9090:9090'
46+
ipc: host
47+
restart: unless-stopped
48+
grafana:
49+
image: grafana/grafana:11.0.0
50+
container_name: grafana
51+
volumes:
52+
- ./grafana_data:/var/lib/grafana
53+
- ./grafana/dashboards:/var/lib/grafana/dashboards
54+
- ./grafana/provisioning:/etc/grafana/provisioning
55+
user: root
2756
environment:
28-
- ENABLE_OPEA_TELEMETRY=true
29-
- TELEMETRY_ENDPOINT=${TELEMETRY_ENDPOINT}
57+
GF_SECURITY_ADMIN_PASSWORD: admin
58+
GF_RENDERING_CALLBACK_URL: http://grafana:3000/
59+
GF_LOG_FILTERS: rendering:debug
60+
depends_on:
61+
- prometheus
62+
ports:
63+
- '3000:3000'
64+
ipc: host
65+
restart: unless-stopped
66+
node-exporter:
67+
image: prom/node-exporter
68+
container_name: node-exporter
69+
volumes:
70+
- /proc:/host/proc:ro
71+
- /sys:/host/sys:ro
72+
- /:/rootfs:ro
73+
command:
74+
- '--path.procfs=/host/proc'
75+
- '--path.sysfs=/host/sys'
76+
- --collector.filesystem.ignored-mount-points
77+
- "^/(sys|proc|dev|host|etc|rootfs/var/lib/docker/containers|rootfs/var/lib/docker/overlay2|rootfs/run/docker/netns|rootfs/var/lib/docker/aufs)($$|/)"
78+
ports:
79+
- 9100:9100
80+
restart: always
81+
deploy:
82+
mode: global

0 commit comments

Comments
 (0)