Skip to content

Commit dbb4caa

Browse files
docs: Remove TRTLLM_USE_NIXL_KVCACHE and TRTLLM_USE_UCX_KVCACHE environment variables (#2231)
1 parent e5fa8b6 commit dbb4caa

File tree

3 files changed

+1
-39
lines changed

3 files changed

+1
-39
lines changed

components/backends/trtllm/kv-cache-tranfer.md

Lines changed: 1 addition & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -61,10 +61,4 @@ To enable NIXL for KV cache transfer in disaggregated serving:
6161
4. **Send the request:**
6262
See the [client](./README.md#client) section to learn how to send a request to the deployment.
6363

64-
**Important:** Ensure that ETCD and NATS services are running before starting the service.
65-
66-
The container will automatically configure the appropriate environment variables (`TRTLLM_USE_NIXL_KVCACHE=1`) when built with the NIXL flag. The same container image can be used to use UCX for KV cache transfer.
67-
```bash
68-
unset TRTLLM_USE_NIXL_KVCACHE
69-
export TRTLLM_USE_UCX_KVCACHE=1
70-
```
64+
**Important:** Ensure that ETCD and NATS services are running before starting the service.

components/backends/trtllm/multinode/start_trtllm_worker.sh

Lines changed: 0 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -22,13 +22,6 @@ if [[ -z ${ENGINE_CONFIG} ]]; then
2222
exit 1
2323
fi
2424

25-
# NOTE: When this script is run directly from srun, the environment variables
26-
# for TRTLLM KV cache are not set. So we need to set them here.
27-
# Related issue: https://github.com/ai-dynamo/dynamo/issues/1743
28-
if [[ -z ${TRTLLM_USE_UCX_KVCACHE} ]] && [[ -z ${TRTLLM_USE_NIXL_KVCACHE} ]]; then
29-
export TRTLLM_USE_UCX_KVCACHE=1
30-
fi
31-
3225
EXTRA_ARGS=""
3326
if [[ -n ${DISAGGREGATION_MODE} ]]; then
3427
EXTRA_ARGS+="--disaggregation-mode ${DISAGGREGATION_MODE} "

container/Dockerfile.tensorrt_llm

Lines changed: 0 additions & 25 deletions
Original file line numberDiff line numberDiff line change
@@ -332,26 +332,6 @@ RUN pip install dist/ai_dynamo_runtime*cp312*.whl && \
332332
pip install dist/ai_dynamo*any.whl
333333

334334
ENV DYNAMO_HOME=/workspace
335-
336-
# Use UCX for TRTLLM KV Cache Transfer
337-
ARG TRTLLM_USE_NIXL_KVCACHE_EXPERIMENTAL
338-
ENV TRTLLM_USE_UCX_KVCACHE=1
339-
340-
# Create a script that sets the environment variables and source it.
341-
# If TRTLLM_USE_NIXL_KVCACHE_EXPERIMENTAL is set to 1, unset TRTLLM_USE_UCX_KVCACHE
342-
# and set TRTLLM_USE_NIXL_KVCACHE to 1.
343-
RUN echo '#!/bin/bash' > /usr/local/bin/set_trtllm_env.sh && \
344-
if [ "$TRTLLM_USE_NIXL_KVCACHE_EXPERIMENTAL" = "1" ]; then \
345-
echo 'unset TRTLLM_USE_UCX_KVCACHE' >> /usr/local/bin/set_trtllm_env.sh; \
346-
echo 'export TRTLLM_USE_NIXL_KVCACHE=1' >> /usr/local/bin/set_trtllm_env.sh; \
347-
else \
348-
echo '# TRTLLM_USE_UCX_KVCACHE should already be set to 1' >> /usr/local/bin/set_trtllm_env.sh; \
349-
fi && \
350-
chmod +x /usr/local/bin/set_trtllm_env.sh
351-
352-
# Source the script in bashrc
353-
RUN echo 'source /usr/local/bin/set_trtllm_env.sh' >> /root/.bashrc
354-
355335
# Copy launch banner
356336
RUN --mount=type=bind,source=./container/launch_message.txt,target=/workspace/launch_message.txt \
357337
sed '/^#\s/d' /workspace/launch_message.txt > ~/.launch_screen && \
@@ -501,11 +481,6 @@ RUN uv pip install --extra-index-url "${TENSORRTLLM_INDEX_URL}" \
501481
"${TENSORRTLLM_PIP_WHEEL}" && \
502482
uv pip install ai-dynamo nixl --find-links wheelhouse
503483

504-
# Setup TRTLLM environment variables, same as in dev image
505-
ENV TRTLLM_USE_UCX_KVCACHE=1
506-
COPY --from=dev /usr/local/bin/set_trtllm_env.sh /usr/local/bin/set_trtllm_env.sh
507-
RUN echo 'source /usr/local/bin/set_trtllm_env.sh' >> /root/.bashrc
508-
509484
# Copy benchmarks, backends and tests for CI
510485
# TODO: Remove this once we have a functional CI image built on top of the runtime image
511486
COPY tests /workspace/tests

0 commit comments

Comments
 (0)