From 8e73ce1d42a9232e08201d82692bc5edea275f31 Mon Sep 17 00:00:00 2001
From: Phil
Date: Wed, 10 Jul 2024 23:05:49 +0200
Subject: [PATCH] Add triton P100 FP16 patch - experimental (not tested if working)

---
Reviewer notes (free-form text between the "---" marker and the diff is
ignored when the patch is applied and does not enter the commit message):

* The single hunk appends one RUN step to the Dockerfile, placed after the
  ENTRYPOINT instruction and the closing "OPENAI API SERVER" banner.
* The step runs `pip install --force-reinstall triton` with
  https://sasha0552.github.io/vllm-ci/ supplied as an extra package index and
  /root/.cache/pip provided as a BuildKit cache mount.
* No version specifier is given for `triton`, so the version installed is
  whatever pip resolves at build time.
  TODO(review): pin an exact version once the patched build is confirmed.
* The subject line marks this change as experimental and untested.

 Dockerfile | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/Dockerfile b/Dockerfile
index e71f6e230e19a..a4dae9933af89 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -205,3 +205,7 @@ ENV VLLM_USAGE_SOURCE production-docker-image
 
 ENTRYPOINT ["python3", "-m", "vllm.entrypoints.openai.api_server"]
 #################### OPENAI API SERVER ####################
+
+# patch triton for P100 FP16
+RUN --mount=type=cache,target=/root/.cache/pip \
+    python3 -m pip install --extra-index-url https://sasha0552.github.io/vllm-ci/ --force-reinstall triton