From df01c0cfbe330b94d311d4083d40fa9d8246c602 Mon Sep 17 00:00:00 2001
From: Atinoda <61033436+Atinoda@users.noreply.github.com>
Date: Fri, 26 Jul 2024 20:41:51 +0100
Subject: [PATCH] Add default-nvidia-tensorrtllm variant

---
 Dockerfile | 18 ++++++++++++++++++
 1 file changed, 18 insertions(+)

diff --git a/Dockerfile b/Dockerfile
index 4a74269..2b4c879 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -183,6 +183,24 @@ RUN echo "Nvidia Extended (No AVX2)" > /variant.txt
 ENV EXTRA_LAUNCH_ARGS=""
 CMD ["python3", "/app/server.py"]
 
+# Extended with TensorRT-LLM
+FROM run_base AS default-nvidia-tensorrtllm
+# Copy venv
+COPY --from=app_nvidia_x $VIRTUAL_ENV $VIRTUAL_ENV
+# Install TensorRT-LLM: OpenMPI packages from apt, then the pinned pip package
+# Refresh the package index in the same layer as the install and remove it afterwards
+RUN apt-get update && \
+    apt-get install -y openmpi-bin libopenmpi-dev && \
+    rm -rf /var/lib/apt/lists/*
+RUN pip3 install --no-cache-dir tensorrt_llm==0.10.0 -U --pre --extra-index-url https://pypi.nvidia.com
+# Prepend the system library directory; the previous value is appended only when set,
+# so an unset LD_LIBRARY_PATH does not leave a trailing ':' (an empty entry means the current directory)
+ENV LD_LIBRARY_PATH=/usr/lib/x86_64-linux-gnu${LD_LIBRARY_PATH:+:$LD_LIBRARY_PATH}
+# Variant parameters
+RUN echo "Nvidia Extended (TensorRT-LLM)" > /variant.txt
+ENV EXTRA_LAUNCH_ARGS=""
+CMD ["python3", "/app/server.py"]
+
 # ROCM
 # Base