From df3fe8137b88fececae5bc629022044f70a25edc Mon Sep 17 00:00:00 2001 From: sarthaks95 <13473111+sarthaks95@users.noreply.github.com> Date: Tue, 25 Feb 2025 18:23:49 +0530 Subject: [PATCH] Update Dockerfile - llm-optimized-inference version (#3864) --- .../foundation-model-inference/context/Dockerfile | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/assets/training/model_management/environments/foundation-model-inference/context/Dockerfile b/assets/training/model_management/environments/foundation-model-inference/context/Dockerfile index 80960f23fa..dd9fe45562 100644 --- a/assets/training/model_management/environments/foundation-model-inference/context/Dockerfile +++ b/assets/training/model_management/environments/foundation-model-inference/context/Dockerfile @@ -48,7 +48,7 @@ RUN pip install git+https://github.com/stanford-futuredata/megablocks.git@5897cd # RUN pip install -e ./ --no-cache-dir # When copied to assets repo, change to install from public pypi -RUN pip install llm-optimized-inference==0.2.17 --no-cache-dir +RUN pip install llm-optimized-inference==0.2.19 --no-cache-dir RUN pip uninstall -y vllm RUN pip install https://automlsamplenotebookdata.blob.core.windows.net/vllm/vllm-0.6.3.post1+cu122-cp310-cp310-linux_x86_64.whl @@ -63,4 +63,4 @@ RUN chmod +x /var/runit/api_server/run ENV SVDIR=/var/runit ENV WORKER_TIMEOUT=3600 EXPOSE 5001 -CMD [ "runsvdir", "/var/runit" ] \ No newline at end of file +CMD [ "runsvdir", "/var/runit" ]