diff --git a/assets/training/model_management/environments/foundation-model-inference/context/Dockerfile b/assets/training/model_management/environments/foundation-model-inference/context/Dockerfile index 06de296d62..cf7264e6a3 100644 --- a/assets/training/model_management/environments/foundation-model-inference/context/Dockerfile +++ b/assets/training/model_management/environments/foundation-model-inference/context/Dockerfile @@ -48,12 +48,13 @@ RUN pip install git+https://github.com/stanford-futuredata/megablocks.git@5897cd # RUN pip install -e ./ --no-cache-dir # When copied to assets repo, change to install from public pypi -RUN pip install llm-optimized-inference==0.2.7 --no-cache-dir +RUN pip install llm-optimized-inference==0.2.16 --no-cache-dir +# Swap vllm and transformers for pinned releases; install without the pip cache because the cache cleanup below runs in a later layer and cannot shrink these layers. +RUN pip uninstall transformers -y RUN pip uninstall -y vllm - -# Install patched vllm wheel -RUN pip install https://automlsamplenotebookdata.blob.core.windows.net/vllm/vllm-0.5.3.post1-cp310-cp310-linux_x86_64.whl +RUN pip install vllm==0.6.1.post2 --no-cache-dir +RUN pip install transformers==4.46.2 --no-cache-dir # clean conda and pip caches RUN rm -rf ~/.cache/pip