From edbbfd4326a5d32bf7a855bfbc22f0ae24437b39 Mon Sep 17 00:00:00 2001 From: Robert Yang <141875536+ydm-amazon@users.noreply.github.com> Date: Mon, 5 Aug 2024 13:46:53 -0700 Subject: [PATCH] dockerfile versions non nightly (#2277) --- serving/docker/lmi.Dockerfile | 2 +- serving/docker/pytorch-inf2.Dockerfile | 2 +- serving/docker/tensorrt-llm.Dockerfile | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/serving/docker/lmi.Dockerfile b/serving/docker/lmi.Dockerfile index 0d08e3e6d..380c21e30 100644 --- a/serving/docker/lmi.Dockerfile +++ b/serving/docker/lmi.Dockerfile @@ -36,7 +36,7 @@ ARG vllm_wheel="https://publish.djl.ai/vllm/cu124-pt231/vllm-0.5.3.post1%2Bcu124 ARG flash_attn_2_wheel="https://github.com/vllm-project/flash-attention/releases/download/v2.5.9.post1/vllm_flash_attn-2.5.9.post1-cp310-cp310-manylinux1_x86_64.whl" ARG flash_infer_wheel="https://github.com/flashinfer-ai/flashinfer/releases/download/v0.0.9/flashinfer-0.0.9+cu121torch2.3-cp310-cp310-linux_x86_64.whl" # %2B is the url escape for the '+' character -ARG lmi_dist_wheel="https://publish.djl.ai/lmi_dist/lmi_dist-11.0.0%2Bnightly-py3-none-any.whl" +ARG lmi_dist_wheel="https://publish.djl.ai/lmi_dist/lmi_dist-11.0.0-py3-none-any.whl" ARG seq_scheduler_wheel="https://publish.djl.ai/seq_scheduler/seq_scheduler-0.1.0-py3-none-any.whl" ARG peft_version=0.11.1 diff --git a/serving/docker/pytorch-inf2.Dockerfile b/serving/docker/pytorch-inf2.Dockerfile index 833064d2e..44af2ca76 100644 --- a/serving/docker/pytorch-inf2.Dockerfile +++ b/serving/docker/pytorch-inf2.Dockerfile @@ -26,7 +26,7 @@ ARG diffusers_version=0.28.2 ARG pydantic_version=2.6.1 ARG optimum_neuron_version=0.0.23 # %2B is the url escape for the '+' character -ARG vllm_wheel="https://publish.djl.ai/neuron_vllm/vllm-0.5.0%2Bnightly-py3-none-any.whl" +ARG vllm_wheel="https://publish.djl.ai/neuron_vllm/vllm-0.5.0-py3-none-any.whl" EXPOSE 8080 # Sets up Path for Neuron tools diff --git a/serving/docker/tensorrt-llm.Dockerfile b/serving/docker/tensorrt-llm.Dockerfile index 09a8b6002..523d3a311 100644 --- a/serving/docker/tensorrt-llm.Dockerfile +++ b/serving/docker/tensorrt-llm.Dockerfile @@ -19,7 +19,7 @@ ARG transformers_version=4.42.4 ARG accelerate_version=0.32.1 ARG tensorrtlibs_version=10.1.0 # %2B is the url escape for the '+' character -ARG trtllm_toolkit_version=0.11.0%2Bnightly +ARG trtllm_toolkit_version=0.11.0 ARG trtllm_version=v0.11.0 ARG cuda_python_version=12.4 ARG peft_version=0.10.0