From df05a43c4b3260a17f685ad3fd0f2d10e8779bb2 Mon Sep 17 00:00:00 2001 From: Xin Yang <105740670+xyang16@users.noreply.github.com> Date: Fri, 29 Mar 2024 13:02:07 -0700 Subject: [PATCH] [0.27.0-dlc] Use fixed versions in dockerfile (#1703) --- serving/docker/Dockerfile | 2 +- serving/docker/aarch64.Dockerfile | 2 +- serving/docker/deepspeed.Dockerfile | 8 ++++---- serving/docker/pytorch-gpu.Dockerfile | 2 +- serving/docker/pytorch-inf2.Dockerfile | 2 +- serving/docker/tensorrt-llm.Dockerfile | 2 +- 6 files changed, 9 insertions(+), 9 deletions(-) diff --git a/serving/docker/Dockerfile b/serving/docker/Dockerfile index 1b5dfc0ad1..6c5f9be513 100644 --- a/serving/docker/Dockerfile +++ b/serving/docker/Dockerfile @@ -10,7 +10,7 @@ # BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, express or implied. See the License for # the specific language governing permissions and limitations under the License. FROM ubuntu:22.04 AS base -ARG djl_version=0.27.0~SNAPSHOT +ARG djl_version=0.27.0 COPY scripts scripts/ RUN mkdir -p /opt/djl/conf && \ diff --git a/serving/docker/aarch64.Dockerfile b/serving/docker/aarch64.Dockerfile index 587cda3126..0272c32748 100644 --- a/serving/docker/aarch64.Dockerfile +++ b/serving/docker/aarch64.Dockerfile @@ -10,7 +10,7 @@ # BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, express or implied. See the License for # the specific language governing permissions and limitations under the License. FROM arm64v8/ubuntu:22.04 -ARG djl_version=0.27.0~SNAPSHOT +ARG djl_version=0.27.0 ARG torch_version=2.1.1 EXPOSE 8080 diff --git a/serving/docker/deepspeed.Dockerfile b/serving/docker/deepspeed.Dockerfile index 0a43a73047..b64635cab4 100644 --- a/serving/docker/deepspeed.Dockerfile +++ b/serving/docker/deepspeed.Dockerfile @@ -12,7 +12,7 @@ ARG version=12.1.1-cudnn8-devel-ubuntu22.04 FROM nvidia/cuda:$version ARG cuda_version=cu121 -ARG djl_version=0.27.0~SNAPSHOT +ARG djl_version=0.27.0 # Base Deps ARG python_version=3.10 ARG torch_version=2.1.2 @@ -28,15 +28,15 @@ ARG optimum_version=1.15.0 ARG auto_gptq_version=0.5.1 ARG datasets_version=2.17.1 # DeepSpeed Deps -ARG deepspeed_version=nightly +ARG deepspeed_version=0.12.6 ARG deepspeed_wheel="https://publish.djl.ai/deepspeed/deepspeed-${deepspeed_version}-cp310-cp310-linux_x86_64.whl" # LMI-Dist Deps ARG vllm_wheel="https://github.com/vllm-project/vllm/releases/download/v0.3.3/vllm-0.3.3-cp310-cp310-manylinux1_x86_64.whl" ARG flash_attn_2_wheel="https://publish.djl.ai/flash_attn/cu121-pt212/flash_attn-2.5.6-cp310-cp310-linux_x86_64.whl" -ARG lmi_dist_wheel="https://publish.djl.ai/lmi_dist/lmi_dist-nightly-py3-none-any.whl" +ARG lmi_dist_wheel="https://publish.djl.ai/lmi_dist/lmi_dist-9.0.0-py3-none-any.whl" ARG seq_scheduler_wheel="https://publish.djl.ai/seq_scheduler/seq_scheduler-0.1.0-py3-none-any.whl" ARG peft_wheel="https://publish.djl.ai/peft/peft-0.5.0alpha-py3-none-any.whl" -ARG mmaploader_wheel="https://publish.djl.ai/mmaploader/mmaploader-nightly-py3-none-any.whl" +ARG mmaploader_wheel="https://publish.djl.ai/mmaploader/mmaploader-1.0.0-py3-none-any.whl" ARG aiccl_wheel="https://publish.djl.ai/aiccl/aiccl-1.1%2Bcu121torch2.1-cp310-cp310-linux_x86_64.whl" EXPOSE 8080 diff --git a/serving/docker/pytorch-gpu.Dockerfile b/serving/docker/pytorch-gpu.Dockerfile index a145cecfc0..01333dec83 100644 --- a/serving/docker/pytorch-gpu.Dockerfile +++ b/serving/docker/pytorch-gpu.Dockerfile @@ -13,7 +13,7 @@ ARG version=12.1.1-cudnn8-devel-ubuntu22.04 FROM nvidia/cuda:$version as base -ARG djl_version=0.27.0~SNAPSHOT +ARG djl_version=0.27.0 ARG cuda_version=cu121 ARG torch_version=2.1.1 ARG torch_vision_version=0.16.1 diff --git a/serving/docker/pytorch-inf2.Dockerfile b/serving/docker/pytorch-inf2.Dockerfile index 5d0ebcce08..72f0c0a41e 100644 --- a/serving/docker/pytorch-inf2.Dockerfile +++ b/serving/docker/pytorch-inf2.Dockerfile @@ -10,7 +10,7 @@ # BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, express or implied. See the License for # the specific language governing permissions and limitations under the License. FROM ubuntu:20.04 -ARG djl_version=0.27.0~SNAPSHOT +ARG djl_version=0.27.0 ARG torch_version=1.13.1 ARG python_version=3.9 ARG neuronsdk_version=2.17.0 diff --git a/serving/docker/tensorrt-llm.Dockerfile b/serving/docker/tensorrt-llm.Dockerfile index 39f43f4768..0fad648d33 100644 --- a/serving/docker/tensorrt-llm.Dockerfile +++ b/serving/docker/tensorrt-llm.Dockerfile @@ -14,7 +14,7 @@ FROM nvidia/cuda:$version ARG cuda_version=cu122 ARG python_version=3.10 ARG TORCH_VERSION=2.1.2 -ARG djl_version=0.27.0~SNAPSHOT +ARG djl_version=0.27.0 ARG transformers_version=4.38.1 ARG accelerate_version=0.27.0 ARG tensorrtlibs_version=9.2.0.post12.dev5