From 81eb834d77d5d9cea5eed444356613ffd848e6e9 Mon Sep 17 00:00:00 2001 From: Yeonsil Yoon Date: Tue, 24 Dec 2024 14:00:50 -0800 Subject: [PATCH 1/2] Upgrade to SynapseAI 1.19.0 --- examples/multi-node-training/EFA/Dockerfile | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/examples/multi-node-training/EFA/Dockerfile b/examples/multi-node-training/EFA/Dockerfile index a527f99603..2e32bd0ca1 100644 --- a/examples/multi-node-training/EFA/Dockerfile +++ b/examples/multi-node-training/EFA/Dockerfile @@ -1,4 +1,4 @@ -FROM vault.habana.ai/gaudi-docker/1.18.0/ubuntu22.04/habanalabs/pytorch-installer-2.4.0:latest +FROM vault.habana.ai/gaudi-docker/1.19.0/ubuntu22.04/habanalabs/pytorch-installer-2.5.1:latest # Installs pdsh and upgrade pip RUN apt-get update && apt-get install -y pdsh && \ @@ -18,7 +18,7 @@ RUN sed -i 's/#Port 22/Port 3022/g' /etc/ssh/sshd_config && \ # Installs Optimum Habana and Habana's fork of DeepSpeed RUN pip install optimum[habana] && \ - pip install git+https://github.com/HabanaAI/DeepSpeed.git@1.18.0 + pip install git+https://github.com/HabanaAI/DeepSpeed.git@1.19.0 CMD ssh-keygen -t rsa -b 4096 -N '' -f ~/.ssh/id_rsa && \ chmod 600 ~/.ssh/id_rsa && \ From a3b4cd614f66e634332ef47551feedabe86263b4 Mon Sep 17 00:00:00 2001 From: Libin Tang Date: Tue, 24 Dec 2024 16:08:17 -0800 Subject: [PATCH 2/2] Update Dockerfile --- examples/multi-node-training/EFA/Dockerfile | 1 + 1 file changed, 1 insertion(+) diff --git a/examples/multi-node-training/EFA/Dockerfile b/examples/multi-node-training/EFA/Dockerfile index 2e32bd0ca1..bc6f827164 100644 --- a/examples/multi-node-training/EFA/Dockerfile +++ b/examples/multi-node-training/EFA/Dockerfile @@ -14,6 +14,7 @@ RUN git clone "https://github.com/HabanaAI/hccl_ofi_wrapper.git" "${OFI_WRAPPER_ RUN sed -i 's/#Port 22/Port 3022/g' /etc/ssh/sshd_config && \ sed -i 's/# Port 22/ Port 3022/g' /etc/ssh/ssh_config && \ sed -i 's/#PermitRootLogin prohibit-password/PermitRootLogin yes/' /etc/ssh/sshd_config && \ + /usr/bin/ssh-keygen -A && \ service ssh restart # Installs Optimum Habana and Habana's fork of DeepSpeed