From f9ffddd4fe72f6266105d9981e43159e7511f8e2 Mon Sep 17 00:00:00 2001 From: FrankLeeeee Date: Fri, 7 Jul 2023 11:14:16 +0800 Subject: [PATCH] [docker] added ssh and rdma support for docker --- docker/Dockerfile | 12 ++++++++++++ 1 file changed, 12 insertions(+) diff --git a/docker/Dockerfile b/docker/Dockerfile index 2c7bafd9604c..97399c939376 100644 --- a/docker/Dockerfile +++ b/docker/Dockerfile @@ -5,6 +5,18 @@ LABEL org.opencontainers.image.source = "https://github.com/hpcaitech/ColossalAI LABEL org.opencontainers.image.licenses = "Apache License 2.0" LABEL org.opencontainers.image.base.name = "docker.io/library/hpcaitech/cuda-conda:11.3" +# enable passwordless ssh +RUN mkdir ~/.ssh && \ + printf "Host * \n ForwardAgent yes\nHost *\n StrictHostKeyChecking no" > ~/.ssh/config && \ + ssh-keygen -t rsa -N "" -f ~/.ssh/id_rsa && \ + cat ~/.ssh/id_rsa.pub >> ~/.ssh/authorized_keys + +# enable RDMA support +RUN apt-get update && \ + apt-get install -y infiniband-diags perftest ibverbs-providers libibumad3 libibverbs1 libnl-3-200 libnl-route-3-200 librdmacm1 && \ + apt-get clean && \ + rm -rf /var/lib/apt/lists/* + # install torch RUN conda install pytorch==1.12.1 torchvision==0.13.1 torchaudio==0.12.1 cudatoolkit=11.3 -c pytorch