From 1543cee7c8c95ef47f832b1f37625ba2923c4994 Mon Sep 17 00:00:00 2001
From: Yih-Dar <2521628+ydshieh@users.noreply.github.com>
Date: Thu, 15 Dec 2022 21:35:27 +0100
Subject: [PATCH] Recompile `apex` in `DeepSpeed` CI image (#20788)

Recompile apex in DeepSpeed CI image

Co-authored-by: ydshieh
---
Reviewer notes (text in this region is not part of the commit message):
  * The single hunk inserts five lines between the torch-tensorrt install
    and the "Pre-build latest DeepSpeed" section of the Dockerfile.
  * The new steps uninstall any existing `apex`, clone NVIDIA/apex, and
    install it from source with the `--cpp_ext` and `--cuda_ext` build
    options passed through pip's `--global-option`.

 docker/transformers-pytorch-deepspeed-latest-gpu/Dockerfile | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/docker/transformers-pytorch-deepspeed-latest-gpu/Dockerfile b/docker/transformers-pytorch-deepspeed-latest-gpu/Dockerfile
index 0b3e9d6737..7234d6881e 100644
--- a/docker/transformers-pytorch-deepspeed-latest-gpu/Dockerfile
+++ b/docker/transformers-pytorch-deepspeed-latest-gpu/Dockerfile
@@ -24,6 +24,11 @@ RUN python3 -m pip install --no-cache-dir ./transformers[deepspeed-testing]
 
 RUN python3 -m pip install torch-tensorrt==1.3.0 --find-links https://github.com/pytorch/TensorRT/releases/expanded_assets/v1.3.0
 
+# recompile apex
+RUN python3 -m pip uninstall -y apex
+RUN git clone https://github.com/NVIDIA/apex
+RUN cd apex && python3 -m pip install --global-option="--cpp_ext" --global-option="--cuda_ext" --no-cache -v --disable-pip-version-check .
+
 # Pre-build **latest** DeepSpeed, so it would be ready for testing (otherwise, the 1st deepspeed test will timeout)
 RUN python3 -m pip uninstall -y deepspeed
 # This has to be run (again) inside the GPU VMs running the tests.