From 2a501ac954bba0aa1661ac4b8118bdb607bceca9 Mon Sep 17 00:00:00 2001 From: Lysandre Debut Date: Thu, 1 Jul 2021 15:26:46 +0200 Subject: [PATCH] Comment fast GPU TF tests (#12452) --- .github/workflows/self-push.yml | 168 ++++++++++++++++---------------- 1 file changed, 84 insertions(+), 84 deletions(-) diff --git a/.github/workflows/self-push.yml b/.github/workflows/self-push.yml index 515d5bc73d..6d05c79274 100644 --- a/.github/workflows/self-push.yml +++ b/.github/workflows/self-push.yml @@ -61,47 +61,47 @@ jobs: name: run_all_tests_torch_gpu_test_reports path: reports - run_tests_tf_gpu: - runs-on: [self-hosted, docker-gpu, single-gpu] - timeout-minutes: 120 - container: - image: tensorflow/tensorflow:2.4.1-gpu - options: --gpus 0 --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/ - steps: - - name: Launcher docker - uses: actions/checkout@v2 - - - name: NVIDIA-SMI - run: | - nvidia-smi - - - name: Install dependencies - run: | - pip install --upgrade pip - pip install .[sklearn,testing,onnxruntime,sentencepiece] - - - name: Are GPUs recognized by our DL frameworks - run: | - TF_CPP_MIN_LOG_LEVEL=3 python -c "import tensorflow as tf; print('TF GPUs available:', bool(tf.config.list_physical_devices('GPU')))" - TF_CPP_MIN_LOG_LEVEL=3 python -c "import tensorflow as tf; print('Number of TF GPUs available:', len(tf.config.list_physical_devices('GPU')))" - - - name: Run all non-slow tests on GPU - env: - TF_NUM_INTRAOP_THREADS: 8 - TF_NUM_INTEROP_THREADS: 1 - run: | - python -m pytest -n 1 --dist=loadfile --make-reports=tests_tf_gpu tests - - - name: Failure short reports - if: ${{ always() }} - run: cat reports/tests_tf_gpu_failures_short.txt - - - name: Test suite reports artifacts - if: ${{ always() }} - uses: actions/upload-artifact@v2 - with: - name: run_all_tests_tf_gpu_test_reports - path: reports +# run_tests_tf_gpu: +# runs-on: [self-hosted, docker-gpu, single-gpu] +# timeout-minutes: 120 +# container: +# image: tensorflow/tensorflow:2.4.1-gpu +# options: --gpus 0 --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/ +# steps: +# - name: Launcher docker +# uses: actions/checkout@v2 +# +# - name: NVIDIA-SMI +# run: | +# nvidia-smi +# +# - name: Install dependencies +# run: | +# pip install --upgrade pip +# pip install .[sklearn,testing,onnxruntime,sentencepiece] +# +# - name: Are GPUs recognized by our DL frameworks +# run: | +# TF_CPP_MIN_LOG_LEVEL=3 python -c "import tensorflow as tf; print('TF GPUs available:', bool(tf.config.list_physical_devices('GPU')))" +# TF_CPP_MIN_LOG_LEVEL=3 python -c "import tensorflow as tf; print('Number of TF GPUs available:', len(tf.config.list_physical_devices('GPU')))" +# +# - name: Run all non-slow tests on GPU +# env: +# TF_NUM_INTRAOP_THREADS: 8 +# TF_NUM_INTEROP_THREADS: 1 +# run: | +# python -m pytest -n 1 --dist=loadfile --make-reports=tests_tf_gpu tests +# +# - name: Failure short reports +# if: ${{ always() }} +# run: cat reports/tests_tf_gpu_failures_short.txt +# +# - name: Test suite reports artifacts +# if: ${{ always() }} +# uses: actions/upload-artifact@v2 +# with: +# name: run_all_tests_tf_gpu_test_reports +# path: reports run_tests_torch_multi_gpu: @@ -147,47 +147,47 @@ jobs: name: run_all_tests_torch_multi_gpu_test_reports path: reports - run_tests_tf_multi_gpu: - runs-on: [self-hosted, docker-gpu, multi-gpu] - timeout-minutes: 120 - container: - image: tensorflow/tensorflow:2.4.1-gpu - options: --gpus all --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/ - steps: - - name: Launcher docker - uses: actions/checkout@v2 - - - name: NVIDIA-SMI - run: | - nvidia-smi - - - name: Install dependencies - run: | - pip install --upgrade pip - pip install .[sklearn,testing,onnxruntime,sentencepiece] - - - name: Are GPUs recognized by our DL frameworks - run: | - TF_CPP_MIN_LOG_LEVEL=3 python -c "import tensorflow as tf; print('TF GPUs available:', bool(tf.config.list_physical_devices('GPU')))" - TF_CPP_MIN_LOG_LEVEL=3 python -c "import tensorflow as tf; print('Number of TF GPUs available:', len(tf.config.list_physical_devices('GPU')))" - - - name: Run all non-slow tests on GPU - env: - TF_NUM_INTRAOP_THREADS: 8 - TF_NUM_INTEROP_THREADS: 1 - run: | - python -m pytest -n 1 --dist=loadfile --make-reports=tests_tf_multi_gpu tests - - - name: Failure short reports - if: ${{ always() }} - run: cat reports/tests_tf_multi_gpu_failures_short.txt - - - name: Test suite reports artifacts - if: ${{ always() }} - uses: actions/upload-artifact@v2 - with: - name: run_all_tests_tf_multi_gpu_test_reports - path: reports +# run_tests_tf_multi_gpu: +# runs-on: [self-hosted, docker-gpu, multi-gpu] +# timeout-minutes: 120 +# container: +# image: tensorflow/tensorflow:2.4.1-gpu +# options: --gpus all --shm-size "16gb" --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/ +# steps: +# - name: Launcher docker +# uses: actions/checkout@v2 +# +# - name: NVIDIA-SMI +# run: | +# nvidia-smi +# +# - name: Install dependencies +# run: | +# pip install --upgrade pip +# pip install .[sklearn,testing,onnxruntime,sentencepiece] +# +# - name: Are GPUs recognized by our DL frameworks +# run: | +# TF_CPP_MIN_LOG_LEVEL=3 python -c "import tensorflow as tf; print('TF GPUs available:', bool(tf.config.list_physical_devices('GPU')))" +# TF_CPP_MIN_LOG_LEVEL=3 python -c "import tensorflow as tf; print('Number of TF GPUs available:', len(tf.config.list_physical_devices('GPU')))" +# +# - name: Run all non-slow tests on GPU +# env: +# TF_NUM_INTRAOP_THREADS: 8 +# TF_NUM_INTEROP_THREADS: 1 +# run: | +# python -m pytest -n 1 --dist=loadfile --make-reports=tests_tf_multi_gpu tests +# +# - name: Failure short reports +# if: ${{ always() }} +# run: cat reports/tests_tf_multi_gpu_failures_short.txt +# +# - name: Test suite reports artifacts +# if: ${{ always() }} +# uses: actions/upload-artifact@v2 +# with: +# name: run_all_tests_tf_multi_gpu_test_reports +# path: reports run_tests_torch_cuda_extensions_gpu: runs-on: [self-hosted, docker-gpu, single-gpu] @@ -278,9 +278,9 @@ jobs: if: always() needs: [ run_tests_torch_gpu, - run_tests_tf_gpu, +# run_tests_tf_gpu, run_tests_torch_multi_gpu, - run_tests_tf_multi_gpu, +# run_tests_tf_multi_gpu, run_tests_torch_cuda_extensions_gpu, run_tests_torch_cuda_extensions_multi_gpu ]