clear ~/.cache/torch_extensions between builds (#14520)
This commit is contained in:
7
.github/workflows/self-nightly-scheduled.yml
vendored
7
.github/workflows/self-nightly-scheduled.yml
vendored
@@ -205,8 +205,9 @@ jobs:
|
|||||||
apt -y update && apt install -y libaio-dev
|
apt -y update && apt install -y libaio-dev
|
||||||
pip install --upgrade pip
|
pip install --upgrade pip
|
||||||
pip install --pre torch torchvision torchaudio -f https://download.pytorch.org/whl/nightly/cu111/torch_nightly.html -U
|
pip install --pre torch torchvision torchaudio -f https://download.pytorch.org/whl/nightly/cu111/torch_nightly.html -U
|
||||||
pip install .[testing,deepspeed,fairscale]
|
rm -rf ~/.cache/torch_extensions/ # shared between conflicting builds
|
||||||
pip install git+https://github.com/microsoft/DeepSpeed
|
pip install .[testing,fairscale]
|
||||||
|
pip install git+https://github.com/microsoft/DeepSpeed # testing bleeding edge
|
||||||
|
|
||||||
- name: Are GPUs recognized by our DL frameworks
|
- name: Are GPUs recognized by our DL frameworks
|
||||||
run: |
|
run: |
|
||||||
@@ -218,7 +219,7 @@ jobs:
|
|||||||
- name: Run all tests on GPU
|
- name: Run all tests on GPU
|
||||||
run: |
|
run: |
|
||||||
python -m pytest -n 1 -v --dist=loadfile --make-reports=tests_torch_cuda_extensions_multi_gpu tests/deepspeed tests/extended
|
python -m pytest -n 1 -v --dist=loadfile --make-reports=tests_torch_cuda_extensions_multi_gpu tests/deepspeed tests/extended
|
||||||
|
|
||||||
- name: Failure short reports
|
- name: Failure short reports
|
||||||
if: ${{ always() }}
|
if: ${{ always() }}
|
||||||
run: cat reports/tests_torch_cuda_extensions_multi_gpu_failures_short.txt
|
run: cat reports/tests_torch_cuda_extensions_multi_gpu_failures_short.txt
|
||||||
|
|||||||
13
.github/workflows/self-push.yml
vendored
13
.github/workflows/self-push.yml
vendored
@@ -50,7 +50,7 @@ jobs:
|
|||||||
python -c "import torch; print('Cuda version:', torch.version.cuda)"
|
python -c "import torch; print('Cuda version:', torch.version.cuda)"
|
||||||
python -c "import torch; print('CuDNN version:', torch.backends.cudnn.version())"
|
python -c "import torch; print('CuDNN version:', torch.backends.cudnn.version())"
|
||||||
python -c "import torch; print('Number of GPUs available:', torch.cuda.device_count())"
|
python -c "import torch; print('Number of GPUs available:', torch.cuda.device_count())"
|
||||||
|
|
||||||
- name: Fetch the tests to run
|
- name: Fetch the tests to run
|
||||||
run: |
|
run: |
|
||||||
python utils/tests_fetcher.py --diff_with_last_commit | tee test_preparation.txt
|
python utils/tests_fetcher.py --diff_with_last_commit | tee test_preparation.txt
|
||||||
@@ -105,7 +105,7 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
python -c "from jax.lib import xla_bridge; print('GPU available:', xla_bridge.get_backend().platform)"
|
python -c "from jax.lib import xla_bridge; print('GPU available:', xla_bridge.get_backend().platform)"
|
||||||
python -c "import jax; print('Number of GPUs available:', len(jax.local_devices()))"
|
python -c "import jax; print('Number of GPUs available:', len(jax.local_devices()))"
|
||||||
|
|
||||||
- name: Fetch the tests to run
|
- name: Fetch the tests to run
|
||||||
run: |
|
run: |
|
||||||
python utils/tests_fetcher.py --diff_with_last_commit | tee test_preparation.txt
|
python utils/tests_fetcher.py --diff_with_last_commit | tee test_preparation.txt
|
||||||
@@ -203,7 +203,7 @@ jobs:
|
|||||||
apt install -y libsndfile1-dev
|
apt install -y libsndfile1-dev
|
||||||
pip install --upgrade pip
|
pip install --upgrade pip
|
||||||
pip install .[sklearn,testing,onnxruntime,sentencepiece,torch-speech,vision,timm]
|
pip install .[sklearn,testing,onnxruntime,sentencepiece,torch-speech,vision,timm]
|
||||||
|
|
||||||
- name: Launcher docker
|
- name: Launcher docker
|
||||||
uses: actions/checkout@v2
|
uses: actions/checkout@v2
|
||||||
with:
|
with:
|
||||||
@@ -277,7 +277,7 @@ jobs:
|
|||||||
# run: |
|
# run: |
|
||||||
# python -c "from jax.lib import xla_bridge; print('GPU available:', xla_bridge.get_backend().platform)"
|
# python -c "from jax.lib import xla_bridge; print('GPU available:', xla_bridge.get_backend().platform)"
|
||||||
# python -c "import jax; print('Number of GPUs available:', len(jax.local_devices()))"
|
# python -c "import jax; print('Number of GPUs available:', len(jax.local_devices()))"
|
||||||
#
|
#
|
||||||
# - name: Fetch the tests to run
|
# - name: Fetch the tests to run
|
||||||
# run: |
|
# run: |
|
||||||
# python utils/tests_fetcher.py --diff_with_last_commit | tee test_preparation.txt
|
# python utils/tests_fetcher.py --diff_with_last_commit | tee test_preparation.txt
|
||||||
@@ -389,11 +389,11 @@ jobs:
|
|||||||
python -c "import torch; print('Cuda version:', torch.version.cuda)"
|
python -c "import torch; print('Cuda version:', torch.version.cuda)"
|
||||||
python -c "import torch; print('CuDNN version:', torch.backends.cudnn.version())"
|
python -c "import torch; print('CuDNN version:', torch.backends.cudnn.version())"
|
||||||
python -c "import torch; print('Number of GPUs available:', torch.cuda.device_count())"
|
python -c "import torch; print('Number of GPUs available:', torch.cuda.device_count())"
|
||||||
|
|
||||||
- name: Fetch the tests to run
|
- name: Fetch the tests to run
|
||||||
run: |
|
run: |
|
||||||
python utils/tests_fetcher.py --diff_with_last_commit --filters tests/deepspeed tests/extended | tee test_preparation.txt
|
python utils/tests_fetcher.py --diff_with_last_commit --filters tests/deepspeed tests/extended | tee test_preparation.txt
|
||||||
|
|
||||||
- name: Report fetched tests
|
- name: Report fetched tests
|
||||||
uses: actions/upload-artifact@v2
|
uses: actions/upload-artifact@v2
|
||||||
with:
|
with:
|
||||||
@@ -437,6 +437,7 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
apt -y update && apt install -y libaio-dev
|
apt -y update && apt install -y libaio-dev
|
||||||
pip install --upgrade pip
|
pip install --upgrade pip
|
||||||
|
rm -rf ~/.cache/torch_extensions/ # shared between conflicting builds
|
||||||
pip install .[testing,deepspeed,fairscale]
|
pip install .[testing,deepspeed,fairscale]
|
||||||
|
|
||||||
- name: Are GPUs recognized by our DL frameworks
|
- name: Are GPUs recognized by our DL frameworks
|
||||||
|
|||||||
1
.github/workflows/self-scheduled.yml
vendored
1
.github/workflows/self-scheduled.yml
vendored
@@ -429,6 +429,7 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
apt -y update && apt install -y libaio-dev
|
apt -y update && apt install -y libaio-dev
|
||||||
pip install --upgrade pip
|
pip install --upgrade pip
|
||||||
|
rm -rf ~/.cache/torch_extensions/ # shared between conflicting builds
|
||||||
pip install .[testing,deepspeed,fairscale]
|
pip install .[testing,deepspeed,fairscale]
|
||||||
|
|
||||||
- name: Are GPUs recognized by our DL frameworks
|
- name: Are GPUs recognized by our DL frameworks
|
||||||
|
|||||||
Reference in New Issue
Block a user