Unverified commit d1fd64e7, authored by Stas Bekman, committed by GitHub
Browse files

clear ~/.cache/torch_extensions between builds (#14520)

parent 3772af49
...@@ -205,8 +205,9 @@ jobs: ...@@ -205,8 +205,9 @@ jobs:
apt -y update && apt install -y libaio-dev apt -y update && apt install -y libaio-dev
pip install --upgrade pip pip install --upgrade pip
pip install --pre torch torchvision torchaudio -f https://download.pytorch.org/whl/nightly/cu111/torch_nightly.html -U pip install --pre torch torchvision torchaudio -f https://download.pytorch.org/whl/nightly/cu111/torch_nightly.html -U
pip install .[testing,deepspeed,fairscale] rm -rf ~/.cache/torch_extensions/ # shared between conflicting builds
pip install git+https://github.com/microsoft/DeepSpeed pip install .[testing,fairscale]
pip install git+https://github.com/microsoft/DeepSpeed # testing bleeding edge
- name: Are GPUs recognized by our DL frameworks - name: Are GPUs recognized by our DL frameworks
run: | run: |
...@@ -218,7 +219,7 @@ jobs: ...@@ -218,7 +219,7 @@ jobs:
- name: Run all tests on GPU - name: Run all tests on GPU
run: | run: |
python -m pytest -n 1 -v --dist=loadfile --make-reports=tests_torch_cuda_extensions_multi_gpu tests/deepspeed tests/extended python -m pytest -n 1 -v --dist=loadfile --make-reports=tests_torch_cuda_extensions_multi_gpu tests/deepspeed tests/extended
- name: Failure short reports - name: Failure short reports
if: ${{ always() }} if: ${{ always() }}
run: cat reports/tests_torch_cuda_extensions_multi_gpu_failures_short.txt run: cat reports/tests_torch_cuda_extensions_multi_gpu_failures_short.txt
......
...@@ -50,7 +50,7 @@ jobs: ...@@ -50,7 +50,7 @@ jobs:
python -c "import torch; print('Cuda version:', torch.version.cuda)" python -c "import torch; print('Cuda version:', torch.version.cuda)"
python -c "import torch; print('CuDNN version:', torch.backends.cudnn.version())" python -c "import torch; print('CuDNN version:', torch.backends.cudnn.version())"
python -c "import torch; print('Number of GPUs available:', torch.cuda.device_count())" python -c "import torch; print('Number of GPUs available:', torch.cuda.device_count())"
- name: Fetch the tests to run - name: Fetch the tests to run
run: | run: |
python utils/tests_fetcher.py --diff_with_last_commit | tee test_preparation.txt python utils/tests_fetcher.py --diff_with_last_commit | tee test_preparation.txt
...@@ -105,7 +105,7 @@ jobs: ...@@ -105,7 +105,7 @@ jobs:
run: | run: |
python -c "from jax.lib import xla_bridge; print('GPU available:', xla_bridge.get_backend().platform)" python -c "from jax.lib import xla_bridge; print('GPU available:', xla_bridge.get_backend().platform)"
python -c "import jax; print('Number of GPUs available:', len(jax.local_devices()))" python -c "import jax; print('Number of GPUs available:', len(jax.local_devices()))"
- name: Fetch the tests to run - name: Fetch the tests to run
run: | run: |
python utils/tests_fetcher.py --diff_with_last_commit | tee test_preparation.txt python utils/tests_fetcher.py --diff_with_last_commit | tee test_preparation.txt
...@@ -203,7 +203,7 @@ jobs: ...@@ -203,7 +203,7 @@ jobs:
apt install -y libsndfile1-dev apt install -y libsndfile1-dev
pip install --upgrade pip pip install --upgrade pip
pip install .[sklearn,testing,onnxruntime,sentencepiece,torch-speech,vision,timm] pip install .[sklearn,testing,onnxruntime,sentencepiece,torch-speech,vision,timm]
- name: Launcher docker - name: Launcher docker
uses: actions/checkout@v2 uses: actions/checkout@v2
with: with:
...@@ -277,7 +277,7 @@ jobs: ...@@ -277,7 +277,7 @@ jobs:
# run: | # run: |
# python -c "from jax.lib import xla_bridge; print('GPU available:', xla_bridge.get_backend().platform)" # python -c "from jax.lib import xla_bridge; print('GPU available:', xla_bridge.get_backend().platform)"
# python -c "import jax; print('Number of GPUs available:', len(jax.local_devices()))" # python -c "import jax; print('Number of GPUs available:', len(jax.local_devices()))"
# #
# - name: Fetch the tests to run # - name: Fetch the tests to run
# run: | # run: |
# python utils/tests_fetcher.py --diff_with_last_commit | tee test_preparation.txt # python utils/tests_fetcher.py --diff_with_last_commit | tee test_preparation.txt
...@@ -389,11 +389,11 @@ jobs: ...@@ -389,11 +389,11 @@ jobs:
python -c "import torch; print('Cuda version:', torch.version.cuda)" python -c "import torch; print('Cuda version:', torch.version.cuda)"
python -c "import torch; print('CuDNN version:', torch.backends.cudnn.version())" python -c "import torch; print('CuDNN version:', torch.backends.cudnn.version())"
python -c "import torch; print('Number of GPUs available:', torch.cuda.device_count())" python -c "import torch; print('Number of GPUs available:', torch.cuda.device_count())"
- name: Fetch the tests to run - name: Fetch the tests to run
run: | run: |
python utils/tests_fetcher.py --diff_with_last_commit --filters tests/deepspeed tests/extended | tee test_preparation.txt python utils/tests_fetcher.py --diff_with_last_commit --filters tests/deepspeed tests/extended | tee test_preparation.txt
- name: Report fetched tests - name: Report fetched tests
uses: actions/upload-artifact@v2 uses: actions/upload-artifact@v2
with: with:
...@@ -437,6 +437,7 @@ jobs: ...@@ -437,6 +437,7 @@ jobs:
run: | run: |
apt -y update && apt install -y libaio-dev apt -y update && apt install -y libaio-dev
pip install --upgrade pip pip install --upgrade pip
rm -rf ~/.cache/torch_extensions/ # shared between conflicting builds
pip install .[testing,deepspeed,fairscale] pip install .[testing,deepspeed,fairscale]
- name: Are GPUs recognized by our DL frameworks - name: Are GPUs recognized by our DL frameworks
......
...@@ -429,6 +429,7 @@ jobs: ...@@ -429,6 +429,7 @@ jobs:
run: | run: |
apt -y update && apt install -y libaio-dev apt -y update && apt install -y libaio-dev
pip install --upgrade pip pip install --upgrade pip
rm -rf ~/.cache/torch_extensions/ # shared between conflicting builds
pip install .[testing,deepspeed,fairscale] pip install .[testing,deepspeed,fairscale]
- name: Are GPUs recognized by our DL frameworks - name: Are GPUs recognized by our DL frameworks
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment