9
# Group key is built from the workflow name and the git ref.
group: ${{ github.workflow }}-${{ github.ref }}
10
# NOTE(review): presumably nested under a `concurrency:` key that is not
# visible here; if so, a newer run in the same group cancels the one in progress.
cancel-in-progress: true
18
# Runner selection by label list: self-hosted, nvidia, cu111, v100.
runs-on: [self-hosted, nvidia, cu111, v100]
21
# Check out the repository so that repo-local paths are available to later steps.
- uses: actions/checkout@v3
24
# Action referenced by a path inside this repository (not a published action).
# NOTE(review): the header of this step is outside the visible excerpt.
uses: ./.github/workflows/setup-venv
26
- name: Install pytorch
28
# Install the pinned torch 1.10.0 / torchvision 0.11.0 "+cu111" builds, looking
# up wheels at the PyTorch download page and using $TORCH_CACHE as pip's cache
# directory (TORCH_CACHE is defined outside this excerpt).
pip install -U --cache-dir $TORCH_CACHE torch==1.10.0+cu111 torchvision==0.11.0+cu111 -f https://download.pytorch.org/whl/torch_stable.html
29
# Print the imported torch version and module.
python -c "import torch; print('torch:', torch.__version__, torch)"
30
# Print whether torch reports CUDA as available.
python -c "import torch; print('CUDA available:', torch.cuda.is_available())"
32
- name: Install transformers
34
# Clone the default branch of huggingface/transformers (no revision is pinned).
git clone https://github.com/huggingface/transformers
36
# If needed, switch to the last known-good SHA until transformers@master is fixed.
37
# git checkout 1cc453d33
38
# Print the abbreviated SHA of the current HEAD commit.
git rev-parse --short HEAD
41
- name: Install deepspeed
43
# Install the project in the current directory with the dev, 1bit and
# autotuning extras, without pip's build isolation.
# The requirement is quoted so the shell never treats the bracket expression
# as a glob pattern.
pip install ".[dev,1bit,autotuning]" --no-build-isolation
46
- name: Python environment
52
# NOTE(review): the header of the step these commands belong to is outside the
# visible excerpt.
unset TORCH_CUDA_ARCH_LIST # only jit compile for current arch
54
# Run the tests under unit/ with --forked and 4 parallel workers (-n 4).
# NOTE(review): --torch_ver / --cuda_ver are presumably project-defined pytest
# options describing the expected environment — confirm in the test conftest.
pytest $PYTEST_OPTS --forked -n 4 unit/ --torch_ver="1.10" --cuda_ver="11"
55
# Run only the tests selected by the 'sequential' marker, without -n.
pytest $PYTEST_OPTS --forked -m 'sequential' unit/ --torch_ver="1.10" --cuda_ver="11"
57
- name: Open GitHub issue if nightly CI fails
58
# Run this step only when an earlier step failed and the workflow was
# triggered by a 'schedule' event.
if: ${{ failure() && (github.event_name == 'schedule') }}
59
uses: JasonEtco/create-an-issue@v2
61
# Repository-scoped token exposed to the action.
# NOTE(review): presumably nested under an `env:` key not visible here.
GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
63
# Path of the issue template file handed to the action.
# NOTE(review): presumably nested under a `with:` key not visible here.
filename: .github/ISSUE_TEMPLATE/ci_failure_report.md