Skip to content

Commit b1c5817

Browse files
DN6 and sayakpaul authored
Add debugging workflow (#7778)
add debug workflow Co-authored-by: Sayak Paul <[email protected]>
1 parent 235d34c commit b1c5817

File tree

1 file changed

+55
-0
lines changed

1 file changed

+55
-0
lines changed

.github/workflows/ssh-runner.yml

Lines changed: 55 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,55 @@
# Debugging workflow: starts a job inside a chosen Docker image on a chosen
# GPU runner and opens a Tailscale connection so a maintainer can SSH in.
name: SSH into runners

# Manual trigger only; both inputs are mandatory.
on:
  workflow_dispatch:
    inputs:
      runner_type:
        description: 'Type of runner to test (a10 or t4)'
        required: true
      docker_image:
        description: 'Name of the Docker image'
        required: true

# Environment shared by every step. Values are quoted so that no YAML loader
# re-types them (`yes` is a boolean under YAML 1.1); they reach the process as
# strings either way.
env:
  IS_GITHUB_CI: "1"
  HF_HUB_READ_TOKEN: ${{ secrets.HF_HUB_READ_TOKEN }}
  # Same path the container's volume mount below exposes.
  HF_HOME: /mnt/cache
  DIFFUSERS_IS_CI: "yes"
  OMP_NUM_THREADS: "8"
  MKL_NUM_THREADS: "8"
  RUN_SLOW: "yes"

jobs:
  ssh_runner:
    name: "SSH"
    # The runner_type input is used as one of the runner labels.
    runs-on:
      - single-gpu
      - nvidia-gpu
      - "${{ github.event.inputs.runner_type }}"
      - ci
    container:
      image: ${{ github.event.inputs.docker_image }}
      # Mounts the host directory /mnt/cache/.cache/huggingface at /mnt/cache/.
      options: --gpus all --privileged --ipc host -v /mnt/cache/.cache/huggingface:/mnt/cache/

    steps:
      # NOTE(review): assumes the image ships a git clone at /diffusers — confirm.
      - name: Update clone
        working-directory: /diffusers
        run: |
          git fetch && git checkout ${{ github.sha }}

      # Remove bytecode caches and the reports directory from the checkout.
      - name: Cleanup
        working-directory: /diffusers
        run: |
          rm -rf tests/__pycache__
          rm -rf tests/models/__pycache__
          rm -rf reports

      - name: Show installed libraries and their versions
        working-directory: /diffusers
        run: pip freeze

      - name: NVIDIA-SMI
        run: |
          nvidia-smi

      # Opens the Tailscale connection used to SSH into the runner.
      # NOTE(review): waitForSSH presumably keeps the job waiting for an SSH
      # session — confirm against the action's documentation.
      - name: Tailscale
        uses: huggingface/tailscale-action@v1
        with:
          authkey: ${{ secrets.TAILSCALE_SSH_AUTHKEY }}
          slackChannel: ${{ secrets.SLACK_CIFEEDBACK_CHANNEL }}
          slackToken: ${{ secrets.SLACK_CIFEEDBACK_BOT_TOKEN }}
          waitForSSH: true

0 commit comments

Comments
 (0)