forked from deepmodeling/abacus-develop
-
Notifications
You must be signed in to change notification settings - Fork 0
91 lines (86 loc) · 3.1 KB
/
cuda.yml
File metadata and controls
91 lines (86 loc) · 3.1 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
# Manually triggered GPU workflow: start an on-demand EC2 runner, build and
# test on it inside the abacus-cuda container, then stop the runner again.
name: CUDA Test

on:
  workflow_dispatch:

jobs:
  # Starts the EC2 instance and exposes its runner label and instance id to
  # the jobs that depend on it.
  start-runner:
    name: Start self-hosted EC2 runner
    runs-on: ubuntu-latest
    outputs:
      label: ${{ steps.start-ec2-runner.outputs.label }}
      ec2-instance-id: ${{ steps.start-ec2-runner.outputs.ec2-instance-id }}
    steps:
      - name: Configure AWS credentials
        uses: aws-actions/configure-aws-credentials@v1
        with:
          aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }}
          aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }}
          aws-region: us-east-2
      - name: Start EC2 runner
        # The id is referenced by the job-level outputs above.
        id: start-ec2-runner
        uses: machulav/ec2-github-runner@v2
        with:
          mode: start
          github-token: ${{ secrets.PAT }}
          ec2-image-id: ami-04cd9fec4a7a39019
          ec2-instance-type: g4dn.xlarge
          subnet-id: subnet-72d3e53e
          security-group-id: sg-06b0c93122c08aeab

  # Builds with cuSolver support and runs the e2e, unit and performance tests
  # on the runner started above.
  test:
    name: Do the job on the runner
    needs: start-runner  # required to start the main job when the runner is ready
    runs-on: ${{ needs.start-runner.outputs.label }}  # run the job on the newly created runner
    container:
      image: ghcr.io/deepmodeling/abacus-cuda
      options: --gpus all
    steps:
      - name: Checkout
        uses: actions/checkout@v3
      - name: Build cuSolver
        run: |
          nvidia-smi
          cmake -B build -DUSE_CUSOLVER_LCAO=ON
          cmake --build build -j4
          cmake --install build
          # Reconfigure the same build tree with testing enabled and build
          # only the hsolver_diago target used by the "Test UT" step.
          cmake -B build -DBUILD_TESTING=ON
          cmake --build build -j4 --target hsolver_diago
      - name: Test e2e
        run: |
          # Emit the ':' separator only when LD_LIBRARY_PATH is already set;
          # a leading empty entry would make the loader search the current
          # directory.
          export LD_LIBRARY_PATH="${LD_LIBRARY_PATH:+${LD_LIBRARY_PATH}:}/usr/local/cuda/lib64"
          cd tests/integrate
          # Append with sed, as the performance step does, so the keyword
          # lands on its own line even if INPUT lacks a trailing newline.
          sed -i '$a ks_solver cusolver' ./270_NO_MD_2O/INPUT
          ./Autotest.sh -r 270_NO_MD_2O
      - name: Test UT
        run: |
          cd source/src_pdiag/test/
          # Copy the test binary built in the "Build cuSolver" step into this
          # directory before running it.
          cp ../../../build/source/src_pdiag/test/hsolver_diago .
          ./hsolver_diago
          bash diago_parallel_test.sh
      - name: Test performance
        run: |
          cd examples/performance
          ls -d P1*lcao* > allcase
          # Drop any existing ks_solver line, then append the cusolver
          # setting to every selected case.
          sed -i '/ks_solver/d' P1*lcao*/INPUT
          sed -i '$a ks_solver cusolver' P1*lcao*/INPUT
          bash run.sh
          cat sumall.dat

  # Always runs, so the EC2 runner is stopped even when an earlier job failed.
  stop-runner:
    name: Stop self-hosted EC2 runner
    needs:
      - start-runner  # required to get output from the start-runner job
      - test  # required to wait when the main job is done
    runs-on: ubuntu-latest
    if: ${{ always() }}  # required to stop the runner even if the error happened in the previous jobs
    steps:
      - name: Configure AWS credentials
        uses: aws-actions/configure-aws-credentials@v1
        with:
          aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }}
          aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }}
          aws-region: us-east-2
      - name: Stop EC2 runner
        uses: machulav/ec2-github-runner@v2
        with:
          mode: stop
          github-token: ${{ secrets.PAT }}
          label: ${{ needs.start-runner.outputs.label }}
          ec2-instance-id: ${{ needs.start-runner.outputs.ec2-instance-id }}