Skip to content

Commit b256dd7

Browse files
committed
Merge remote-tracking branch 'origin/main' into trtllm-attention-test-unify
2 parents 8712963 + 85a9a8d commit b256dd7

File tree

188 files changed

+32159
-11118
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

188 files changed

+32159
-11118
lines changed

.github/workflows/build-doc.yml

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -27,6 +27,11 @@ jobs:
2727
with:
2828
submodules: recursive
2929

30+
- name: Setup Python
31+
uses: actions/setup-python@v4
32+
with:
33+
python-version: '3.12'
34+
3035
- name: Configuring build Environment
3136
run: |
3237
sudo apt-get update

.github/workflows/release-ci-docker.yml

Lines changed: 58 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -7,16 +7,72 @@ jobs:
77
build:
88
runs-on: ubuntu-latest
99
steps:
10+
- name: Free Disk Space
11+
uses: jlumbroso/free-disk-space@main
12+
with:
13+
tool-cache: false
14+
android: true
15+
dotnet: true
16+
haskell: true
17+
large-packages: true
18+
docker-images: true
19+
swap-storage: true
20+
1021
- uses: actions/checkout@v4
22+
23+
- name: Set up QEMU
24+
uses: docker/setup-qemu-action@v3
25+
26+
- name: Set up Docker Buildx
27+
uses: docker/setup-buildx-action@v3
28+
1129
- name: Login to Docker Hub
1230
uses: docker/login-action@v3
1331
with:
1432
username: flashinfer
1533
password: ${{ secrets.DOCKERHUB_TOKEN }}
1634

17-
- uses: docker/build-push-action@v4
35+
- name: Build and push AMD64 image
36+
uses: docker/build-push-action@v5
1837
with:
1938
context: docker
2039
file: docker/Dockerfile.ci_gpu
40+
platforms: linux/amd64
2141
push: true
22-
tags: flashinfer/flashinfer-ci:latest
42+
tags: |
43+
flashinfer/flashinfer-ci:amd64
44+
cache-from: type=registry,ref=flashinfer/flashinfer-ci:buildcache-amd64
45+
cache-to: type=registry,ref=flashinfer/flashinfer-ci:buildcache-amd64,mode=max
46+
provenance: false
47+
sbom: false
48+
49+
- name: Clean up after AMD64 build
50+
run: |
51+
df -h /
52+
docker buildx prune -af
53+
docker system prune -af --volumes
54+
sudo rm -rf /tmp/* /var/tmp/* ~/.docker/buildx
55+
df -h /
56+
57+
- name: Re-setup Docker Buildx for ARM64
58+
uses: docker/setup-buildx-action@v3
59+
60+
- name: Build and push ARM64 image
61+
uses: docker/build-push-action@v5
62+
with:
63+
context: docker
64+
file: docker/Dockerfile.ci_gpu
65+
platforms: linux/arm64
66+
push: true
67+
tags: |
68+
flashinfer/flashinfer-ci:arm64
69+
cache-from: type=registry,ref=flashinfer/flashinfer-ci:buildcache-arm64
70+
cache-to: type=registry,ref=flashinfer/flashinfer-ci:buildcache-arm64,mode=max
71+
provenance: false
72+
sbom: false
73+
74+
- name: Create and push multi-arch manifest
75+
run: |
76+
docker buildx imagetools create -t flashinfer/flashinfer-ci:latest \
77+
flashinfer/flashinfer-ci:amd64 \
78+
flashinfer/flashinfer-ci:arm64

.pre-commit-config.yaml

Lines changed: 15 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -35,22 +35,25 @@ repos:
3535
- id: remove-crlf
3636

3737
# Formatters
38-
- repo: https://github.com/psf/black-pre-commit-mirror
39-
rev: 24.8.0
40-
hooks:
41-
- id: black
42-
exclude: flashinfer/tuning_configs/.*\.py
43-
44-
- repo: https://github.com/pycqa/isort
45-
rev: 5.13.2
46-
hooks:
47-
- id: isort
48-
args: ["--profile=black"] # <-- this one
49-
5038
- repo: https://github.com/pre-commit/mirrors-clang-format
5139
rev: v19.1.1
5240
hooks:
5341
- id: clang-format
5442
types_or: [c++, c, cuda]
5543
exclude: |
5644
(?x)^(3rdparty/.* flashinfer/jit/aot_config.py)$
45+
46+
- repo: https://github.com/pre-commit/mirrors-mypy
47+
rev: 'v1.17.1' # Use the sha / tag you want to point at
48+
hooks:
49+
- id: mypy
50+
51+
- repo: https://github.com/astral-sh/ruff-pre-commit
52+
# Ruff version.
53+
rev: v0.12.8
54+
hooks:
55+
# Run the linter.
56+
- id: ruff-check
57+
# Run the formatter.
58+
- id: ruff-format
59+
types_or: [ python, pyi ]

3rdparty/composable_kernels

Submodule composable_kernels deleted from 5055b3b

Jenkinsfile

Lines changed: 19 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -133,7 +133,7 @@ stage('Unittest') {
133133
cancel_previous_build()
134134
parallel(
135135
failFast: true,
136-
'AOT-Build-Import': {
136+
'AOT-Build-Import-x86-64': {
137137
try {
138138
run_unittest_CPU_AOT_COMPILE('CPU-LARGE-SPOT')
139139
} catch (Throwable ex) {
@@ -151,6 +151,24 @@ stage('Unittest') {
151151
}
152152
}
153153
},
154+
'AOT-Build-Import-aarch64': {
155+
try {
156+
run_unittest_CPU_AOT_COMPILE('ARM-LARGE-SPOT')
157+
} catch (Throwable ex) {
158+
echo 'Exception during SPOT run ' + ex.toString()
159+
if (is_last_build()) {
160+
// retry if we are currently at last build
161+
// mark the current stage as success
162+
// and try again via on demand node
163+
echo 'Exception during SPOT run ' + ex.toString() + ' retry on-demand'
164+
currentBuild.result = 'SUCCESS'
165+
run_unittest_CPU_AOT_COMPILE('ARM-LARGE')
166+
} else {
167+
echo 'Exit since it is not last build'
168+
throw ex
169+
}
170+
}
171+
},
154172
'JIT-Unittest-1': {
155173
try {
156174
shard_run_unittest_GPU('GPU-G5-SPOT', 1)

NOTICE

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
FlashInfer
2+
Copyright 2025 NVIDIA
3+
Copyright 2023-2025 FlashInfer community (https://flashinfer.ai/)
4+
5+
-------------------------------------------------------------------------------------------------
6+
Some of the code in this project is adapted from other open-source projects with different
7+
licenses. This product also bundles some third-party components under other open source licenses.
8+
See licenses/ for text of these licenses.

0 commit comments

Comments
 (0)