Skip to content

Commit f9745f7

Browse files
committed
Merge remote-tracking branch 'upstream/release'
2 parents 59ff746 + 57cf8f9 commit f9745f7

File tree

1,443 files changed

+69125
-25906
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

1,443 files changed

+69125
-25906
lines changed

.buildkite/check-wheel-size.py

Lines changed: 7 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,9 +1,14 @@
1+
# SPDX-License-Identifier: Apache-2.0
2+
13
import os
24
import sys
35
import zipfile
46

5-
# Read the VLLM_MAX_SIZE_MB environment variable, defaulting to 250 MB
6-
VLLM_MAX_SIZE_MB = int(os.environ.get('VLLM_MAX_SIZE_MB', 250))
7+
# Read the VLLM_MAX_SIZE_MB environment variable, defaulting to 400 MiB
8+
# Note that we have 400 MiB quota, please use it wisely.
9+
# See https://github.com/pypi/support/issues/3792 .
10+
# Please also sync the value with the one in Dockerfile.
11+
VLLM_MAX_SIZE_MB = int(os.environ.get('VLLM_MAX_SIZE_MB', 400))
712

813

914
def print_top_10_largest_files(zip_file):

.buildkite/generate_index.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,5 @@
1+
# SPDX-License-Identifier: Apache-2.0
2+
13
import argparse
24
import os
35

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,11 @@
1+
# bash ./run-lm-eval-gsm-vllm-baseline.sh -m nm-testing/SparseLlama-3.1-8B-gsm8k-pruned.2of4-chnl_wts_per_tok_dyn_act_fp8-BitM -b "auto" -t 2
2+
model_name: "nm-testing/SparseLlama-3.1-8B-gsm8k-pruned.2of4-chnl_wts_per_tok_dyn_act_fp8-BitM"
3+
tasks:
4+
- name: "gsm8k"
5+
metrics:
6+
- name: "exact_match,strict-match"
7+
value: 0.6353
8+
- name: "exact_match,flexible-extract"
9+
value: 0.637
10+
limit: null
11+
num_fewshot: null

.buildkite/lm-eval-harness/test_lm_eval_correctness.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,4 @@
1+
# SPDX-License-Identifier: Apache-2.0
12
"""
23
LM eval harness on model to compare vs HF baseline computed offline.
34
Configs are found in configs/$MODEL.yaml

.buildkite/nightly-benchmarks/benchmark-pipeline.yaml

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,6 @@
11
steps:
22
- label: "Wait for container to be ready"
3+
key: wait-for-container-image
34
agents:
45
queue: A100
56
plugins:
@@ -10,12 +11,11 @@ steps:
1011
command:
1112
- sh .buildkite/nightly-benchmarks/scripts/wait-for-image.sh
1213

13-
- wait
14-
1514
- label: "A100"
1615
# skip: "use this flag to conditionally skip the benchmark step, useful for PR testing"
1716
agents:
1817
queue: A100
18+
depends_on: wait-for-container-image
1919
plugins:
2020
- kubernetes:
2121
podSpec:
@@ -49,6 +49,7 @@ steps:
4949
# skip: "use this flag to conditionally skip the benchmark step, useful for PR testing"
5050
agents:
5151
queue: H200
52+
depends_on: wait-for-container-image
5253
plugins:
5354
- docker#v5.12.0:
5455
image: public.ecr.aws/q9t5s3a7/vllm-ci-postmerge-repo:$BUILDKITE_COMMIT
@@ -73,7 +74,7 @@ steps:
7374
# skip: "use this flag to conditionally skip the benchmark step, useful for PR testing"
7475
agents:
7576
queue: H100
76-
depends_on: block-h100
77+
depends_on: wait-for-container-image
7778
plugins:
7879
- docker#v5.12.0:
7980
image: public.ecr.aws/q9t5s3a7/vllm-ci-postmerge-repo:$BUILDKITE_COMMIT

.buildkite/nightly-benchmarks/scripts/convert-results-json-to-markdown.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,5 @@
1+
# SPDX-License-Identifier: Apache-2.0
2+
13
import json
24
import os
35
from pathlib import Path

.buildkite/nightly-benchmarks/scripts/download-tokenizer.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,5 @@
1+
# SPDX-License-Identifier: Apache-2.0
2+
13
import argparse
24

35
from transformers import AutoTokenizer

.buildkite/nightly-benchmarks/scripts/generate-nightly-markdown.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,5 @@
1+
# SPDX-License-Identifier: Apache-2.0
2+
13
import argparse
24
import json
35
from pathlib import Path

.buildkite/nightly-benchmarks/scripts/get-lmdeploy-modelname.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,5 @@
1+
# SPDX-License-Identifier: Apache-2.0
2+
13
from lmdeploy.serve.openai.api_client import APIClient
24

35
api_client = APIClient("http://localhost:8000")

.buildkite/nightly-benchmarks/scripts/nightly-annotate.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -43,7 +43,7 @@ main() {
4343

4444

4545

46-
# The figures should be genereated by a separate process outside the CI/CD pipeline
46+
# The figures should be generated by a separate process outside the CI/CD pipeline
4747

4848
# # generate figures
4949
# python3 -m pip install tabulate pandas matplotlib

0 commit comments

Comments
 (0)