Skip to content

Commit ba1b36b

Browse files
committed
fix: change default subset names
1 parent f4f62b4 commit ba1b36b

File tree

4 files changed: 9 additions and 9 deletions.

4 files changed

+9
-9
lines changed

bigcodebench/data/bigcodebench.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,7 @@
1616
BIGCODEBENCH_HF = "bigcode/bigcodebench"
1717
BIGCODEBENCH_VERSION = "v0.1.0_hf"
1818

19-
def _ready_bigcodebench_path(subset="", version="default") -> str:
19+
def _ready_bigcodebench_path(subset="full", version="default") -> str:
2020
if BIGCODEBENCH_OVERRIDE_PATH:
2121
return BIGCODEBENCH_OVERRIDE_PATH
2222

@@ -39,7 +39,7 @@ def _ready_bigcodebench_path(subset="", version="default") -> str:
3939

4040

4141
def get_bigcodebench(
42-
err_incomplete=True, subset="", version="default"
42+
err_incomplete=True, subset="full", version="default"
4343
) -> Dict[str, Dict]:
4444
"""Get BigCodeBench from BigCode's github repo and return as a list of parsed dicts.
4545
@@ -63,7 +63,7 @@ def get_bigcodebench(
6363
completeness_check("BigCodeBench", data)
6464
return data
6565

66-
def get_bigcodebench_hash(subset="", version="default") -> str:
66+
def get_bigcodebench_hash(subset="full", version="default") -> str:
6767
"""Get the hash of BigCodeBench.
6868
Returns:
6969
str: The hash of BigCodeBench

bigcodebench/data/utils.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -11,8 +11,8 @@
1111
CACHE_DIR = user_cache_dir("bigcodebench")
1212

1313

14-
def get_dataset_metadata(version: str, subset: str=""):
15-
extra = "-" + subset.capitalize() if subset else ""
14+
def get_dataset_metadata(version: str, subset: str="full"):
15+
extra = "-" + subset.capitalize() if subset != "full" else ""
1616
url = f"https://github.com/bigcode-project/bigcodebench-annotation/releases/download/{version}/BigCodeBench{extra}.jsonl.gz"
1717
cache_path = os.path.join(CACHE_DIR, f"BigCodeBench{extra}-{version}.jsonl")
1818
return url, cache_path

bigcodebench/evaluate.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -287,7 +287,7 @@ def main():
287287
parser.add_argument(
288288
"--split", required=True, type=str, choices=["complete", "instruct"]
289289
)
290-
parser.add_argument("--subset", default="", choices=["", "hard"], type=str)
290+
parser.add_argument("--subset", default="full", choices=["full", "hard"], type=str)
291291
parser.add_argument("--samples", required=True, type=str)
292292
parser.add_argument("--parallel", default=None, type=int)
293293
parser.add_argument("--min-time-limit", default=1, type=float)

bigcodebench/generate.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -24,7 +24,7 @@ def codegen(
2424
id_range=None,
2525
resume=True,
2626
):
27-
extra = "-" + subset.capitalize() if subset else ""
27+
extra = "-" + subset.capitalize()
2828
with Progress(
2929
TextColumn(f"BigCodeBench--{split} ({extra}) •" + "[progress.percentage]{task.percentage:>3.0f}%"),
3030
BarColumn(),
@@ -108,7 +108,7 @@ def main():
108108
parser = argparse.ArgumentParser()
109109
parser.add_argument("--model", required=True, type=str)
110110
parser.add_argument("--split", required=True, type=str)
111-
parser.add_argument("--subset", default="", type=str)
111+
parser.add_argument("--subset", default="full", type=str)
112112
parser.add_argument("--save_path", default=None, type=str)
113113
parser.add_argument("--bs", default=1, type=int)
114114
parser.add_argument("--n_samples", default=1, type=int)
@@ -125,7 +125,7 @@ def main():
125125

126126

127127
assert args.split in ["complete", "instruct"], f"Invalid split {args.split}"
128-
assert args.subset in ["", "hard"], f"Invalid subset {args.subset}"
128+
assert args.subset in ["full", "hard"], f"Invalid subset {args.subset}"
129129
assert args.backend in ["vllm", "hf", "openai", "mistral", "anthropic", "google"]
130130

131131
if args.greedy and (args.temperature != 0 or args.bs != 1 or args.n_samples != 1)\

0 commit comments

Comments
 (0)