Skip to content

Commit c526883

Browse files
committed
print out update tokenizer
1 parent 60c752b commit c526883

File tree

1 file changed

+11
-0
lines changed

1 file changed

+11
-0
lines changed

analysis/get_results.py

Lines changed: 11 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -17,6 +17,7 @@ def update_model_info(model_info):
1717
for model, info in model_info.items():
1818
if "https://huggingface.co/" in info["link"]:
1919
hf_model = info["link"].split("https://huggingface.co/")[-1]
20+
print(hf_model)
2021
tokenizer = AutoTokenizer.from_pretrained(hf_model, trust_remote_code=True)
2122
if tokenizer.chat_template is None:
2223
model_info[model]["direct_complete"] = True
@@ -315,6 +316,16 @@ def push_ds(ds, path, local=False):
315316
files = []
316317
complete_data, complete_files = read_task_perf("complete")
317318
instruct_data, instruct_files = read_task_perf("instruct")
319+
320+
complete_map = {model.replace("-","_").replace("+","_plus").replace(" ","_"):
321+
Dataset.from_dict({"task_id": list(task_perf.keys()), "status": list(task_perf.values())}) for model, task_perf in complete_data.items()}
322+
instruct_map = {model.replace("-","_").replace("+","_plus").replace(" ","_"):
323+
Dataset.from_dict({"task_id": list(task_perf.keys()), "status": list(task_perf.values())}) for model, task_perf in instruct_data.items()}
324+
complete_ds = DatasetDict(complete_map)
325+
instruct_ds = DatasetDict(instruct_map)
326+
push_ds(complete_ds, "bigcode/bigcodebench-complete-perf")
327+
push_ds(instruct_ds, "bigcode/bigcodebench-instruct-perf")
328+
318329
files.extend(complete_files)
319330
files.extend(instruct_files)
320331
shutil.rmtree("eval_results", ignore_errors=True)

0 commit comments

Comments
 (0)