@@ -17,6 +17,7 @@ def update_model_info(model_info):
1717 for model , info in model_info .items ():
1818 if "https://huggingface.co/" in info ["link" ]:
1919 hf_model = info ["link" ].split ("https://huggingface.co/" )[- 1 ]
20+ print (hf_model )
2021 tokenizer = AutoTokenizer .from_pretrained (hf_model , trust_remote_code = True )
2122 if tokenizer .chat_template is None :
2223 model_info [model ]["direct_complete" ] = True
@@ -315,6 +316,16 @@ def push_ds(ds, path, local=False):
315316 files = []
316317 complete_data , complete_files = read_task_perf ("complete" )
317318 instruct_data , instruct_files = read_task_perf ("instruct" )
319+
320+ complete_map = {model .replace ("-" ,"_" ).replace ("+" ,"_plus" ).replace (" " ,"_" ):
321+ Dataset .from_dict ({"task_id" : list (task_perf .keys ()), "status" : list (task_perf .values ())}) for model , task_perf in complete_data .items ()}
322+ instruct_map = {model .replace ("-" ,"_" ).replace ("+" ,"_plus" ).replace (" " ,"_" ):
323+ Dataset .from_dict ({"task_id" : list (task_perf .keys ()), "status" : list (task_perf .values ())}) for model , task_perf in instruct_data .items ()}
324+ complete_ds = DatasetDict (complete_map )
325+ instruct_ds = DatasetDict (instruct_map )
326+ push_ds (complete_ds , "bigcode/bigcodebench-complete-perf" )
327+ push_ds (instruct_ds , "bigcode/bigcodebench-instruct-perf" )
328+
318329 files .extend (complete_files )
319330 files .extend (instruct_files )
320331 shutil .rmtree ("eval_results" , ignore_errors = True )
0 commit comments