@@ -468,20 +468,19 @@ def validate_doc_reqs(data):
468468 os .makedirs ("data/processed" , exist_ok = True )
469469 with open ("data/open-eval.jsonl" , "w" ) as f :
470470 for i , file in enumerate (tqdm (glob ("data/clean/*.py" ))):
471- if "zhihan" in file :
472- data = extract_content (file , f"f_{ i } " )
473- if not validate_lib_num (data ):
474- print (file .replace ('clean/' , 'raw/' ), "Less than 2 libraries are used" )
475- if not validate_doc_example (data ):
476- print (file .replace ('clean/' , 'raw/' ), "Example is missing" )
477- if not validate_doc_returns (data ):
478- print (file .replace ('clean/' , 'raw/' ), "Returns is missing" )
479- if not validate_doc_reqs (data ):
480- print (file .replace ('clean/' , 'raw/' ), "Requirements is missing" )
481- if not evaluate_test_class (data ["prompt" ] + "\n \n " + data ["test" ]):
482- print (file .replace ('clean/' , 'raw/' ), "TestCases class is missing" )
483- f .write (json .dumps (data ) + "\n " )
484- file_name = file .split ("/" )[- 1 ].split ("." )[0 ]
485- file_name = file_name + "_wo_doc" if check_test_wo_doc (data ) else file_name + "_w_doc"
486- with open (f"data/processed/{ file_name } .py" , "w" ) as f2 :
487- f2 .write (reconstruct_problem (data ))
471+ data = extract_content (file , f"f_{ i } " )
472+ if not validate_lib_num (data ):
473+ print (file .replace ('clean/' , 'raw/' ), "Less than 2 libraries are used" )
474+ if not validate_doc_example (data ):
475+ print (file .replace ('clean/' , 'raw/' ), "Example is missing" )
476+ if not validate_doc_returns (data ):
477+ print (file .replace ('clean/' , 'raw/' ), "Returns is missing" )
478+ if not validate_doc_reqs (data ):
479+ print (file .replace ('clean/' , 'raw/' ), "Requirements is missing" )
480+ if not evaluate_test_class (data ["prompt" ] + "\n \n " + data ["test" ]):
481+ print (file .replace ('clean/' , 'raw/' ), "TestCases class is missing" )
482+ f .write (json .dumps (data ) + "\n " )
483+ file_name = file .split ("/" )[- 1 ].split ("." )[0 ]
484+ file_name = file_name + "_wo_doc" if check_test_wo_doc (data ) else file_name + "_w_doc"
485+ with open (f"data/processed/{ file_name } .py" , "w" ) as f2 :
486+ f2 .write (reconstruct_problem (data ))
0 commit comments