Skip to content

Commit 29c877a

Browse files
committed
update: update parse.py to process all files
1 parent 5b58335 commit 29c877a

File tree

1 file changed

+16
-17
lines changed

1 file changed

+16
-17
lines changed

script/parse.py

Lines changed: 16 additions & 17 deletions
Original file line number | Diff line number | Diff line change
@@ -468,20 +468,19 @@ def validate_doc_reqs(data):
468 468
os.makedirs("data/processed", exist_ok=True)
469 469
with open("data/open-eval.jsonl", "w") as f:
470 470
for i, file in enumerate(tqdm(glob("data/clean/*.py"))):
471-
if "zhihan" in file:
472-
data = extract_content(file, f"f_{i}")
473-
if not validate_lib_num(data):
474-
print(file.replace('clean/', 'raw/'), "Less than 2 libraries are used")
475-
if not validate_doc_example(data):
476-
print(file.replace('clean/', 'raw/'), "Example is missing")
477-
if not validate_doc_returns(data):
478-
print(file.replace('clean/', 'raw/'), "Returns is missing")
479-
if not validate_doc_reqs(data):
480-
print(file.replace('clean/', 'raw/'), "Requirements is missing")
481-
if not evaluate_test_class(data["prompt"] + "\n\n" + data["test"]):
482-
print(file.replace('clean/', 'raw/'), "TestCases class is missing")
483-
f.write(json.dumps(data) + "\n")
484-
file_name = file.split("/")[-1].split(".")[0]
485-
file_name = file_name + "_wo_doc" if check_test_wo_doc(data) else file_name + "_w_doc"
486-
with open(f"data/processed/{file_name}.py", "w") as f2:
487-
f2.write(reconstruct_problem(data))
471+
data = extract_content(file, f"f_{i}")
472+
if not validate_lib_num(data):
473+
print(file.replace('clean/', 'raw/'), "Less than 2 libraries are used")
474+
if not validate_doc_example(data):
475+
print(file.replace('clean/', 'raw/'), "Example is missing")
476+
if not validate_doc_returns(data):
477+
print(file.replace('clean/', 'raw/'), "Returns is missing")
478+
if not validate_doc_reqs(data):
479+
print(file.replace('clean/', 'raw/'), "Requirements is missing")
480+
if not evaluate_test_class(data["prompt"] + "\n\n" + data["test"]):
481+
print(file.replace('clean/', 'raw/'), "TestCases class is missing")
482+
f.write(json.dumps(data) + "\n")
483+
file_name = file.split("/")[-1].split(".")[0]
484+
file_name = file_name + "_wo_doc" if check_test_wo_doc(data) else file_name + "_w_doc"
485+
with open(f"data/processed/{file_name}.py", "w") as f2:
486+
f2.write(reconstruct_problem(data))

0 commit comments

Comments
 (0)