Skip to content

Commit d27767d

Browse files
authored
Update parsed_to_df.py
1 parent 8a001a6 commit d27767d

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

cadmus/post_retrieval/parsed_to_df.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -13,7 +13,7 @@ def parsed_to_df(path = './output/retrieved_parsed_files/content_text/'):
13 13   files.append(command[i].split()[-1][:-4])
14 14   content_text = []
15 15   for i in range(len(files)):
16    - with zipfile.ZipFile(f"{path}/{files[i]}.txt.zip", "r") as z:
   16 + with zipfile.ZipFile(f"{path}/{files[i]}.zip", "r") as z:
17 17   for filename in z.namelist():
18 18   with z.open(filename) as f:
19 19   d = f.read()
@@ -23,4 +23,4 @@ def parsed_to_df(path = './output/retrieved_parsed_files/content_text/'):
23 23   z.close()
24 24   df = pd.DataFrame(content_text, columns=["content_text"])
25 25   df.index = files
26    - return df
   26 + return df

0 commit comments

Comments
 (0)