Skip to content

Commit ffd3013

Browse files
committed
update fr-litbank dataset loading
1 parent 148e564 commit ffd3013

File tree

1 file changed

+4 -8 lines changed

1 file changed

+4 -8 lines changed

tibert/bertcoref.py

Lines changed: 4 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -332,9 +332,9 @@ def torch_call(self, features) -> Union[dict, BatchEncoding]:
332 332
# same length yet.
333 333
return_tensors=None,
334 334
)
335-
self.tokenizer.deprecation_warnings[
336-
"Asking-to-pad-a-fast-tokenizer"
337-
] = warning_state
335+
self.tokenizer.deprecation_warnings["Asking-to-pad-a-fast-tokenizer"] = (
336+
warning_state
337+
)
338 338

339 339
# keep encoding info
340 340
batch._encodings = [f.encodings[0] for f in features]
@@ -686,11 +686,7 @@ def load_fr_litbank_dataset(
686 686
):
687 687
root_path = os.path.expanduser(root_path.rstrip("/"))
688 688
return CoreferenceDataset.from_sacr_dir(
689-
f"{root_path}/sacr/Pers_Entites",
690-
tokenizer,
691-
max_span_size,
692-
"en",
693-
ignored_files=["schema.sacr", "elisabeth_Seton.sacr"],
689+
f"{root_path}/sacr/annot_nested/annotInitiale", tokenizer, max_span_size, "fr"
694 690
)
695 691

696 692

0 commit comments

Comments (0)