We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
2 parents d0c0e51 + 66e8aca commit 7ac492b (Copy full SHA for 7ac492b)
nltk/tokenize/punkt.py
@@ -1761,7 +1761,7 @@ def load_punkt_params(lang_dir):
1761
# Make a new Parameters object:
1762
params = PunktParameters()
1763
with open(f"{lang_dir}/collocations.tab", encoding="utf-8") as f:
1764
- params.collocations = pdec.tab2tups(f)
+ params.collocations = set(pdec.tab2tups(f))
1765
with open(f"{lang_dir}/sent_starters.txt", encoding="utf-8") as f:
1766
params.sent_starters = pdec.txt2set(f)
1767
with open(f"{lang_dir}/abbrev_types.txt", encoding="utf-8") as f:
0 commit comments