Skip to content

Commit 0b309e6

Browse files
chg: Capture repeated tokens in test
1 parent d8f060d commit 0b309e6

File tree

1 file changed

+29
-1
lines changed

1 file changed

+29
-1
lines changed

tests/prodigy/test_reference_to_token_annotations.py

Lines changed: 29 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -210,7 +210,7 @@ def test_reference_spans_ii(splitter):
210210
assert out == after
211211

212212

213-
def test_reference_spans_author(splitter):
213+
def test_reference_spans_parsing(splitter):
214214

215215
tokens = [
216216
{"start": 0, "end": 0, "id": 0},
@@ -236,6 +236,34 @@ def test_reference_spans_author(splitter):
236236

237237
assert out == after
238238

239+
def test_reference_spans_parsing_single_token(splitter):
    """Single-token spans pass through ``reference_spans`` unchanged.

    Every span in the input covers exactly one token
    (``token_start == token_end``). With ``task="parsing"`` the output is
    expected to be equal to the spans that were passed in.
    """

    # Seven one-character tokens whose offsets coincide with their ids (0..6).
    tokens = [{"start": i, "end": i, "id": i} for i in range(7)]

    spans = [
        {"start": 2, "end": 2, "token_start": 2, "token_end": 2, "label": "author"},
        {"start": 4, "end": 4, "token_start": 4, "token_end": 4, "label": "year"},
    ]

    # Kept as an independent literal (not an alias of ``spans``) so that an
    # in-place mutation of the input by the code under test is still detected.
    expected = [
        {"start": 2, "end": 2, "token_start": 2, "token_end": 2, "label": "author"},
        {"start": 4, "end": 4, "token_start": 4, "token_end": 4, "label": "year"},
    ]

    actual = splitter.reference_spans(spans, tokens, task="parsing")

    # No debug print needed: pytest shows both operands when this fails.
    assert actual == expected
266+
239267

240268
def test_outside_spans(splitter):
241269

0 commit comments

Comments
 (0)