Skip to content

Commit 67efc81

Browse files
Merge pull request #4 from wellcometrust/ivyleavedtoadflax/add_missing_test
new: Add missing test
2 parents a58cb95 + 7872fcd commit 67efc81

File tree

1 file changed

+51
-0
lines changed

1 file changed

+51
-0
lines changed

tests/test_labels_to_prodigy.py

Lines changed: 51 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,51 @@
1+
#!/usr/bin/env python3
2+
# coding: utf-8
3+
4+
from deep_reference_parser.reference_utils import labels_to_prodigy
5+
6+
def test_labels_to_prodigy():
    """Check labels_to_prodigy on a single tokenised reference.

    One sequence of ten tokens and its ten per-token labels are passed in,
    and the result must equal a one-element list holding a dict with
    ``text``, ``tokens``, ``spans`` and ``meta`` entries.
    """
    # A single reference, already split into tokens (one inner list per line).
    tokens = [
        ["Ackerman", "J", ".", "S", ".,", "Palladio", ",", "Torino", "1972", "."],
    ]

    # One label per token, aligned by position with ``tokens``.
    labels = [
        ["b-r", "i-r", "i-r", "i-r", "i-r", "i-r", "i-r", "i-r", "i-r", "e-r"],
    ]

    # The start/end offsets below index into ``text``, which is the tokens
    # joined by single spaces; each span covers exactly one token.
    expected_docs = [
        {
            "text": "Ackerman J . S ., Palladio , Torino 1972 .",
            "tokens": [
                {"text": "Ackerman", "id": 0, "start": 0, "end": 8},
                {"text": "J", "id": 1, "start": 9, "end": 10},
                {"text": ".", "id": 2, "start": 11, "end": 12},
                {"text": "S", "id": 3, "start": 13, "end": 14},
                {"text": ".,", "id": 4, "start": 15, "end": 17},
                {"text": "Palladio", "id": 5, "start": 18, "end": 26},
                {"text": ",", "id": 6, "start": 27, "end": 28},
                {"text": "Torino", "id": 7, "start": 29, "end": 35},
                {"text": "1972", "id": 8, "start": 36, "end": 40},
                {"text": ".", "id": 9, "start": 41, "end": 42},
            ],
            "spans": [
                {"label": "b-r", "start": 0, "end": 8, "token_start": 0, "token_end": 0},
                {"label": "i-r", "start": 9, "end": 10, "token_start": 1, "token_end": 1},
                {"label": "i-r", "start": 11, "end": 12, "token_start": 2, "token_end": 2},
                {"label": "i-r", "start": 13, "end": 14, "token_start": 3, "token_end": 3},
                {"label": "i-r", "start": 15, "end": 17, "token_start": 4, "token_end": 4},
                {"label": "i-r", "start": 18, "end": 26, "token_start": 5, "token_end": 5},
                {"label": "i-r", "start": 27, "end": 28, "token_start": 6, "token_end": 6},
                {"label": "i-r", "start": 29, "end": 35, "token_start": 7, "token_end": 7},
                {"label": "i-r", "start": 36, "end": 40, "token_start": 8, "token_end": 8},
                {"label": "e-r", "start": 41, "end": 42, "token_start": 9, "token_end": 9},
            ],
            "meta": {"line": 0},
        },
    ]

    result = labels_to_prodigy(tokens, labels)

    assert result == expected_docs
51+

0 commit comments

Comments
 (0)