|
17 | 17 | Note: Unit tests for this module can be found in test/unit/test_senna.py |
18 | 18 |
|
19 | 19 | >>> from nltk.tag import SennaTagger |
20 | | ->>> tagger = SennaTagger('/usr/share/senna-v3.0') |
| 20 | +>>> tagger = SennaTagger('/usr/share/senna-v3.0') # doctest: +SKIP |
21 | 21 | >>> tagger.tag('What is the airspeed of an unladen swallow ?'.split()) # doctest: +SKIP |
22 | 22 | [('What', 'WP'), ('is', 'VBZ'), ('the', 'DT'), ('airspeed', 'NN'), |
23 | 23 | ('of', 'IN'), ('an', 'DT'), ('unladen', 'NN'), ('swallow', 'NN'), ('?', '.')] |
24 | 24 |
|
25 | 25 | >>> from nltk.tag import SennaChunkTagger |
26 | | ->>> chktagger = SennaChunkTagger('/usr/share/senna-v3.0') |
| 26 | +>>> chktagger = SennaChunkTagger('/usr/share/senna-v3.0') # doctest: +SKIP |
27 | 27 | >>> chktagger.tag('What is the airspeed of an unladen swallow ?'.split()) # doctest: +SKIP |
28 | 28 | [('What', 'B-NP'), ('is', 'B-VP'), ('the', 'B-NP'), ('airspeed', 'I-NP'), |
29 | 29 | ('of', 'B-PP'), ('an', 'B-NP'), ('unladen', 'I-NP'), ('swallow', 'I-NP'), |
30 | 30 | ('?', 'O')] |
31 | 31 |
|
32 | 32 | >>> from nltk.tag import SennaNERTagger |
33 | | ->>> nertagger = SennaNERTagger('/usr/share/senna-v3.0') |
| 33 | +>>> nertagger = SennaNERTagger('/usr/share/senna-v3.0') # doctest: +SKIP |
34 | 34 | >>> nertagger.tag('Shakespeare theatre was in London .'.split()) # doctest: +SKIP |
35 | 35 | [('Shakespeare', 'B-PER'), ('theatre', 'O'), ('was', 'O'), ('in', 'O'), |
36 | 36 | ('London', 'B-LOC'), ('.', 'O')] |
@@ -80,14 +80,14 @@ def bio_to_chunks(self, tagged_sent, chunk_type): |
80 | 80 | Extracts the chunks in a BIO chunk-tagged sentence. |
81 | 81 |
|
82 | 82 | >>> from nltk.tag import SennaChunkTagger |
83 | | - >>> chktagger = SennaChunkTagger('/usr/share/senna-v3.0') |
| 83 | + >>> chktagger = SennaChunkTagger('/usr/share/senna-v3.0') # doctest: +SKIP |
84 | 84 | >>> sent = 'What is the airspeed of an unladen swallow ?'.split() |
85 | | - >>> tagged_sent = chktagger.tag(sent) # doctest: +SKIP |
86 | | - >>> tagged_sent # doctest: +SKIP |
| 85 | + >>> tagged_sent = chktagger.tag(sent) # doctest: +SKIP |
| 86 | + >>> tagged_sent # doctest: +SKIP |
87 | 87 | [('What', 'B-NP'), ('is', 'B-VP'), ('the', 'B-NP'), ('airspeed', 'I-NP'), |
88 | 88 | ('of', 'B-PP'), ('an', 'B-NP'), ('unladen', 'I-NP'), ('swallow', 'I-NP'), |
89 | 89 | ('?', 'O')] |
90 | | - >>> list(chktagger.bio_to_chunks(tagged_sent, chunk_type='NP')) # doctest: +SKIP |
| 90 | + >>> list(chktagger.bio_to_chunks(tagged_sent, chunk_type='NP')) # doctest: +SKIP |
91 | 91 | [('What', '0'), ('the airspeed', '2-3'), ('an unladen swallow', '5-6-7')] |
92 | 92 |
|
93 | 93 | :param tagged_sent: A list of tuples of word and BIO chunk tag. |
|
0 commit comments