Skip to content

Commit d2d514b

Browse files
committed
update to LT 6.1
1 parent 59c9f2a commit d2d514b

File tree

8 files changed: 14 additions and 22 deletions.

gradle.properties

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
1-
ltVersion=6.0
2-
ltUkVersion=6.0
1+
ltVersion=6.1
2+
ltUkVersion=6.1
33
#ltUkVersion=6.1-SNAPSHOT
44
groovyVersion=4.0.10
55
# nlp_uk version
6-
version=3.1.2-SNAPSHOT
6+
version=3.2.1

src/main/groovy/ua/net/nlp/bruk/ContextToken.groovy

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -135,9 +135,8 @@ class ContextToken {
135135
return w
136136
}
137137

138-
private static final USE_RIGHT_CTX_PATTERN = ~/є|її|це|саме|всередині|перед|протягом|брати|англійською|українською|рівні|доросл.*/
138+
private static final USE_RIGHT_CTX_PATTERN = ~/є|її|це|саме|[ву]с[еі]|всередині|перед|протягом|брати|англійською|українською|рівні|доросл.*/
139139

140-
@CompileStatic
141140
static boolean useRightContext(String token) {
142141
// token.toLowerCase() ==~ /це|його|її|їх|як|є|саме|все/
143142
token.toLowerCase() ==~ USE_RIGHT_CTX_PATTERN

src/main/groovy/ua/net/nlp/other/CleanText.groovy

Lines changed: 2 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -24,10 +24,8 @@ package ua.net.nlp.other
2424
// mark/rate or remove Russian paragraphs
2525

2626
@GrabConfig(systemClassLoader=true)
27-
@Grab(group='org.languagetool', module='language-uk', version='6.0')
28-
//@Grab(group='ua.net.nlp', module='morfologik-ukrainian-lt', version='6.1.0-SNAPSHOT')
29-
//@Grab(group='org.languagetool', module='language-uk', version='6.1-SNAPSHOT')
30-
@Grab(group='org.languagetool', module='language-ru', version='6.0')
27+
@Grab(group='org.languagetool', module='language-uk', version='6.1')
28+
@Grab(group='org.languagetool', module='language-ru', version='6.1')
3129
@Grab(group='ch.qos.logback', module='logback-classic', version='1.4.+')
3230
@Grab(group='info.picocli', module='picocli', version='4.6.+')
3331

src/main/groovy/ua/net/nlp/tools/TagText.groovy

Lines changed: 2 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -3,10 +3,8 @@
33
package ua.net.nlp.tools
44

55
@GrabConfig(systemClassLoader=true)
6-
@Grab(group='org.languagetool', module='language-uk', version='6.0')
7-
//@Grab(group='org.languagetool', module='language-uk', version='6.1-SNAPSHOT')
8-
//@Grab(group='ua.net.nlp', module='morfologik-ukrainian-lt', version='6.0.2-SNAPSHOT')
9-
@Grab(group='org.languagetool', module='language-ru', version='6.0')
6+
@Grab(group='org.languagetool', module='language-uk', version='6.1')
7+
@Grab(group='org.languagetool', module='language-ru', version='6.1')
108
@Grab(group='ch.qos.logback', module='logback-classic', version='1.4.+')
119
@Grab(group='info.picocli', module='picocli', version='4.6.+')
1210

src/main/groovy/ua/net/nlp/tools/tag/DisambigStats.groovy

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -24,7 +24,7 @@ public class DisambigStats {
2424
private static final Pattern UPPERCASED_PATTERN = Pattern.compile(/[А-ЯІЇЄҐ][а-яіїєґ'-]+/)
2525
private static final boolean USE_SUFFIX_2 = false
2626
private static final String statsFile = "/ua/net/nlp/tools/stats/lemma_freqs_hom.txt"
27-
static final String statsVersion = "3.1.2"
27+
static final String statsVersion = "3.2.1"
2828

2929
boolean disambigBySuffix = true //DisambigModule.wordEnding in options.disambiguate
3030
boolean disambigByContext = true

src/test/groovy/ua/net/nlp/tools/TagTextSemTest.groovy

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -37,7 +37,6 @@ class TagTextSemTest {
3737
<token value="усе" lemma="усе" tags="adv" semtags="1:dur:max" />
3838
<token value="усе" lemma="усе" tags="noun:inanim:n:v_naz:&amp;pron:gen" semtags="1:quantif" />
3939
<token value="усе" lemma="усе" tags="noun:inanim:n:v_zna:&amp;pron:gen" semtags="1:quantif" />
40-
<token value="усе" lemma="усе" tags="part" />
4140
<token value="усе" lemma="увесь" tags="adj:n:v_naz:&amp;pron:gen" semtags="1:quantif" />
4241
<token value="усе" lemma="увесь" tags="adj:n:v_zna:&amp;pron:gen" semtags="1:quantif" />
4342
</tokenReading>

src/test/groovy/ua/net/nlp/tools/TagTextUnknownTest.groovy

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -47,11 +47,11 @@ public class TagTextUnknownTest {
4747
"""
4848
assertEquals expected, tagged.tagged
4949

50-
tagged = tagText.tagText("аквамарафон")
50+
tagged = tagText.tagText("стратомарафон")
5151

5252
expected =
5353
"""<sentence>
54-
<token value="аквамарафон" lemma="аквамарафон" tags="noun:inanim:m:v_zna" q="-0.5" />
54+
<token value="стратомарафон" lemma="стратомарафон" tags="noun:inanim:m:v_zna" q="-0.5" />
5555
</sentence>
5656
<paragraph/>
5757
"""
@@ -176,12 +176,12 @@ public class TagTextUnknownTest {
176176
//"""
177177
// assertEquals expected, tagged.tagged
178178

179-
tagged = tagText.tagText("Наталія Галібаренко")
179+
tagged = tagText.tagText("Наталія Алібаренко")
180180

181181
expected =
182182
"""<sentence>
183183
<token value="Наталія" lemma="Наталія" tags="noun:anim:f:v_naz:prop:fname" />
184-
<token value="Галібаренко" lemma="Галібаренко" tags="noun:anim:f:v_naz:nv:prop:lname" q="-0.5" />
184+
<token value="Алібаренко" lemma="Алібаренко" tags="noun:anim:f:v_naz:nv:prop:lname" q="-0.5" />
185185
</sentence>
186186
<paragraph/>
187187
"""

src/test/resources/tag/unknown.txt

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -52,7 +52,7 @@
5252
ст
5353
ред
5454
ій
55-
СОКЕРЧАК
55+
СОКУРЧАК
5656
Тел
5757
Со
5858
года
@@ -94,7 +94,6 @@
9494
лі
9595
лет
9696
пе
97-
Ейрін
9897
дес
9998
стр
10099
см-1
@@ -146,7 +145,6 @@
146145
они
147146
пов
148147
зап
149-
Гальярдо
150148
#племени
151149
куда
152150
#Русского

0 commit comments

Comments
 (0)