Skip to content

Commit bc7b691

Browse files
author
Kate Ivanova
committed
Update itextcore hyph xml files encoding to utf-8
DEVSIX-6326
1 parent 6874bfa commit bc7b691

File tree

14 files changed

+6851
-6851
lines changed

14 files changed

+6851
-6851
lines changed

itext/itext.hyph/de.xml

Lines changed: 267 additions & 267 deletions
Large diffs are not rendered by default.

itext/itext.hyph/de_DR.xml

Lines changed: 313 additions & 313 deletions
Large diffs are not rendered by default.

itext/itext.hyph/el.xml

Lines changed: 363 additions & 363 deletions
Large diffs are not rendered by default.

itext/itext.hyph/en.xml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
<?xml version="1.0" encoding="US-ASCII"?>
1+
<?xml version="1.0" encoding="utf-8"?>
22
<!--
33
%
44
% Created by Jeff Kingston, 16 November 1996, from a TeX

itext/itext.hyph/en_GB.xml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
<?xml version="1.0" encoding="US-ASCII"?>
1+
<?xml version="1.0" encoding="utf-8"?>
22
<!--
33
%
44
% Created by Jeff Kingston, 16 November 1996, from a TeX

itext/itext.hyph/en_US.xml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
<?xml version="1.0" encoding="US-ASCII"?>
1+
<?xml version="1.0" encoding="utf-8"?>
22
<!--
33
%
44
% Created by Jeff Kingston, 16 November 1996, from a TeX

itext/itext.hyph/es.xml

Lines changed: 48 additions & 48 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
<?xml version="1.0" encoding="iso-8859-1"?>
1+
<?xml version="1.0" encoding="utf-8"?>
22

33
<!-- Adapted by Carlos Villegas from Lout's spanish.lh.
44
Spanish is probably the easiest language to hyphenate!
@@ -53,13 +53,13 @@ wW
5353
xX
5454
yY
5555
zZ
56-
áÁ
57-
éÉ
58-
íÍ
59-
óÓ
60-
úÚ
61-
üÜ
62-
ñÑ
56+
áÁ
57+
éÉ
58+
íÍ
59+
óÓ
60+
úÚ
61+
üÜ
62+
ñÑ
6363
</classes>
6464

6565
<patterns>
@@ -68,7 +68,7 @@ zZ
6868
% Compiled by Julio Sanchez ([email protected]) in September 1991.
6969
%
7070
% These patterns have been derived from "On Word Division in Spanish",
71-
% José A. Mañas, Communications of the ACM, and implemented in his
71+
% José A. Mañas, Communications of the ACM, and implemented in his
7272
% package ftc. You can get ftc and a draft of the abovementioned
7373
% paper from goya.dit.upm.es in src/text.proc/ftc.Z. FTP access may
7474
% be available. Otherwise, send help to [email protected] for
@@ -140,50 +140,50 @@ zZ
140140
% Rule SR2
141141
% Attach vowel groups to left consonant
142142
-->
143-
1ba 1be 1bo 1bá 1bé 1bí 1bó 1bú 1bi 1bu 1bü
144-
1ca 1ce 1co 1cá 1cé 1cí 1có 1cú 1ci 1cu 1cü
145-
1da 1de 1do 1dá 1dé 1dí 1dó 1dú 1di 1du 1dü
146-
1fa 1fe 1fo 1fá 1fé 1fí 1fó 1fú 1fi 1fu 1fü
147-
1ga 1ge 1go 1gá 1gé 1gí 1gó 1gú 1gi 1gu 1gü
148-
1ja 1je 1jo 1já 1jé 1jí 1jó 1jú 1ji 1ju 1jü
149-
1ka 1ke 1ko 1ká 1ké 1kí 1kó 1kú 1ki 1ku 1kü
150-
1la 1le 1lo 1lá 1lé 1lí 1ló 1lú 1li 1lu 1lü
151-
1ma 1me 1mo 1má 1mé 1mí 1mó 1mú 1mi 1mu 1mü
152-
1na 1ne 1no 1ná 1né 1ní 1nó 1nú 1ni 1nu 1nü
153-
1pa 1pe 1po 1pá 1pé 1pí 1pó 1pú 1pi 1pu 1pü
154-
1qa 1qe 1qo 1qá 1qé 1qí 1qó 1qú 1qi 1qu 1qü
155-
1ra 1re 1ro 1rá 1ré 1rí 1ró 1rú 1ri 1ru 1rü
156-
1sa 1se 1so 1sá 1sé 1sí 1só 1sú 1si 1su 1sü
157-
1ta 1te 1to 1tá 1té 1tí 1tó 1tú 1ti 1tu 1tü
158-
1va 1ve 1vo 1vá 1vé 1ví 1vó 1vú 1vi 1vu 1vü
159-
1wa 1we 1wo 1wá 1wé 1wí 1wó 1wú 1wi 1wu 1wü
160-
1xa 1xe 1xo 1xá 1xé 1xí 1xó 1xú 1xi 1xu 1xü
161-
1ya 1ye 1yo 1yá 1yé 1yí 1yó 1yú 1yi 1yu 1yü
162-
1za 1ze 1zo 1zá 1zé 1zí 1zó 1zú 1zi 1zu 1zü
163-
1ña 1ñe 1ño 1ñá 1ñé 1ñí 1ñó 1ñú 1ñi 1ñu 1ñü
143+
1ba 1be 1bo 1bá 1bé 1bí 1bó 1bú 1bi 1bu 1bü
144+
1ca 1ce 1co 1cá 1cé 1cí 1có 1cú 1ci 1cu 1cü
145+
1da 1de 1do 1dá 1dé 1dí 1dó 1dú 1di 1du 1dü
146+
1fa 1fe 1fo 1fá 1fé 1fí 1fó 1fú 1fi 1fu 1fü
147+
1ga 1ge 1go 1gá 1gé 1gí 1gó 1gú 1gi 1gu 1gü
148+
1ja 1je 1jo 1já 1jé 1jí 1jó 1jú 1ji 1ju 1jü
149+
1ka 1ke 1ko 1ká 1ké 1kí 1kó 1kú 1ki 1ku 1kü
150+
1la 1le 1lo 1lá 1lé 1lí 1ló 1lú 1li 1lu 1lü
151+
1ma 1me 1mo 1má 1mé 1mí 1mó 1mú 1mi 1mu 1mü
152+
1na 1ne 1no 1ná 1né 1ní 1nó 1nú 1ni 1nu 1nü
153+
1pa 1pe 1po 1pá 1pé 1pí 1pó 1pú 1pi 1pu 1pü
154+
1qa 1qe 1qo 1qá 1qé 1qí 1qó 1qú 1qi 1qu 1qü
155+
1ra 1re 1ro 1rá 1ré 1rí 1ró 1rú 1ri 1ru 1rü
156+
1sa 1se 1so 1sá 1sé 1sí 1só 1sú 1si 1su 1sü
157+
1ta 1te 1to 1tá 1té 1tí 1tó 1tú 1ti 1tu 1tü
158+
1va 1ve 1vo 1vá 1vé 1ví 1vó 1vú 1vi 1vu 1vü
159+
1wa 1we 1wo 1wá 1wé 1wí 1wó 1wú 1wi 1wu 1wü
160+
1xa 1xe 1xo 1xá 1xé 1xí 1xó 1xú 1xi 1xu 1xü
161+
1ya 1ye 1yo 1yá 1yé 1yí 1yó 1yú 1yi 1yu 1yü
162+
1za 1ze 1zo 1zá 1zé 1zí 1zó 1zú 1zi 1zu 1zü
163+
1ña 1ñe 1ño 1ñá 1ñé 1ñí 1ñó 1ñú 1ñi 1ñu 1ñü
164164
<!--
165165
% Rule SR3
166166
% Build legal consonant groups, leave other consonants bound to
167167
% the previous group. This overrides part of the SR2 pattern
168168
% group.
169169
-->
170-
1c2ha 1c2he 1c2ho 1c2há 1c2hé 1c2hí 1c2hó 1c2hú 1c2hi 1c2hu 1c2hü
171-
1l2la 1l2le 1l2lo 1l2lá 1l2lé 1l2lí 1l2ló 1l2lú 1l2li 1l2lu 1l2lü
172-
1r2ra 1r2re 1r2ro 1r2rá 1r2ré 1r2rí 1r2ró 1r2rú 1r2ri 1r2ru 1r2rü
173-
1b2la 1b2le 1b2lo 1b2lá 1b2lé 1b2lí 1b2ló 1b2lú 1b2li 1b2lu 1b2lü
174-
1b2ra 1b2re 1b2ro 1b2rá 1b2ré 1b2rí 1b2ró 1b2rú 1b2ri 1b2ru 1b2rü
175-
1c2la 1c2le 1c2lo 1c2lá 1c2lé 1c2lí 1c2ló 1c2lú 1c2li 1c2lu 1c2lü
176-
1c2ra 1c2re 1c2ro 1c2rá 1c2ré 1c2rí 1c2ró 1c2rú 1c2ri 1c2ru 1c2rü
177-
1d2ra 1d2re 1d2ro 1d2rá 1d2ré 1d2rí 1d2ró 1d2rú 1d2ri 1d2ru 1d2rü
178-
1f2la 1f2le 1f2lo 1f2lá 1f2lé 1f2lí 1f2ló 1f2lú 1f2li 1f2lu 1f2lü
179-
1f2ra 1f2re 1f2ro 1f2rá 1f2ré 1f2rí 1f2ró 1f2rú 1f2ri 1f2ru 1f2rü
180-
1g2la 1g2le 1g2lo 1g2lá 1g2lé 1g2lí 1g2ló 1g2lú 1g2li 1g2lu 1g2lü
181-
1g2ra 1g2re 1g2ro 1g2rá 1g2ré 1g2rí 1g2ró 1g2rú 1g2ri 1g2ru 1g2rü
182-
1k2la 1k2le 1k2lo 1k2lá 1k2lé 1k2lí 1k2ló 1k2lú 1k2li 1k2lu 1k2lü
183-
1k2ra 1k2re 1k2ro 1k2rá 1k2ré 1k2rí 1k2ró 1k2rú 1k2ri 1k2ru 1k2rü
184-
1p2la 1p2le 1p2lo 1p2lá 1p2lé 1p2lí 1p2ló 1p2lú 1p2li 1p2lu 1p2lü
185-
1p2ra 1p2re 1p2ro 1p2rá 1p2ré 1p2rí 1p2ró 1p2rú 1p2ri 1p2ru 1p2rü
186-
1t2ra 1t2re 1t2ro 1t2rá 1t2ré 1t2rí 1t2ró 1t2rú 1t2ri 1t2ru 1t2rü
170+
1c2ha 1c2he 1c2ho 1c2há 1c2hé 1c2hí 1c2hó 1c2hú 1c2hi 1c2hu 1c2hü
171+
1l2la 1l2le 1l2lo 1l2lá 1l2lé 1l2lí 1l2ló 1l2lú 1l2li 1l2lu 1l2lü
172+
1r2ra 1r2re 1r2ro 1r2rá 1r2ré 1r2rí 1r2ró 1r2rú 1r2ri 1r2ru 1r2rü
173+
1b2la 1b2le 1b2lo 1b2lá 1b2lé 1b2lí 1b2ló 1b2lú 1b2li 1b2lu 1b2lü
174+
1b2ra 1b2re 1b2ro 1b2rá 1b2ré 1b2rí 1b2ró 1b2rú 1b2ri 1b2ru 1b2rü
175+
1c2la 1c2le 1c2lo 1c2lá 1c2lé 1c2lí 1c2ló 1c2lú 1c2li 1c2lu 1c2lü
176+
1c2ra 1c2re 1c2ro 1c2rá 1c2ré 1c2rí 1c2ró 1c2rú 1c2ri 1c2ru 1c2rü
177+
1d2ra 1d2re 1d2ro 1d2rá 1d2ré 1d2rí 1d2ró 1d2rú 1d2ri 1d2ru 1d2rü
178+
1f2la 1f2le 1f2lo 1f2lá 1f2lé 1f2lí 1f2ló 1f2lú 1f2li 1f2lu 1f2lü
179+
1f2ra 1f2re 1f2ro 1f2rá 1f2ré 1f2rí 1f2ró 1f2rú 1f2ri 1f2ru 1f2rü
180+
1g2la 1g2le 1g2lo 1g2lá 1g2lé 1g2lí 1g2ló 1g2lú 1g2li 1g2lu 1g2lü
181+
1g2ra 1g2re 1g2ro 1g2rá 1g2ré 1g2rí 1g2ró 1g2rú 1g2ri 1g2ru 1g2rü
182+
1k2la 1k2le 1k2lo 1k2lá 1k2lé 1k2lí 1k2ló 1k2lú 1k2li 1k2lu 1k2lü
183+
1k2ra 1k2re 1k2ro 1k2rá 1k2ré 1k2rí 1k2ró 1k2rú 1k2ri 1k2ru 1k2rü
184+
1p2la 1p2le 1p2lo 1p2lá 1p2lé 1p2lí 1p2ló 1p2lú 1p2li 1p2lu 1p2lü
185+
1p2ra 1p2re 1p2ro 1p2rá 1p2ré 1p2rí 1p2ró 1p2rú 1p2ri 1p2ru 1p2rü
186+
1t2ra 1t2re 1t2ro 1t2rá 1t2ré 1t2rí 1t2ró 1t2rú 1t2ri 1t2ru 1t2rü
187187
<!--
188188
% Rule SR4 is implicitly implemented by the default values
189189
% Rule HE1 is implemented by TeX parameters \lefthyphenmin and
@@ -193,7 +193,7 @@ zZ
193193
% Rule HE2
194194
% Break between a consonant and an h
195195
-->
196-
b1h d1h f1h g1h j1h k1h l1h m1h n1h p1h q1h r1h s1h t1h v1h w1h x1h y1h z1h ñ1h
196+
b1h d1h f1h g1h j1h k1h l1h m1h n1h p1h q1h r1h s1h t1h v1h w1h x1h y1h z1h ñ1h
197197
<!-- % We now avoid some problematic breaks. -->
198198
su2b2r su2b2l
199199
<!--

itext/itext.hyph/fi.xml

Lines changed: 57 additions & 57 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
<?xml version="1.0" encoding="iso-8859-1"?>
1+
<?xml version="1.0" encoding="utf-8"?>
22
<!-- Constructed by Jarno Elovirta from fi8hyph.tex file:
33
44
% fi8hyph.tex, based on fihyph.tex
@@ -53,8 +53,8 @@ wW
5353
xX
5454
yY
5555
zZ
56-
äÄ
57-
öÖ
56+
äÄ
57+
öÖ
5858
</classes>
5959
<patterns>
6060
1be
@@ -68,8 +68,8 @@ zZ
6868
1do
6969
1du
7070
1dy
71-
1dä
72-
1dö
71+
1dä
72+
1dö
7373
1fa
7474
1fe
7575
1fi
@@ -82,96 +82,96 @@ zZ
8282
1go
8383
1gu
8484
1gy
85-
1gä
86-
1gö
85+
1gä
86+
1gö
8787
1ha
8888
1he
8989
1hi
9090
1ho
9191
1hu
9292
1hy
93-
1hä
94-
1hö
93+
1hä
94+
1hö
9595
1ja
9696
1je
9797
1ji
9898
1jo
9999
1ju
100100
1jy
101-
1jä
102-
1jö
101+
1jä
102+
1jö
103103
1ka
104104
1ke
105105
1ki
106106
1ko
107107
1ku
108108
1ky
109-
1kä
110-
1kö
109+
1kä
110+
1kö
111111
1la
112112
1le
113113
1li
114114
1lo
115115
1lu
116116
1ly
117-
1lä
118-
1lö
117+
1lä
118+
1lö
119119
1ma
120120
1me
121121
1mi
122122
1mo
123123
1mu
124124
1my
125-
1mä
126-
1mö
125+
1mä
126+
1mö
127127
1na
128128
1ne
129129
1ni
130130
1no
131131
1nu
132132
1ny
133-
1nä
134-
1nö
133+
1nä
134+
1nö
135135
1pa
136136
1pe
137137
1pi
138138
1po
139139
1pu
140140
1py
141-
1pä
142-
1pö
141+
1pä
142+
1pö
143143
1ra
144144
1re
145145
1ri
146146
1ro
147147
1ru
148148
1ry
149-
1rä
150-
1rö
149+
1rä
150+
1rö
151151
1sa
152152
1se
153153
1si
154154
1so
155155
1su
156156
1sy
157-
1sä
158-
1sö
157+
1sä
158+
1sö
159159
1ta
160160
1te
161161
1ti
162162
1to
163163
1tu
164164
1ty
165-
1tä
166-
1tö
165+
1tä
166+
1tö
167167
1va
168168
1ve
169169
1vi
170170
1vo
171171
1vu
172172
1vy
173-
1vä
174-
1vö
173+
1vä
174+
1vö
175175
<!-- % ======= Some common words borrowed from other languages ======= -->
176176
<!-- % ======= This part could be updated from time to time ======= -->
177177
<!-- % -->
@@ -180,29 +180,29 @@ zZ
180180
<!-- % ====== Some special cases occurring with compound words only ==== -->
181181
<!-- % ====== There still remains a well-known problem with words such as 'kaivos\-aukko' etc. -->
182182
<!-- %a1y (common in borrowed words) -->
183-
ä2y
183+
ä2y
184184
y1a2
185185
y1o2
186186
o1y
187-
ö2y
187+
ö2y
188188
u1y2
189189
y1u2
190-
ö3a2
191-
ö3o2
192-
ä3a2
193-
ä3o2
194-
ä1u2
195-
ö1u2
196-
a1ä <!-- % (a1ä2 ei mahdollinen!) -->
197-
a1ö
198-
o1ä
199-
o1ö
200-
u1ä2
201-
u1ö2
202-
ä2ä
203-
ö2ö
204-
ä2ö
205-
ö2ä
190+
ö3a2
191+
ö3o2
192+
ä3a2
193+
ä3o2
194+
ä1u2
195+
ö1u2
196+
a1ä <!-- % (a1ä2 ei mahdollinen!) -->
197+
a1ö
198+
o1ä
199+
o1ö
200+
u1ä2
201+
u1ö2
202+
ä2ä
203+
ö2ö
204+
ä2ö
205+
ö2ä
206206
<!-- % lyhyt/pitka -vokaalipareja, tavallisesti sanarajalla -->
207207
aa1i2 <!-- % maa-ikkuna -->
208208
aa1e2
@@ -228,13 +228,13 @@ a1uu <!-- % kala-uuni -->
228228
i1uu <!-- % ravi-uutiset -->
229229
e1uu <!-- % virhe-uutinen -->
230230
o1uu <!-- % radio-uutiset -->
231-
ää1i
232-
ää1e
233-
ää3y
234-
i1ää
235-
e1ää
236-
y1ää
237-
i1öö <!-- % yhti-öön etc. -->
231+
ää1i
232+
ää1e
233+
ää3y
234+
i1ää
235+
e1ää
236+
y1ää
237+
i1öö <!-- % yhti-öön etc. -->
238238
<!-- %i1eu % keski-eurooppalainen -->
239239
<!-- % vokaalikolmikkoja etc. yhdyssanojen rajoissa -->
240240
<!-- % =======- vowel triples by Fred Karlsson -->
@@ -274,9 +274,9 @@ uo1a
274274
<!-- % uo1i % ambiguous -->
275275
uo1u
276276
<!-- % ================ End of vowel triples ==================== -->
277-
e1ö2
278-
ö1e2
279-
.ä2 <!-- % don't hyphenate ä-lyllinen etc. -->
277+
e1ö2
278+
ö1e2
279+
.ä2 <!-- % don't hyphenate ä-lyllinen etc. -->
280280
<!-- % -->
281281
<!-- % The following patterns contain no general scientific rule. They -->
282282
<!-- % are selected more or less intuitively to solve problems -->

0 commit comments

Comments
 (0)