Skip to content

Commit 0dfdb8f

Browse files
committed
Partial utf8proc porting progress
* Data generator from JuliaStrings/utf8proc#258
* Partial porting progress of utf8proc functions to Julia
* Some APIs from Base.Unicode and Unicode stdlib
1 parent 29404aa commit 0dfdb8f

File tree

7 files changed

+18955
-1
lines changed

7 files changed

+18955
-1
lines changed

data/Makefile

Lines changed: 51 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,51 @@
# Unicode data generation rules. Except for the test data files, most
# users will not use these Makefile rules, which are primarily to re-generate
# data.jl when we get a new Unicode version or charwidth data.
#
# Targets:
#   data.new.jl  (default goal) run data_generator.jl, capturing its stdout
#   rawdata      download every raw data file data.new.jl is generated from
#   <name>.txt   download a single Unicode data / test file
#   clean        remove all downloaded files and data.new.jl

# programs
CURL=curl
JULIA=julia
CURLFLAGS = --retry 5 --location

# Unicode data version (must also update utf8proc_unicode_version function)
UNICODE_VERSION=15.1.0

# Prepended verbatim to every download URL. Empty unless the caller sets it
# on the command line or in the environment.
# NOTE(review): presumably a caching-proxy prefix -- confirm with whoever sets it.
URLCACHE ?=

# Base URL of the Unicode Character Database for UNICODE_VERSION. Recursively
# expanded (=) so later overrides of URLCACHE / UNICODE_VERSION are honoured.
UCD_URL = $(URLCACHE)https://www.unicode.org/Public/$(UNICODE_VERSION)/ucd

# Downloaded files that data.new.jl is generated from.
RAWDATA := UnicodeData.txt GraphemeBreakProperty.txt DerivedCoreProperties.txt CompositionExclusions.txt CaseFolding.txt EastAsianWidth.txt emoji-data.txt

# Downloadable files that are not prerequisites of data.new.jl (test data).
TESTDATA := NormalizationTest.txt GraphemeBreakTest.txt

.PHONY: clean rawdata

.DELETE_ON_ERROR:

# Must stay the first real rule: it is the default goal.
# Depends on the data files themselves rather than on the phony `rawdata`
# target; a phony prerequisite is always out of date and would force this
# recipe to run on every invocation.
data.new.jl: data_generator.jl $(RAWDATA)
	$(JULIA) --project=. data_generator.jl Julia > $@

# Convenience alias: fetch all raw data files without running the generator.
rawdata: $(RAWDATA)

# Download rules. Each listed target is an independent rule sharing the same
# recipe; $@ is both the local file name and the last URL path component.

# Files located directly under ucd/
UnicodeData.txt EastAsianWidth.txt DerivedCoreProperties.txt CompositionExclusions.txt CaseFolding.txt NormalizationTest.txt:
	$(CURL) $(CURLFLAGS) -o $@ $(UCD_URL)/$@

# Files located under ucd/auxiliary/
GraphemeBreakProperty.txt GraphemeBreakTest.txt:
	$(CURL) $(CURLFLAGS) -o $@ $(UCD_URL)/auxiliary/$@

# Files located under ucd/emoji/
emoji-data.txt:
	$(CURL) $(CURLFLAGS) -o $@ $(UCD_URL)/emoji/$@

# Remove everything this Makefile downloads or generates.
clean:
	rm -f $(RAWDATA) $(TESTDATA)
	rm -f data.new.jl

data/Manifest.toml

Lines changed: 69 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,69 @@
1+
# This file is machine-generated - editing it directly is not advised
2+
3+
julia_version = "1.9.3"
4+
manifest_format = "2.0"
5+
project_hash = "bc0740aa2247b17bd49ba693fb87f41bbbddead6"
6+
7+
[[deps.Adapt]]
8+
deps = ["LinearAlgebra", "Requires"]
9+
git-tree-sha1 = "cde29ddf7e5726c9fb511f340244ea3481267608"
10+
uuid = "79e6a3ab-5dfb-504d-930d-738a2a938a0e"
11+
version = "3.7.2"
12+
13+
[deps.Adapt.extensions]
14+
AdaptStaticArraysExt = "StaticArrays"
15+
16+
[deps.Adapt.weakdeps]
17+
StaticArrays = "90137ffa-7385-5640-81b9-e52037218182"
18+
19+
[[deps.Artifacts]]
20+
uuid = "56f22d72-fd6d-98f1-02f0-08ddc0907c33"
21+
22+
[[deps.CompilerSupportLibraries_jll]]
23+
deps = ["Artifacts", "Libdl"]
24+
uuid = "e66e0078-7015-5450-92f7-15fbd957f2ae"
25+
version = "1.0.5+0"
26+
27+
[[deps.Libdl]]
28+
uuid = "8f399da3-3557-5675-b5ff-fb832c97cbdb"
29+
30+
[[deps.LinearAlgebra]]
31+
deps = ["Libdl", "OpenBLAS_jll", "libblastrampoline_jll"]
32+
uuid = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
33+
34+
[[deps.OffsetArrays]]
35+
deps = ["Adapt"]
36+
git-tree-sha1 = "2ac17d29c523ce1cd38e27785a7d23024853a4bb"
37+
uuid = "6fe1bfb0-de20-5000-8ca7-80f57d26f881"
38+
version = "1.12.10"
39+
40+
[[deps.OpenBLAS_jll]]
41+
deps = ["Artifacts", "CompilerSupportLibraries_jll", "Libdl"]
42+
uuid = "4536629a-c528-5b80-bd46-f80d51c5b363"
43+
version = "0.3.21+4"
44+
45+
[[deps.Random]]
46+
deps = ["SHA", "Serialization"]
47+
uuid = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c"
48+
49+
[[deps.Requires]]
50+
deps = ["UUIDs"]
51+
git-tree-sha1 = "838a3a4188e2ded87a4f9f184b4b0d78a1e91cb7"
52+
uuid = "ae029012-a4dd-5104-9daa-d747884805df"
53+
version = "1.3.0"
54+
55+
[[deps.SHA]]
56+
uuid = "ea8e919c-243c-51af-8825-aaa63cd721ce"
57+
version = "0.7.0"
58+
59+
[[deps.Serialization]]
60+
uuid = "9e88b42a-f829-5b0c-bbe9-9e923198166b"
61+
62+
[[deps.UUIDs]]
63+
deps = ["Random", "SHA"]
64+
uuid = "cf7118a7-6976-5b1a-9a39-7adc72f591a4"
65+
66+
[[deps.libblastrampoline_jll]]
67+
deps = ["Artifacts", "Libdl"]
68+
uuid = "8e850b90-86db-534c-a0d3-1478176c7d93"
69+
version = "5.8.0+0"

data/Project.toml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,2 @@
1+
[deps]
2+
OffsetArrays = "6fe1bfb0-de20-5000-8ca7-80f57d26f881"

0 commit comments

Comments
 (0)