Skip to content

Commit 808cdbc

Browse files
committed
Make: Bump StringZilla for Unicode
1 parent 82f528a commit 808cdbc

File tree

4 files changed

+1275
-957
lines changed

4 files changed

+1275
-957
lines changed

Cargo.lock

Lines changed: 9 additions & 8 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

Cargo.toml

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@ categories = ["text-processing", "development-tools::profiling"]
1414
[dependencies]
1515
criterion = "0.7.0"
1616
stringtape = "2.4.0"
17-
stringzilla = { git = "https://github.com/ashvardanian/StringZilla.git", branch = "main-dev", default-features = false }
17+
stringzilla = { version = "4.4.0", default-features = false }
1818

1919
# To use a local version of StringZilla, set the path:
2020
# stringzilla = { path = "../StringZilla/", features = ["cpus"] }
@@ -34,6 +34,7 @@ bench_unicode = [
3434
"simdutf", # SIMD UTF-8 validation and transcoding
3535
"unicase", # Case-insensitive string wrapper
3636
"focaccia", # Unicode case folding
37+
"rand", # Random needle sampling
3738
]
3839
bench_hash = [
3940
"bit-set", # for collision counting

pyproject.toml

Lines changed: 9 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -9,23 +9,23 @@ authors = [
99
]
1010
license = { text = "Apache 2.0" }
1111

12+
# Keep the base install minimal; opt into extras per-bench
13+
dependencies = []
14+
1215
[project.urls]
1316
Homepage = "https://ashvardanian.com/posts/stringwars-on-gpus"
1417
Repository = "https://github.com/ashvardanian/StringWars"
1518

16-
# Keep the base install minimal; opt into extras per-bench
17-
dependencies = []
18-
1919
[project.optional-dependencies]
2020
# Substring/byteset + transforms
21-
find = ["stringzilla", "pyahocorasick"]
21+
find = ["stringzilla>=4.4.0", "pyahocorasick"]
2222

2323
# Sequence ops (split/sort)
24-
sequence = ["stringzilla", "pandas", "pyarrow", "polars"]
24+
sequence = ["stringzilla>=4.4.0", "pandas", "pyarrow", "polars"]
2525

2626
# Fingerprinting/sketching
2727
fingerprints = [
28-
"stringzilla",
28+
"stringzilla>=4.4.0",
2929
"stringzillas-cpus",
3030
"datasketch",
3131
"numpy",
@@ -34,7 +34,7 @@ fingerprints = [
3434

3535
# Similarities / edit distances
3636
similarities = [
37-
"stringzilla",
37+
"stringzilla>=4.4.0",
3838
"stringzillas-cpus",
3939
"jellyfish",
4040
"python-Levenshtein",
@@ -47,10 +47,10 @@ similarities = [
4747
]
4848

4949
# Hash functions
50-
hash = ["stringzilla", "xxhash", "blake3", "google-crc32c", "mmh3", "cityhash"]
50+
hash = ["stringzilla>=4.4.0", "xxhash", "blake3", "google-crc32c", "mmh3", "cityhash"]
5151

5252
# Random byte generators and translation tables
53-
memory = ["stringzilla", "numpy", "pycryptodome", "opencv-python"]
53+
memory = ["stringzilla>=4.4.0", "numpy", "pycryptodome", "opencv-python"]
5454

5555
[tool.ruff]
5656
# Enforce 120-column lines across formatting and linting

0 commit comments

Comments
 (0)