Skip to content

Commit cc71d1a

Browse files
committed
Merge branch 'main-dev' of https://github.com/ashvardanian/StringZilla into main-dev
2 parents e467649 + 4cb096b commit cc71d1a

31 files changed

+3836
-1806
lines changed

.cmake-format.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -16,4 +16,4 @@
1616

1717
# If a statement is wrapped to more than one line, then dangle the closing
1818
# parenthesis on its own line.
19-
dangle_parens = True
19+
dangle_parens = True

.git-blame-ignore-revs

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -39,4 +39,4 @@ bd547453122e9f8565e5be15f137e7b0de37caca
3939
22e3d1e34d62d68c1e89df7c8bdc201faa18a9de
4040
ecb377541d0c706cf8997faff4f026b07e3f76f3
4141
0d982a45f842287d7e344f0d8b360f52482017f5
42-
42+
467b4b81cb4bc0e9a64844748a417762378918c9

.github/workflows/prerelease.yml

Lines changed: 5 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -87,10 +87,11 @@ jobs:
8787
run: build_artifacts/stringzilla_test_cpp20
8888
- name: Test on Real World Data
8989
run: |
90+
build_artifacts/stringzilla_bench_memory ${DATASET_PATH} # for string copies and fills
9091
build_artifacts/stringzilla_bench_search ${DATASET_PATH} # for substring search
9192
build_artifacts/stringzilla_bench_token ${DATASET_PATH} # for hashing, equality comparisons, etc.
9293
build_artifacts/stringzilla_bench_similarity ${DATASET_PATH} # for edit distances and alignment scores
93-
build_artifacts/stringzilla_bench_sort ${DATASET_PATH} # for sorting arrays of strings
94+
build_artifacts/stringzilla_bench_sequence ${DATASET_PATH} # for sorting arrays of strings
9495
build_artifacts/stringzilla_bench_container ${DATASET_PATH} # for STL containers with string keys
9596
env:
9697
DATASET_PATH: ./README.md
@@ -174,7 +175,7 @@ jobs:
174175
build_artifacts/stringzilla_bench_search ${DATASET_PATH} # for substring search
175176
build_artifacts/stringzilla_bench_token ${DATASET_PATH} # for hashing, equality comparisons, etc.
176177
build_artifacts/stringzilla_bench_similarity ${DATASET_PATH} # for edit distances and alignment scores
177-
build_artifacts/stringzilla_bench_sort ${DATASET_PATH} # for sorting arrays of strings
178+
build_artifacts/stringzilla_bench_sequence ${DATASET_PATH} # for sorting arrays of strings
178179
build_artifacts/stringzilla_bench_container ${DATASET_PATH} # for STL containers with string keys
179180
env:
180181
DATASET_PATH: ./README.md
@@ -306,7 +307,7 @@ jobs:
306307
build_artifacts/stringzilla_bench_search ${DATASET_PATH} # for substring search
307308
build_artifacts/stringzilla_bench_token ${DATASET_PATH} # for hashing, equality comparisons, etc.
308309
build_artifacts/stringzilla_bench_similarity ${DATASET_PATH} # for edit distances and alignment scores
309-
build_artifacts/stringzilla_bench_sort ${DATASET_PATH} # for sorting arrays of strings
310+
build_artifacts/stringzilla_bench_sequence ${DATASET_PATH} # for sorting arrays of strings
310311
build_artifacts/stringzilla_bench_container ${DATASET_PATH} # for STL containers with string keys
311312
env:
312313
DATASET_PATH: ./README.md
@@ -379,7 +380,7 @@ jobs:
379380
.\build_artifacts\stringzilla_bench_search.exe ${DATASET_PATH} # for substring search
380381
.\build_artifacts\stringzilla_bench_token.exe ${DATASET_PATH} # for hashing, equality comparisons, etc.
381382
.\build_artifacts\stringzilla_bench_similarity.exe ${DATASET_PATH} # for edit distances and alignment scores
382-
.\build_artifacts\stringzilla_bench_sort.exe ${DATASET_PATH} # for sorting arrays of strings
383+
.\build_artifacts\stringzilla_bench_sequence.exe ${DATASET_PATH} # for sorting arrays of strings
383384
.\build_artifacts\stringzilla_bench_container.exe ${DATASET_PATH} # for STL containers with string keys
384385
env:
385386
DATASET_PATH: ./README.md

.vscode/launch.json

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -50,6 +50,10 @@
5050
{
5151
"name": "ASAN_OPTIONS",
5252
"value": "detect_leaks=0:atexit=1:strict_init_order=1:strict_string_checks=1"
53+
},
54+
{
55+
"name": "STRINGWARS_DATASET",
56+
"value": "leipzig1M.txt"
5357
}
5458
],
5559
"stopAtEntry": false,

.vscode/settings.json

Lines changed: 14 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -69,6 +69,7 @@
6969
"hexdigits",
7070
"Hirschberg's",
7171
"Horspool",
72+
"Hutter",
7273
"Hyyro",
7374
"illformed",
7475
"initproc",
@@ -100,6 +101,7 @@
100101
"Morten",
101102
"Mosè",
102103
"MSVC",
104+
"Nadav",
103105
"napi",
104106
"nargsf",
105107
"ndim",
@@ -112,13 +114,15 @@
112114
"NOMINMAX",
113115
"NOTIMPLEMENTED",
114116
"npos",
117+
"nullary",
115118
"numpy",
116119
"octdigits",
117120
"octogram",
118121
"pgram",
119122
"pgrams",
120123
"Plouffe",
121124
"printables",
125+
"ptrdiff",
122126
"pytest",
123127
"Pythonic",
124128
"qsort",
@@ -134,24 +138,31 @@
134138
"Ritchie",
135139
"rmatcher",
136140
"rmatches",
141+
"Rotem",
137142
"rpartition",
138143
"rsplit",
139144
"rsplits",
140145
"rstrip",
146+
"Sankoff",
147+
"Sergey",
141148
"SIMD",
142149
"sklearn",
143150
"Skylake",
151+
"Slotin",
144152
"splitlines",
145153
"ssize",
146154
"startswith",
147155
"STL",
156+
"StringWa.rs",
157+
"STRINGWARS",
148158
"stringzilla",
149159
"stringzilla_bare",
150160
"Strs",
151161
"strzl",
152162
"substr",
153163
"SWAR",
154164
"Tanimoto",
165+
"Taras",
155166
"thyrotropin",
156167
"Titin",
157168
"tparam",
@@ -163,6 +174,7 @@
163174
"VBMI",
164175
"vectorcallfunc",
165176
"Vectorizer",
177+
"Vintsyuk",
166178
"Wagner",
167179
"whitespaces",
168180
"Wunsch",
@@ -299,6 +311,7 @@
299311
"xstring": "cpp",
300312
"xtr1common": "cpp",
301313
"xtree": "cpp",
302-
"xutility": "cpp"
314+
"xutility": "cpp",
315+
"regex": "cpp"
303316
}
304317
}

0 commit comments

Comments
 (0)