Skip to content

Commit 102ee19

Browse files
committed
Bump version to v0.4.0 for release
1 parent be3d7c5 commit 102ee19

File tree

3 files changed

+8
-2
lines changed

3 files changed

+8
-2
lines changed

CHANGELOG.md

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -7,6 +7,8 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
77

88
## Unreleased
99

10+
## [v0.4.0](https://github.com/gagan3012/PolyDeDupe/releases/tag/v0.4.0) - 2023-11-27
11+
1012
## [v0.3.0](https://github.com/gagan3012/PolyDeDupe/releases/tag/v0.3.0) - 2023-11-27
1113

1214
## [v0.2.0](https://github.com/gagan3012/PolyDeDupe/releases/tag/v0.2.0) - 2023-11-27

PolyDeDupe/polydedupe.py

Lines changed: 5 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -126,7 +126,8 @@ def make_duplicate_clusters(dataset_iterator: Type[Dataset], jaccard_threshold:
126126
di = DuplicationIndex(duplication_jaccard_threshold=jaccard_threshold)
127127

128128
for filename, min_hash in tqdm(
129-
ThreadedIterator(minhash_iter(enumerate(dataset_iterator)), max_queue_size=100), total=len(dataset_iterator)
129+
ThreadedIterator(minhash_iter(enumerate(dataset_iterator)), max_queue_size=100), total=len(dataset_iterator),
130+
desc="Deduplicating"
130131
):
131132
di.add(filename, min_hash)
132133

@@ -205,6 +206,7 @@ def find_extremes(cluster_list, dataset, jaccard_threshold):
205206
cluster_list,
206207
),
207208
total=len(cluster_list),
209+
desc="Finding extremes",
208210
):
209211
extremes_list.append(extremes)
210212
return extremes_list
@@ -230,6 +232,8 @@ def display_dataset_entries(dataset, duplicate_clusters):
230232
print(f"Base Index: {base_index}, Data: {data_entry}")
231233

232234
print("\n") # Separate clusters by a newline for clarity
235+
236+
233237

234238

235239
def deduplicate_dataset(

PolyDeDupe/version.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,5 @@
11
_MAJOR = "0"
2-
_MINOR = "3"
2+
_MINOR = "4"
33
# On main and in a nightly release the patch should be one ahead of the last
44
# released build.
55
_PATCH = "0"

0 commit comments

Comments
 (0)