Skip to content

Commit 7fdbded

Browse files
committed
Explore use of nostril to check copyrights #2402
Signed-off-by: Jono Yang <[email protected]>
1 parent 930e30e commit 7fdbded

File tree

2 files changed

+4
-1
lines changed

2 files changed

+4
-1
lines changed

setup.cfg

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -117,6 +117,7 @@ install_requires =
117 117   typecode[full] >= 30.0.1
118 118   extractcode[full] >= 31.0.0
119 119   cyseq >= 0.0.2
    120 + nostril-detector
120 121
121 122
122 123   [options.packages.find]

src/cluecode/copyrights.py

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -17,6 +17,7 @@
 17  17   from time import time
 18  18
 19  19   import attr
     20 + from nostril_detector.nonsense_detector import generate_nonsense_detector
 20  21
 21  22   from commoncode.text import toascii
 22  23   from commoncode.text import unixlinesep
@@ -197,8 +198,9 @@ def detect_copyrights_from_lines(
197 198   if TRACE or TRACE_DEEP:
198 199   logger_debug(f'\n========================================================================')
199 200   logger_debug(f'detect_copyrights_from_lines: processing candidate_lines group:')
    201 + nonsense = generate_nonsense_detector(min_length=1)
200 202   for can in candidate_lines:
201     - logger_debug(f' {can}')
    203 + logger_debug(f' {can[1]} (is_nonsense({nonsense(can[1])}))')
202 204
203 205   detections = detector.detect(
204 206   numbered_lines=candidate_lines,

0 commit comments

Comments
 (0)