Skip to content

Commit 0739b4c

Browse files
authored
DeepSeek token pattern improvement. (#821)
1 parent c3a38c4 commit 0739b4c

File tree

5 files changed

+6
-5
lines changed

5 files changed

+6
-5
lines changed

.github/workflows/check.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -93,7 +93,7 @@ jobs:
9393
run: |
9494
banner="$(python -m credsweeper --banner | grep CredSweeper | head -1)"
9595
echo "banner = '${banner}'"
96-
if [ "CredSweeper 1.15.0 crc32:439081df" != "${banner}" ]; then
96+
if [ "CredSweeper 1.15.1 crc32:58b9cbea" != "${banner}" ]; then
9797
echo "Update the check for '${banner}'"
9898
exit 1
9999
fi

credsweeper/__init__.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -24,4 +24,4 @@
2424
"__version__"
2525
]
2626

27-
__version__ = "1.15.0"
27+
__version__ = "1.15.1"

credsweeper/rules/config.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1363,7 +1363,7 @@
13631363
confidence: moderate
13641364
type: pattern
13651365
values:
1366-
- (?P<value>sk-[0-9a-f]{32,64})(?![0-9A-Za-z_-])
1366+
- (?:^|/|[^\\0-9A-Za-z+_-]|\\[0abfnrtv]|(?:%|\\x)[0-9A-Fa-f]{2}|\\[0-7]{3}|\\[Uu][0-9A-Fa-f]{4}|\x1B\[[0-9;]{0,80}m)(?P<value>sk-[0-9a-f]{32,64})(?![0-9A-Za-z_-])
13671367
min_line_len: 35
13681368
filter_type:
13691369
- ValuePatternCheck

tests/samples/deepseek

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,2 +1,3 @@
11
>>>sk-615ef152bf865a131f88b23571dc4ee6<<<
22
<<<sk-2f8d9514cce7a8a3f1f34b64acedfake>>>
3+
scan-disk-615ef152bf865a131f88b23571dc4ee6

tests/test_app.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -503,7 +503,7 @@ def test_depth_p(self) -> None:
503503
cvs_checksum = hashlib.md5(f.read()).digest()
504504
checksum = bytes(a ^ b for a, b in zip(checksum, cvs_checksum))
505505
# update the checksum manually and keep line endings in the samples as is (git config core.autocrlf false)
506-
self.assertEqual("021c37fc3b5d65d32667062cc2ae50e7", binascii.hexlify(checksum).decode())
506+
self.assertEqual("b5f001b2a8ce5af6271bbcec2e986fa3", binascii.hexlify(checksum).decode())
507507
normal_report = []
508508
sorted_report = []
509509
with tempfile.TemporaryDirectory() as tmp_dir:
@@ -614,7 +614,7 @@ def test_rules_ml_p(self) -> None:
614614
rules_text = yaml.dump_all(rules, sort_keys=True)
615615
checksum = hashlib.md5(rules_text.encode()).hexdigest()
616616
# update the expected value manually if some changes
617-
self.assertEqual("64441b2969e9cf41142c1d0fb45450a8", checksum)
617+
self.assertEqual("6363b53925305e2f52fa64798c8e6985", checksum)
618618
rules_set = set([i["name"] for i in rules if "code" in i["target"]])
619619
self.assertSetEqual(rules_set, report_set)
620620
self.assertEqual(SAMPLES_POST_CRED_COUNT, len(report))

0 commit comments

Comments
 (0)