Skip to content

Commit 177bcbc

Browse files
authored
Update benchmark scores (#714)
* Update benchmark.txt [no ci]
* Update benchmark.yml [no ci]
* Update test_main.py for CI trigger
1 parent 4785dbc commit 177bcbc

File tree

3 files changed

+34
-33
lines changed

3 files changed

+34
-33
lines changed

.ci/benchmark.txt

Lines changed: 25 additions & 24 deletions
Original file line numberDiff line numberDiff line change
@@ -1,9 +1,9 @@
1-
META MD5 39966c3cbfe713b3d9c2e0ad68ac5416
2-
DATA MD5 bfd00203840d99eefc189ae75713eb0c
3-
DATA: 16664944 interested lines. MARKUP: 62071 items
1+
META MD5 9f42361b819a06e1a411b290214ef526
2+
DATA MD5 d0c51cce420271d1e947e82fb0aa21f7
3+
DATA: 16707548 interested lines. MARKUP: 62260 items
44
FileType FileNumber ValidLines Positives Negatives Templates
55
--------------- ------------ ------------ ----------- ----------- -----------
6-
676 69134 134 420 72
6+
677 69435 135 420 72
77
.04 2 149 4
88
.1 2 641 2 5
99
.admx 1 26 1
@@ -66,17 +66,18 @@ FileType FileNumber ValidLines Positives Negatives Templat
6666
.gd 1 37 1
6767
.gml 3 3075 16
6868
.gni 3 5017 19
69-
.go 1240 682004 1228 4128 741
69+
.go 1280 718915 1362 4133 741
7070
.golden 5 1168 1 13 29
7171
.gradle 50 4295 7 90 100
7272
.graphql 8 454 2 13
7373
.graphqls 1 30 1
7474
.groovy 22 5113 24 214 1
75+
.gtpl 1 15 2
7576
.h 10 2269 38
7677
.haml 9 191 17
7778
.hbs 2 54 3
7879
.hs 14 4140 29 61 4
79-
.html 61 19419 84 108 18
80+
.html 60 19400 84 107 18
8081
.idl 3 1625 37 5
8182
.iml 6 699 30
8283
.in 7 2242 8 44 10
@@ -88,7 +89,7 @@ FileType FileNumber ValidLines Positives Negatives Templat
8889
.java 670 144140 477 1325 170
8990
.jenkinsfile 1 58 2 6
9091
.jinja2 1 64 2
91-
.js 658 533148 569 2470 284
92+
.js 656 532595 569 2467 284
9293
.json 886 13114472 1304 10018 132
9394
.jsp 13 3202 1 37
9495
.jsx 7 857 19
@@ -114,7 +115,7 @@ FileType FileNumber ValidLines Positives Negatives Templat
114115
.lua 10 1924 37 3
115116
.m 16 13358 19 158 3
116117
.manifest 3 102 9 6
117-
.markdown 3 139 3 1
118+
.markdown 38 5862 54 3 1
118119
.markerb 3 12 3
119120
.marko 1 21 2
120121
.md 761 180542 892 2347 584
@@ -206,7 +207,7 @@ FileType FileNumber ValidLines Positives Negatives Templat
206207
.template 19 1633 4 36 11
207208
.test 2 24 22 1 4
208209
.testsettings 1 21 1 10
209-
.tf 21 1377 3 30 1
210+
.tf 27 1644 14 30 1
210211
.tfstate 6 431 49 7 4
211212
.tfvars 1 31 3 2
212213
.tl 2 2161 154 2
@@ -228,21 +229,21 @@ FileType FileNumber ValidLines Positives Negatives Templat
228229
.xib 11 503 164
229230
.xsl 1 311 1
230231
.yaml 168 24422 201 341 42
231-
.yml 556 54557 1239 908 364
232+
.yml 555 54516 1236 908 364
232233
.zsh 6 872 12
233234
.zsh-theme 1 97 1
234-
TOTAL: 11414 16664944 14836 46717 4910
235-
credsweeper result_cnt : 14430, lost_cnt : 0, true_cnt : 14242, false_cnt : 188
235+
TOTAL: 11493 16707548 15035 46718 4910
236+
credsweeper result_cnt : 14629, lost_cnt : 0, true_cnt : 14438, false_cnt : 191
236237
Rules Positives Negatives Templates Reported TP FP TN FN FPR FNR ACC PRC RCL F1
237238
------------------------------ ----------- ----------- ----------- ---------- ----- ---- ----- ---- -------- -------- -------- -------- -------- --------
238-
API 235 3172 187 227 227 0 3359 8 0.000000 0.034043 0.997774 1.000000 0.965957 0.982684
239-
AWS Client ID 182 19 0 174 174 0 19 8 0.000000 0.043956 0.960199 1.000000 0.956044 0.977528
239+
API 239 3172 187 228 228 0 3359 11 0.000000 0.046025 0.996943 1.000000 0.953975 0.976445
240+
AWS Client ID 191 19 0 183 183 0 19 8 0.000000 0.041885 0.961905 1.000000 0.958115 0.978610
240241
AWS Multi 82 10 0 34 34 0 10 48 0.000000 0.585366 0.478261 1.000000 0.414634 0.586207
241242
AWS S3 Bucket 67 23 0 92 67 23 0 0 1.000000 0.000000 0.744444 0.744444 1.000000 0.853503
242243
Atlassian Old PAT token 5 8 0 11 5 6 2 0 0.750000 0.000000 0.538462 0.454545 1.000000 0.625000
243-
Auth 1074 2754 81 1058 1050 8 2827 24 0.002822 0.022346 0.991814 0.992439 0.977654 0.984991
244+
Auth 1075 2754 81 1059 1051 8 2827 24 0.002822 0.022326 0.991816 0.992446 0.977674 0.985005
244245
Azure Access Token 21 0 0 13 13 0 0 8 0.380952 0.619048 1.000000 0.619048 0.764706
245-
BASE64 Private Key 19 4 0 19 19 0 4 0 0.000000 0.000000 1.000000 1.000000 1.000000 1.000000
246+
BASE64 Private Key 21 4 0 21 21 0 4 0 0.000000 0.000000 1.000000 1.000000 1.000000 1.000000
246247
BASE64 encoded PEM Private Key 12 0 0 10 10 0 0 2 0.166667 0.833333 1.000000 0.833333 0.909091
247248
Bitbucket Client ID 36 66 0 48 31 16 50 5 0.242424 0.138889 0.794118 0.659574 0.861111 0.746988
248249
Bitbucket Client Secret 46 90 1 88 41 46 45 5 0.505495 0.108696 0.627737 0.471264 0.891304 0.616541
@@ -257,7 +258,7 @@ Dropbox App secret 73 144 0 5
257258
Facebook Access Token 0 1 0 0 0 1 0 0.000000 1.000000
258259
Firebase Domain 7 1 0 8 7 1 0 0 1.000000 0.000000 0.875000 0.875000 1.000000 0.933333
259260
Github Old Token 1 0 0 1 1 0 0 0 0.000000 1.000000 1.000000 1.000000 1.000000
260-
Gitlab Feed Token 206 757 85 77 56 17 825 150 0.020190 0.728155 0.840649 0.767123 0.271845 0.401434
261+
Gitlab Feed Token 205 757 85 76 55 17 825 150 0.020190 0.731707 0.840497 0.763889 0.268293 0.397112
261262
Gitlab Incoming Email Token 38 11 0 25 20 5 6 18 0.454545 0.473684 0.530612 0.800000 0.526316 0.634921
262263
Google API Key 12 0 0 12 12 0 0 0 0.000000 1.000000 1.000000 1.000000 1.000000
263264
Google Multi 10 2 0 11 10 1 1 0 0.500000 0.000000 0.916667 0.909091 1.000000 0.952381
@@ -266,21 +267,21 @@ Grafana Provisioned API Key 22 1 0
266267
JSON Web Token 180 61 0 141 141 0 61 39 0.000000 0.216667 0.838174 1.000000 0.783333 0.878505
267268
Jira / Confluence PAT token 0 4 0 0 0 4 0 0.000000 1.000000
268269
Jira 2FA 36 1 1 31 30 1 1 6 0.500000 0.166667 0.815789 0.967742 0.833333 0.895522
269-
Key 4188 15722 483 4174 4163 11 16194 25 0.000679 0.005969 0.998235 0.997365 0.994031 0.995695
270+
Key 4209 15726 483 4198 4184 14 16195 25 0.000864 0.005940 0.998090 0.996665 0.994060 0.995361
270271
Nonce 113 49 0 111 111 0 49 2 0.000000 0.017699 0.987654 1.000000 0.982301 0.991071
271272
Other 9 7446 5 0 0 7451 9 0.000000 1.000000 0.998794 0.000000
272-
PEM Private Key 1135 1483 0 1139 1135 4 1479 0 0.002697 0.000000 0.998472 0.996488 1.000000 0.998241
273-
Password 2202 7548 2539 2157 2133 24 10063 69 0.002379 0.031335 0.992432 0.988873 0.968665 0.978665
273+
PEM Private Key 1140 1483 0 1144 1140 4 1479 0 0.002697 0.000000 0.998475 0.996503 1.000000 0.998249
274+
Password 2320 7545 2539 2275 2251 24 10060 69 0.002380 0.029741 0.992502 0.989451 0.970259 0.979761
274275
SQL Password 44 13 0 41 41 0 13 3 0.000000 0.068182 0.947368 1.000000 0.931818 0.964706
275276
Salesforce Credentials 6 0 0 5 5 0 0 1 0.166667 0.833333 1.000000 0.833333 0.909091
276277
Salt 83 74 1 81 81 0 75 2 0.000000 0.024096 0.987342 1.000000 0.975904 0.987805
277-
Secret 1474 1576 799 1475 1468 7 2368 6 0.002947 0.004071 0.996622 0.995254 0.995929 0.995592
278+
Secret 1486 1576 799 1487 1480 7 2368 6 0.002947 0.004038 0.996633 0.995293 0.995962 0.995627
278279
Seed 1 6 0 0 0 6 1 0.000000 1.000000 0.857143 0.000000
279280
Slack Token 4 1 0 4 4 0 1 0 0.000000 0.000000 1.000000 1.000000 1.000000 1.000000
280281
Stripe Credentials 2 0 0 2 2 0 0 0 0.000000 1.000000 1.000000 1.000000 1.000000
281282
Tencent WeChat API App ID 8 0 0 8 8 0 0 0 0.000000 1.000000 1.000000 1.000000 1.000000
282-
Token 917 4172 455 845 842 3 4624 75 0.000648 0.081788 0.985931 0.996450 0.918212 0.955732
283+
Token 929 4172 455 857 854 3 4624 75 0.000648 0.080732 0.985961 0.996499 0.919268 0.956327
283284
Twilio Credentials 30 39 0 30 30 0 39 0 0.000000 0.000000 1.000000 1.000000 1.000000 1.000000
284285
URL Credentials 225 168 197 225 225 0 365 0 0.000000 0.000000 1.000000 1.000000 1.000000 1.000000
285-
UUID 1841 265 0 1824 1823 1 264 18 0.003774 0.009777 0.990978 0.999452 0.990223 0.994816
286-
14836 46717 4910 14439 14242 188 46529 594 0.004024 0.040038 0.987296 0.986972 0.959962 0.973280
286+
UUID 1857 265 0 1840 1839 1 264 18 0.003774 0.009693 0.991046 0.999457 0.990307 0.994861
287+
15035 46718 4910 14638 14438 191 46527 597 0.004088 0.039707 0.987239 0.986944 0.960293 0.973436

.github/workflows/benchmark.yml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -31,7 +31,7 @@ jobs:
3131
uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2 - 2024.10.23
3232
with:
3333
repository: Samsung/CredData
34-
ref: ea8910359f66c63a3ac27517e8715129c0e0bbf3
34+
ref: 5c93f142f9c28c03ff35ee0862dc819b73cdb673
3535

3636
- name: Markup hashing
3737
run: |
@@ -87,7 +87,7 @@ jobs:
8787
uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2 - 2024.10.23
8888
with:
8989
repository: Samsung/CredData
90-
ref: ea8910359f66c63a3ac27517e8715129c0e0bbf3
90+
ref: 5c93f142f9c28c03ff35ee0862dc819b73cdb673
9191

9292
- name: Markup hashing
9393
run: |
@@ -190,7 +190,7 @@ jobs:
190190
uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2 - 2024.10.23
191191
with:
192192
repository: Samsung/CredData
193-
ref: ea8910359f66c63a3ac27517e8715129c0e0bbf3
193+
ref: 5c93f142f9c28c03ff35ee0862dc819b73cdb673
194194

195195
- name: Markup hashing
196196
run: |
@@ -378,7 +378,7 @@ jobs:
378378
uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2 - 2024.10.23
379379
with:
380380
repository: Samsung/CredData
381-
ref: ea8910359f66c63a3ac27517e8715129c0e0bbf3
381+
ref: 5c93f142f9c28c03ff35ee0862dc819b73cdb673
382382

383383
- name: Markup hashing
384384
run: |

tests/test_main.py

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -342,11 +342,11 @@ def test_scan_bytes_n(self) -> None:
342342
def test_colored_line_p(self) -> None:
343343
cred_sweeper = CredSweeper()
344344
for to_scan in [
345-
"토큰MTAwMDoxVKvgS4Y7K7UIXHqBmV50aWFs5sb2heWGb3dy사용".encode(),
346-
b'\x1b[93mMTAwMDoxVKvgS4Y7K7UIXHqBmV50aWFs5sb2heWGb3dy\x1b[0m',
347-
b'\r\nMTAwMDoxVKvgS4Y7K7UIXHqBmV50aWFs5sb2heWGb3dy\r\n',
348-
b'\tMTAwMDoxVKvgS4Y7K7UIXHqBmV50aWFs5sb2heWGb3dy\n',
349-
b'%3DMTAwMDoxVKvgS4Y7K7UIXHqBmV50aWFs5sb2heWGb3dy%3B',
345+
"토큰MTAwMDoxVKvgS4Y7K7UIXHqBmV50aWFs5sb2heWGb3dy사용".encode(), #
346+
b'\x1b[93mMTAwMDoxVKvgS4Y7K7UIXHqBmV50aWFs5sb2heWGb3dy\x1b[0m', #
347+
b'\r\nMTAwMDoxVKvgS4Y7K7UIXHqBmV50aWFs5sb2heWGb3dy\r\n', #
348+
b'\tMTAwMDoxVKvgS4Y7K7UIXHqBmV50aWFs5sb2heWGb3dy\n', #
349+
b'%3DMTAwMDoxVKvgS4Y7K7UIXHqBmV50aWFs5sb2heWGb3dy%3B', #
350350
]:
351351
provider = ByteContentProvider(to_scan)
352352
results = cred_sweeper.file_scan(provider)

0 commit comments

Comments
 (0)