Skip to content

Commit 82bb772

Browse files
authored
Update random seed logic for obfuscation (#264)
* Update random seed logic for obfuscation * Update regex pattern to include 'key' in obfuscation * Update DATA MD5 checksum in benchmark.txt * BM update & fix 2025-11-05T10:24:07+02:00 (#265)
1 parent 5566eb8 commit 82bb772

File tree

14 files changed

+42
-41
lines changed

14 files changed

+42
-41
lines changed

.ci/benchmark.txt

Lines changed: 23 additions & 23 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
1-
META MD5 11f567db76995e39f2c680e9181bb935
2-
DATA MD5 c762dc235592a58e75101381ec396e24
3-
DATA: 17230760 interested lines. MARKUP: 62338 items
1+
META MD5 199de33d449fd669cdd1894ca41236fb
2+
DATA MD5 ff9697a1c5e9f5a361e52e4151b320a6
3+
DATA: 17230760 interested lines. MARKUP: 62339 items
44
FileType FileNumber ValidLines Positives Negatives
55
--------------- ------------ ------------ ----------- -----------
66
689 567668 138 487
@@ -37,7 +37,7 @@ FileType FileNumber ValidLines Positives Negatives
3737
.creds 1 10 2 1
3838
.crlf 1 27 1
3939
.crt 2 4979 126
40-
.cs 269 82841 257 1057
40+
.cs 269 82841 259 1057
4141
.cshtml 5 180 12
4242
.csp 3 379 9
4343
.csproj 1 14 1
@@ -64,7 +64,7 @@ FileType FileNumber ValidLines Positives Negatives
6464
.gd 1 37 1
6565
.gml 3 3075 16
6666
.gni 3 5017 19
67-
.go 1280 718792 1516 4861
67+
.go 1280 718792 1517 4860
6868
.golden 5 1168 1 42
6969
.gradle 50 4295 8 189
7070
.graphql 8 454 2 13
@@ -77,7 +77,7 @@ FileType FileNumber ValidLines Positives Negatives
7777
.hbs 2 54 3
7878
.hpp 1 237 2
7979
.hs 14 4140 30 65
80-
.html 127 34238 192 147
80+
.html 127 34238 194 147
8181
.idl 3 1625 37 5
8282
.iml 6 699 30
8383
.in 7 2242 10 50
@@ -90,7 +90,7 @@ FileType FileNumber ValidLines Positives Negatives
9090
.jenkinsfile 1 58 2 6
9191
.jinja2 1 64 2
9292
.js 666 537560 886 2712
93-
.json 927 13140680 1963 10177
93+
.json 927 13140680 1963 10178
9494
.jsp 13 3202 1 37
9595
.jsx 7 857 19
9696
.jwt 1 1 2
@@ -118,7 +118,7 @@ FileType FileNumber ValidLines Positives Negatives
118118
.markdown 38 5862 69 5
119119
.markerb 3 12 3
120120
.marko 1 21 2
121-
.md 789 185743 1075 2890
121+
.md 789 185743 1076 2890
122122
.mdx 3 549 7
123123
.mjml 1 18 1
124124
.mjs 22 4424 102 369
@@ -130,7 +130,7 @@ FileType FileNumber ValidLines Positives Negatives
130130
.mqh 1 1023 2
131131
.msg 1 26644 1 1
132132
.mysql 1 36 2
133-
.ndjson 2 5006 81 228
133+
.ndjson 2 5006 82 228
134134
.nix 4 211 12
135135
.nolint 1 2 1
136136
.odd 1 1281 43
@@ -159,14 +159,14 @@ FileType FileNumber ValidLines Positives Negatives
159159
.pug 2 193 2
160160
.purs 1 69 4
161161
.pxd 1 150 2 4
162-
.py 904 297181 749 3936
162+
.py 904 297181 751 3936
163163
.pyi 4 1361 9
164164
.pyp 1 167 1
165165
.python 1 213
166166
.pyx 2 1094 23
167167
.r 4 62 5 2
168168
.rake 2 51 2
169-
.rb 852 130684 426 2968
169+
.rb 852 130684 427 2968
170170
.re 1 31 1
171171
.red 1 159 1
172172
.release 1 13 4
@@ -187,7 +187,7 @@ FileType FileNumber ValidLines Positives Negatives
187187
.sbt 3 570 7
188188
.scala 53 5626 38 99
189189
.secrets 1 11 1
190-
.sh 152 24184 71 484
190+
.sh 152 24184 72 483
191191
.slim 1 153 3
192192
.smali 1 775 18
193193
.snap 3 1708 9 31
@@ -212,8 +212,8 @@ FileType FileNumber ValidLines Positives Negatives
212212
.token 1 1 4
213213
.toml 86 2471 65 251
214214
.tpl 1 43 1
215-
.travis 1 34 2 4
216-
.ts 609 109982 262 1970
215+
.travis 1 34 4 4
216+
.ts 609 109982 265 1970
217217
.tsx 54 7914 1 120
218218
.ttar 1 452 1
219219
.txt 324 89406 5259 4387
@@ -229,13 +229,13 @@ FileType FileNumber ValidLines Positives Negatives
229229
.yml 564 57042 1933 1218
230230
.zsh 6 872 12
231231
.zsh-theme 1 97 1
232-
TOTAL: 11640 17230760 17512 50249
232+
TOTAL: 11640 17230760 17528 50248
233233
credsweeper result_cnt : 0, lost_cnt : 0, true_cnt : 0, false_cnt : 0
234234
Rules Positives Negatives Reported TP FP TN FN FPR FNR ACC PRC RCL F1
235235
------------------------------ ----------- ----------- ---------- ---- ---- ----- ----- -------- -------- -------- ----- -------- ----
236236
API 242 3371 0 0 3371 242 0.000000 1.000000 0.933020 0.000000
237237
AWS Client ID 205 19 0 0 19 205 0.000000 1.000000 0.084821 0.000000
238-
AWS Multi 82 10 0 0 10 82 0.000000 1.000000 0.108696 0.000000
238+
AWS Multi 82 11 0 0 11 82 0.000000 1.000000 0.118280 0.000000
239239
AWS S3 Bucket 67 23 0 0 23 67 0.000000 1.000000 0.255556 0.000000
240240
Akamai Credentials 6 2 0 0 2 6 0.000000 1.000000 0.250000 0.000000
241241
Atlassian Old PAT token 9 8 0 0 8 9 0.000000 1.000000 0.470588 0.000000
@@ -245,19 +245,19 @@ BASE64 Private Key 22 4 0 0
245245
BASE64 encoded PEM Private Key 12 0 0 0 0 12 1.000000 0.000000 0.000000
246246
Basic Authorization 688 554 0 0 554 688 0.000000 1.000000 0.446055 0.000000
247247
Bearer Authorization 178 0 0 0 0 178 1.000000 0.000000 0.000000
248-
Bitbucket Client ID 39 72 0 0 72 39 0.000000 1.000000 0.648649 0.000000
249-
Bitbucket Client Secret 44 116 0 0 116 44 0.000000 1.000000 0.725000 0.000000
248+
Bitbucket Client ID 41 72 0 0 72 41 0.000000 1.000000 0.637168 0.000000
249+
Bitbucket Client Secret 47 116 0 0 116 47 0.000000 1.000000 0.711656 0.000000
250250
CMD ConvertTo-SecureString 13 4 0 0 4 13 0.000000 1.000000 0.235294 0.000000
251251
CMD Password 33 137 0 0 137 33 0.000000 1.000000 0.805882 0.000000
252252
CMD Secret 1 17 0 0 17 1 0.000000 1.000000 0.944444 0.000000
253253
CMD Token 6 2 0 0 2 6 0.000000 1.000000 0.250000 0.000000
254254
CURL User Password 7 2 0 0 2 7 0.000000 1.000000 0.222222 0.000000
255255
Credential 98 499 0 0 499 98 0.000000 1.000000 0.835846 0.000000
256256
Docker Swarm Token 2 0 0 0 0 2 1.000000 0.000000 0.000000
257-
Dropbox App secret 73 144 0 0 144 73 0.000000 1.000000 0.663594 0.000000
257+
Dropbox App secret 75 144 0 0 144 75 0.000000 1.000000 0.657534 0.000000
258258
Facebook Access Token 0 1 0 0 1 0 0.000000 1.000000
259259
Firebase Domain 38 1 0 0 1 38 0.000000 1.000000 0.025641 0.000000
260-
Gitlab Feed Token 204 843 0 0 843 204 0.000000 1.000000 0.805158 0.000000
260+
Gitlab Feed Token 205 843 0 0 843 205 0.000000 1.000000 0.804389 0.000000
261261
Gitlab Incoming Email Token 38 12 0 0 12 38 0.000000 1.000000 0.240000 0.000000
262262
Google API Key 13 0 0 0 0 13 1.000000 0.000000 0.000000
263263
Google Multi 10 2 0 0 2 10 0.000000 1.000000 0.166667 0.000000
@@ -271,10 +271,10 @@ Key 4284 16396 0 0
271271
MailGun API Key 8 0 0 0 0 8 1.000000 0.000000 0.000000
272272
NKEY Seed 60 0 0 0 0 60 1.000000 0.000000 0.000000
273273
Nonce 130 55 0 0 55 130 0.000000 1.000000 0.297297 0.000000
274-
OTP / 2FA Secret 58 3 0 0 3 58 0.000000 1.000000 0.049180 0.000000
274+
OTP / 2FA Secret 64 3 0 0 3 64 0.000000 1.000000 0.044776 0.000000
275275
Other 9 7321 0 0 7321 9 0.000000 1.000000 0.998772 0.000000
276276
PEM Private Key 1150 76 0 0 76 1150 0.000000 1.000000 0.061990 0.000000
277-
Password 2575 9934 0 0 9934 2575 0.000000 1.000000 0.794148 0.000000
277+
Password 2577 9932 0 0 9932 2577 0.000000 1.000000 0.793988 0.000000
278278
Postman Credentials 2 0 0 0 0 2 1.000000 0.000000 0.000000
279279
SQL Password 44 14 0 0 14 44 0.000000 1.000000 0.241379 0.000000
280280
Salesforce Credentials 6 0 0 0 0 6 1.000000 0.000000 0.000000
@@ -287,4 +287,4 @@ Token 1137 4670 0 0
287287
Twilio Credentials 30 39 0 0 39 30 0.000000 1.000000 0.565217 0.000000
288288
URL Credentials 225 382 0 0 382 225 0.000000 1.000000 0.629325 0.000000
289289
UUID 2508 280 0 0 280 2508 0.000000 1.000000 0.100430 0.000000
290-
17512 50249 0 0 0 50249 17512 0.000000 1.000000 0.741562 0.000000
290+
17528 50248 0 0 0 50248 17528 0.000000 1.000000 0.741383 0.000000

meta/106c7cd2.csv

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ Id,FileID,Domain,RepoName,FilePath,LineStart,LineEnd,GroundTruth,ValueStart,Valu
1515
30897,95b00c7f,GitHub,106c7cd2,data/106c7cd2/resource/assets/95b00c7f.js,44,44,X,13,28,,,Key
1616
31231,a3046da0,GitHub,106c7cd2,data/106c7cd2/_/a3046da0.example,14,14,X,12,18,,,Password
1717
32304,166d9d33,GitHub,106c7cd2,data/106c7cd2/_/166d9d33.travis,3,3,T,8,59,,,Key
18-
32557,166d9d33,GitHub,106c7cd2,data/106c7cd2/_/166d9d33.travis,44,44,T,11,43,,,Secret
18+
32557,166d9d33,GitHub,106c7cd2,data/106c7cd2/_/166d9d33.travis,44,44,T,11,43,,,Secret:Bitbucket Client ID:Bitbucket Client Secret
1919
41553,166d9d33,GitHub,106c7cd2,data/106c7cd2/_/166d9d33.travis,26,26,F,,,,,Password
2020
55895,1798b1bc,GitHub,106c7cd2,data/106c7cd2/test/api/1798b1bc.php,60,60,F,,,,,Token
2121
61647,a3046da0,GitHub,106c7cd2,data/106c7cd2/_/a3046da0.example,38,38,F,,,,,Key

meta/34cb4bc8.csv

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -61,7 +61,7 @@ Id,FileID,Domain,RepoName,FilePath,LineStart,LineEnd,GroundTruth,ValueStart,Valu
6161
29723,932c288e,GitHub,34cb4bc8,data/34cb4bc8/test/932c288e.cs,78,78,X,25,35,,,Token
6262
29827,475d6673,GitHub,34cb4bc8,data/34cb4bc8/docs/475d6673.rst,104,104,X,18,26,,,Token
6363
32233,1a6fe6a9,GitHub,34cb4bc8,data/34cb4bc8/test/kube/1a6fe6a9.cs,50,50,T,31,63,,,Token:Bitbucket Client ID:Bitbucket Client Secret
64-
34485,1a6fe6a9,GitHub,34cb4bc8,data/34cb4bc8/test/kube/1a6fe6a9.cs,69,69,T,32,64,,,Token:Bearer Authorization
64+
34485,1a6fe6a9,GitHub,34cb4bc8,data/34cb4bc8/test/kube/1a6fe6a9.cs,69,69,T,32,64,,,Token:Bearer Authorization:Bitbucket Client ID:Bitbucket Client Secret
6565
36037,9453018f,GitHub,34cb4bc8,data/34cb4bc8/sample/api/kube/9453018f.json,15,15,T,16,48,,,Token:Bitbucket Client ID:Bitbucket Client Secret
6666
36038,ac423ded,GitHub,34cb4bc8,data/34cb4bc8/docs/kube/ac423ded.rst,52,52,T,16,48,,,Token:Bitbucket Client ID:Bitbucket Client Secret
6767
37550,ac423ded,GitHub,34cb4bc8,data/34cb4bc8/docs/kube/ac423ded.rst,69,69,T,13,45,,,Token:Bitbucket Client ID:Bitbucket Client Secret

meta/39def7b4.csv

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -316,7 +316,7 @@ Id,FileID,Domain,RepoName,FilePath,LineStart,LineEnd,GroundTruth,ValueStart,Valu
316316
25814,651c73dd,GitHub,39def7b4,data/39def7b4/spec/651c73dd.rb,640,640,F,,,,,Password
317317
27428,52694a75,GitHub,39def7b4,data/39def7b4/spec/api/52694a75.rb,40,40,T,33,51,,,Bitbucket Client ID:Credential
318318
34067,e44c9925,GitHub,39def7b4,data/39def7b4/lib/rest/e44c9925.rb,119,121,F,,,Private,,PEM Private Key
319-
35024,be070dc3,GitHub,39def7b4,data/39def7b4/spec/be070dc3.rb,78,78,T,25,57,,,Secret
319+
35024,be070dc3,GitHub,39def7b4,data/39def7b4/spec/be070dc3.rb,78,78,T,25,57,,,Secret:OTP / 2FA Secret
320320
35075,52694a75,GitHub,39def7b4,data/39def7b4/spec/api/52694a75.rb,61,61,T,23,41,,,Bitbucket Client ID:Password
321321
35094,be070dc3,GitHub,39def7b4,data/39def7b4/spec/be070dc3.rb,42,42,F,29,153,,,Key
322322
40626,2010d338,GitHub,39def7b4,data/39def7b4/lib/rest/2010d338.rb,119,121,F,,,,,PEM Private Key

meta/41659445.csv

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -109,8 +109,8 @@ Id,FileID,Domain,RepoName,FilePath,LineStart,LineEnd,GroundTruth,ValueStart,Valu
109109
35338,074dc7a7,GitHub,41659445,data/41659445/test/sample/074dc7a7.ts,34,34,F,15,21,,,Token
110110
35339,074dc7a7,GitHub,41659445,data/41659445/test/sample/074dc7a7.ts,23,23,T,16,48,,,Secret:OTP / 2FA Secret
111111
35340,074dc7a7,GitHub,41659445,data/41659445/test/sample/074dc7a7.ts,33,33,T,16,48,,,Secret:OTP / 2FA Secret
112-
35341,074dc7a7,GitHub,41659445,data/41659445/test/sample/074dc7a7.ts,8,8,T,16,48,,,Secret
113-
35342,074dc7a7,GitHub,41659445,data/41659445/test/sample/074dc7a7.ts,13,13,T,16,48,,,Secret
112+
35341,074dc7a7,GitHub,41659445,data/41659445/test/sample/074dc7a7.ts,8,8,T,16,48,,,Secret:OTP / 2FA Secret
113+
35342,074dc7a7,GitHub,41659445,data/41659445/test/sample/074dc7a7.ts,13,13,T,16,48,,,Secret:OTP / 2FA Secret
114114
35343,074dc7a7,GitHub,41659445,data/41659445/test/sample/074dc7a7.ts,28,28,T,16,48,,,Secret:OTP / 2FA Secret
115115
35344,074dc7a7,GitHub,41659445,data/41659445/test/sample/074dc7a7.ts,18,18,T,16,48,,,Secret:OTP / 2FA Secret
116116
35345,074dc7a7,GitHub,41659445,data/41659445/test/sample/074dc7a7.ts,38,38,T,16,48,,,Secret:OTP / 2FA Secret
@@ -121,7 +121,7 @@ Id,FileID,Domain,RepoName,FilePath,LineStart,LineEnd,GroundTruth,ValueStart,Valu
121121
37420,074dc7a7,GitHub,41659445,data/41659445/test/sample/074dc7a7.ts,68,68,X,12,18,,,Token
122122
37421,074dc7a7,GitHub,41659445,data/41659445/test/sample/074dc7a7.ts,82,82,X,12,18,,,Token
123123
37422,074dc7a7,GitHub,41659445,data/41659445/test/sample/074dc7a7.ts,67,67,T,13,45,,,Secret:OTP / 2FA Secret
124-
37423,074dc7a7,GitHub,41659445,data/41659445/test/sample/074dc7a7.ts,73,73,T,13,45,,,Secret
124+
37423,074dc7a7,GitHub,41659445,data/41659445/test/sample/074dc7a7.ts,73,73,T,13,45,,,Secret:OTP / 2FA Secret
125125
37424,074dc7a7,GitHub,41659445,data/41659445/test/sample/074dc7a7.ts,80,80,T,13,45,,,Secret:OTP / 2FA Secret
126126
47806,eb85e4f0,GitHub,41659445,data/41659445/test/src/util/eb85e4f0.ts,119,119,X,15,25,,,Secret
127127
47991,074dc7a7,GitHub,41659445,data/41659445/test/sample/074dc7a7.ts,78,78,F,,,,,Other

meta/6aae1316.csv

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -326,3 +326,4 @@ Id,FileID,Domain,RepoName,FilePath,LineStart,LineEnd,GroundTruth,ValueStart,Valu
326326
1494336,0e1cae4f,GitHub,6aae1316,data/6aae1316/lib/spec/0e1cae4f.rb,74,74,T,46,60,,,API:Token
327327
1494337,a21f5d95,GitHub,6aae1316,data/6aae1316/spec/a21f5d95.rb,19,19,T,40,54,,,API:Token
328328
1494338,a21f5d95,GitHub,6aae1316,data/6aae1316/spec/a21f5d95.rb,29,29,T,40,54,,,API:Token
329+
11524151,22ac2671,GitHub,6aae1316,data/6aae1316/fixture/spec/build/22ac2671.json,49,56,F,304,266,,,AWS Multi

0 commit comments

Comments
 (0)