Skip to content

Commit 6768d08

Browse files
authored
Markup corrections (#260)
* improve markup_report.py script * markup for most true candidates * corrections
1 parent 6183d74 commit 6768d08

File tree

6 files changed

+23
-20
lines changed

6 files changed

+23
-20
lines changed

.ci/benchmark.txt

Lines changed: 15 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
1-
META MD5 95346ca85ce4d3fcefd03fe87803bff8
2-
DATA MD5 c58c9fab721263eac09dbe0929c62cdd
3-
DATA: 17230760 interested lines. MARKUP: 62334 items
1+
META MD5 bc317a1d47d2e41f1ed8ff8136f9353a
2+
DATA MD5 f0d2c0fa3a044b0399671e5ab0a4a895
3+
DATA: 17230760 interested lines. MARKUP: 62337 items
44
FileType FileNumber ValidLines Positives Negatives
55
--------------- ------------ ------------ ----------- -----------
66
689 567668 138 487
@@ -90,7 +90,7 @@ FileType FileNumber ValidLines Positives Negatives
9090
.jenkinsfile 1 58 2 6
9191
.jinja2 1 64 2
9292
.js 666 537560 886 2712
93-
.json 927 13140680 1965 10175
93+
.json 927 13140680 1963 10177
9494
.jsp 13 3202 1 37
9595
.jsx 7 857 19
9696
.jwt 1 1 2
@@ -118,10 +118,10 @@ FileType FileNumber ValidLines Positives Negatives
118118
.markdown 38 5862 69 5
119119
.markerb 3 12 3
120120
.marko 1 21 2
121-
.md 789 185743 1073 2890
121+
.md 789 185743 1075 2890
122122
.mdx 3 549 7
123123
.mjml 1 18 1
124-
.mjs 22 4424 101 369
124+
.mjs 22 4424 102 369
125125
.mk 1 5878 13
126126
.ml 1 1856 16
127127
.mlir 2 1596 19
@@ -159,7 +159,7 @@ FileType FileNumber ValidLines Positives Negatives
159159
.pug 2 193 2
160160
.purs 1 69 4
161161
.pxd 1 150 2 4
162-
.py 904 297181 750 3935
162+
.py 904 297181 749 3936
163163
.pyi 4 1361 9
164164
.pyp 1 167 1
165165
.python 1 213
@@ -216,7 +216,7 @@ FileType FileNumber ValidLines Positives Negatives
216216
.ts 609 109982 262 1970
217217
.tsx 54 7914 1 120
218218
.ttar 1 452 1
219-
.txt 324 89406 5261 4385
219+
.txt 324 89406 5259 4387
220220
.utf8 1 77 1
221221
.vsixmanifest 1 36 1
222222
.vsmdi 1 6 2
@@ -229,7 +229,7 @@ FileType FileNumber ValidLines Positives Negatives
229229
.yml 564 57042 1933 1218
230230
.zsh 6 872 12
231231
.zsh-theme 1 97 1
232-
TOTAL: 11640 17230760 17510 50246
232+
TOTAL: 11640 17230760 17508 50251
233233
credsweeper result_cnt : 0, lost_cnt : 0, true_cnt : 0, false_cnt : 0
234234
Rules Positives Negatives Reported TP FP TN FN FPR FNR ACC PRC RCL F1
235235
------------------------------ ----------- ----------- ---------- ---- ---- ----- ----- -------- -------- -------- ----- -------- ----
@@ -265,11 +265,11 @@ Google OAuth Access Token 3 0 0 0
265265
Google OAuth Refresh Token 1 2 0 0 2 1 0.000000 1.000000 0.666667 0.000000
266266
Grafana Provisioned API Key 22 1 0 0 1 22 0.000000 1.000000 0.043478 0.000000
267267
JSON Web Token 174 61 0 0 61 174 0.000000 1.000000 0.259574 0.000000
268-
JWK 79 0 0 0 0 79 1.000000 0.000000 0.000000
268+
JWK 80 0 0 0 0 80 1.000000 0.000000 0.000000
269269
Jira / Confluence PAT token 0 4 0 0 4 0 0.000000 1.000000
270270
Key 4284 16395 0 0 16395 4284 0.000000 1.000000 0.792833 0.000000
271271
MailGun API Key 8 0 0 0 0 8 1.000000 0.000000 0.000000
272-
NKEY Seed 58 0 0 0 0 58 1.000000 0.000000 0.000000
272+
NKEY Seed 60 0 0 0 0 60 1.000000 0.000000 0.000000
273273
Nonce 130 55 0 0 55 130 0.000000 1.000000 0.297297 0.000000
274274
OTP / 2FA Secret 58 3 0 0 3 58 0.000000 1.000000 0.049180 0.000000
275275
Other 9 7321 0 0 7321 9 0.000000 1.000000 0.998772 0.000000
@@ -278,13 +278,13 @@ Password 2574 9935 0 0
278278
Postman Credentials 2 0 0 0 0 2 1.000000 0.000000 0.000000
279279
SQL Password 44 14 0 0 14 44 0.000000 1.000000 0.241379 0.000000
280280
Salesforce Credentials 6 0 0 0 0 6 1.000000 0.000000 0.000000
281-
Salt 92 78 0 0 78 92 0.000000 1.000000 0.458824 0.000000
282-
Secret 1528 2378 0 0 2378 1528 0.000000 1.000000 0.608807 0.000000
281+
Salt 90 80 0 0 80 90 0.000000 1.000000 0.470588 0.000000
282+
Secret 1527 2379 0 0 2379 1527 0.000000 1.000000 0.609063 0.000000
283283
Slack Token 15 1 0 0 1 15 0.000000 1.000000 0.062500 0.000000
284284
Stripe Credentials 2 0 0 0 0 2 1.000000 0.000000 0.000000
285285
Tencent WeChat API App ID 47 0 0 0 0 47 1.000000 0.000000 0.000000
286-
Token 1138 4668 0 0 4668 1138 0.000000 1.000000 0.803996 0.000000
286+
Token 1136 4670 0 0 4670 1136 0.000000 1.000000 0.804340 0.000000
287287
Twilio Credentials 30 39 0 0 39 30 0.000000 1.000000 0.565217 0.000000
288288
URL Credentials 225 382 0 0 382 225 0.000000 1.000000 0.629325 0.000000
289289
UUID 2508 280 0 0 280 2508 0.000000 1.000000 0.100430 0.000000
290-
17510 50246 0 0 0 50246 17510 0.000000 1.000000 0.741573 0.000000
290+
17508 50251 0 0 0 50251 17508 0.000000 1.000000 0.741614 0.000000

meta/0f133e09.csv

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -284,7 +284,7 @@ Id,FileID,Domain,RepoName,FilePath,LineStart,LineEnd,GroundTruth,ValueStart,Valu
284284
29612,6d89ddbd,GitHub,0f133e09,data/0f133e09/test/6d89ddbd.txt,7,7,F,9,,,,Key
285285
29614,6d89ddbd,GitHub,0f133e09,data/0f133e09/test/6d89ddbd.txt,10,10,F,57,437,,,Key
286286
29616,a0a75a16,GitHub,0f133e09,data/0f133e09/test/a0a75a16.txt,10,10,F,57,437,,,Key
287-
30738,d90d9e92,GitHub,0f133e09,data/0f133e09/test/d90d9e92.py,375,375,T,27,67,,,Secret
287+
30738,d90d9e92,GitHub,0f133e09,data/0f133e09/test/d90d9e92.py,375,375,F,27,67,,digits_only-test,Secret
288288
30876,d4a67d01,GitHub,0f133e09,data/0f133e09/test/d4a67d01.txt,10,10,F,57,437,,,Key
289289
30877,d6019b5f,GitHub,0f133e09,data/0f133e09/test/d6019b5f.txt,10,10,F,74,454,,,Key
290290
30883,7400d4c5,GitHub,0f133e09,data/0f133e09/test/7400d4c5.txt,10,10,F,9,389,,,Key

meta/23689bd1.csv

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -591,3 +591,4 @@ Id,FileID,Domain,RepoName,FilePath,LineStart,LineEnd,GroundTruth,ValueStart,Valu
591591
1509831,b5304871,GitHub,23689bd1,data/23689bd1/test/b5304871.mjs,813,818,T,12,38,,,JWK
592592
1509832,b5304871,GitHub,23689bd1,data/23689bd1/test/b5304871.mjs,877,882,T,12,38,,,JWK
593593
1509833,fb6ba96e,GitHub,23689bd1,data/23689bd1/test/fb6ba96e.mjs,126,127,T,12,18,,,JWK
594+
11524147,b5304871,GitHub,23689bd1,data/23689bd1/test/b5304871.mjs,182,188,T,12,358,,,JWK

meta/2ba83c6a.csv

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -8360,8 +8360,8 @@ Id,FileID,Domain,RepoName,FilePath,LineStart,LineEnd,GroundTruth,ValueStart,Valu
83608360
113103,08190bfc,GitHub,2ba83c6a,data/2ba83c6a/test/08190bfc.txt,45,45,T,7,23,,,Salt
83618361
113104,08190bfc,GitHub,2ba83c6a,data/2ba83c6a/test/08190bfc.txt,53,53,T,7,23,,,Salt
83628362
113105,08190bfc,GitHub,2ba83c6a,data/2ba83c6a/test/08190bfc.txt,61,61,T,7,23,,,Salt
8363-
113106,03161260,GitHub,2ba83c6a,data/2ba83c6a/test/03161260.txt,26,26,T,12,21,,,Salt
8364-
113107,03161260,GitHub,2ba83c6a,data/2ba83c6a/test/03161260.txt,34,34,T,12,21,,,Salt
8363+
113106,03161260,GitHub,2ba83c6a,data/2ba83c6a/test/03161260.txt,26,26,F,12,21,,too_short,Salt
8364+
113107,03161260,GitHub,2ba83c6a,data/2ba83c6a/test/03161260.txt,34,34,F,12,21,,too_short,Salt
83658365
113108,03161260,GitHub,2ba83c6a,data/2ba83c6a/test/03161260.txt,42,42,T,15,31,,,Salt
83668366
113109,03161260,GitHub,2ba83c6a,data/2ba83c6a/test/03161260.txt,50,50,T,12,31,,,Salt
83678367
113110,03161260,GitHub,2ba83c6a,data/2ba83c6a/test/03161260.txt,59,59,T,12,31,,,Salt

meta/64c97cb8.csv

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,8 +1,8 @@
11
Id,FileID,Domain,RepoName,FilePath,LineStart,LineEnd,GroundTruth,ValueStart,ValueEnd,CryptographyKey,PredefinedPattern,Category
22
96981,602fb3c8,GitHub,64c97cb8,data/64c97cb8/src/assets/602fb3c8.xaml,115,115,F,18,28,,,Key
33
96983,22b0da6b,GitHub,64c97cb8,data/64c97cb8/test/22b0da6b.cs,37,37,T,61,113,,,Token
4-
1112601,d58d6be8,GitHub,64c97cb8,data/64c97cb8/test/d58d6be8.json,173,173,T,314,361,,,Token
5-
96985,d58d6be8,GitHub,64c97cb8,data/64c97cb8/test/d58d6be8.json,173,173,T,473,481,,,Token
4+
1112601,d58d6be8,GitHub,64c97cb8,data/64c97cb8/test/d58d6be8.json,173,173,F,314,361,,digits-letters-digits,Token
5+
96985,d58d6be8,GitHub,64c97cb8,data/64c97cb8/test/d58d6be8.json,173,173,F,473,481,,hash,Token
66
1112609,d58d6be8,GitHub,64c97cb8,data/64c97cb8/test/d58d6be8.json,173,173,F,383,447,,,Token
77
96986,6bbf6684,GitHub,64c97cb8,data/64c97cb8/docs/6bbf6684.md,3,3,F,205,232,,,Credential
88
96987,b3356305,GitHub,64c97cb8,data/64c97cb8/_/b3356305.md,14,14,F,47,64,,,Credential

meta/93ff401b.csv

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -95,3 +95,5 @@ Id,FileID,Domain,RepoName,FilePath,LineStart,LineEnd,GroundTruth,ValueStart,Valu
9595
11495526,ee27877f,GitHub,93ff401b,data/93ff401b/example/ee27877f.html,63,63,F,509,517,,,Password
9696
11495527,ee27877f,GitHub,93ff401b,data/93ff401b/example/ee27877f.html,99,99,F,508,516,,,Password
9797
11519270,5e0626e3,GitHub,93ff401b,data/93ff401b/conf/sys/5e0626e3.md,91,91,T,36,44,,,Password
98+
11524148,f0681755,GitHub,93ff401b,data/93ff401b/_/f0681755.md,1479,1479,T,28,86,,,NKEY Seed
99+
11524149,f0681755,GitHub,93ff401b,data/93ff401b/_/f0681755.md,1596,1596,T,24,82,,,NKEY Seed

0 commit comments

Comments
 (0)