Skip to content

Commit 599151a

Browse files
committed
two separate warning sets for 2019 dataset
1 parent 4fb3c87 commit 599151a

File tree

1 file changed

+6
-1
lines changed

1 file changed

+6
-1
lines changed

scripts/bundle-html-dataset.sh

+6 -1
Original file line numberDiff line numberDiff line change
@@ -19,8 +19,13 @@ psql -h $PGADDRESS -U cortex -t -o "$DTPATH/$CORPUSNAME-no_problem-tasks.txt" -c
19 19
psql -h $PGADDRESS -U cortex -t -o "$DTPATH/$CORPUSNAME-warning-tasks.txt" -c "SELECT entry FROM tasks WHERE corpus_id=$CORPUSID and service_id=$SERVICEID and status=-2"
20 20
psql -h $PGADDRESS -U cortex -t -o "$DTPATH/$CORPUSNAME-error-tasks.txt" -c "SELECT entry FROM tasks WHERE corpus_id=$CORPUSID and service_id=$SERVICEID and status=-3"
21 21

22+
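# Specific to the 08.2019 dataset: split the warning task list into 500000-line chunks and rename the first two chunks to the warning_1 and warning_2 task lists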
23+
split -l 500000 arxmliv-warning-tasks.txt
24+
mv xaa arxmliv-warning_1-tasks.txt
25+
mv xab arxmliv-warning_2-tasks.txt
26+
22 27
# For each severity, prepare a dataset archive of HTML files
23-
severitylist="no_problem warning error"
28+
severitylist="no_problem warning_1 warning_2 error"
24 29

25 30
for severity in $severitylist; do
26 31
mkdir $DTPATH/$severity

0 commit comments

Comments
 (0)