4
4
# filename: standard_dashboard.sh
5
5
# authors: Sage Wright, Kevin Libuit, Frank Ambrosio
6
6
7
- VERSION=" Google Dashboarding v0.1 "
7
+ VERSION=" Google Dashboarding v0.3 "
8
8
9
9
showHelp () {
10
10
cat << EOF
11
- Google Dashboarding v0.1
11
+ Google Dashboarding v0.3
12
12
This script is configured to work within a Google Batch job managed by a Google Workflow and Trigger.
13
13
The following variables need to be passed in as input parameters.
14
14
CAUTION: The entire command length must be under 400 characters; using the short version of arguments is recommended
@@ -29,13 +29,14 @@ Usage: ./standard_dashboard.sh
29
29
[ -q | --big-query-table-name ] the name of the big query table to upload to ("sars_cov_2_dashboard.workflow_la_state_gisaid_specimens_test")
30
30
[ -m | --puerto-rico ] apply Puerto Rico-specific changes. available options: true or false
31
31
[ -i | --input-tar-file ] the tar file given to the script by the Google Trigger
32
-
32
+ [ -k | --skip-bq-load ] skips the bq load step. available options: true or false
33
+ [ -x | --helix ] apply Helix-specific changes. available options: true or false
33
34
Happy dashboarding!
34
35
EOF
35
36
}
36
37
37
38
# use getopt to parse the input arguments
38
- PARSED_ARGUMENTS=$( getopt -n " standard-dashboard" -o " hvd:j: s:b:o:t:g:r:p:w:q:m:i:" -l " version,help,dashboard-gcp-uri:,dashboard-newline-json:,dashboard- schema:,gisaid-backup-dir:,output-dir:,trigger-bucket:,terra-gcp-uri:,terra-table-root-entity:,terra-project:,terra-workspace:,big-query-table-name:,puerto-rico:,input-tar-file:" -a -- " $@ " )
39
+ PARSED_ARGUMENTS=$( getopt -n " standard-dashboard" -o " hvd:s:b:o:t:g:r:p:w:q:m:i:k:x: " -l " version,help,dashboard-gcp-uri:,dashboard-schema:,gisaid-backup-dir:,output-dir:,trigger-bucket:,terra-gcp-uri:,terra-table-root-entity:,terra-project:,terra-workspace:,big-query-table-name:,puerto-rico:,input-tar-file:,skip-bq-load:,helix :" -a -- " $@ " )
39
40
40
41
eval set -- " $PARSED_ARGUMENTS "
41
42
@@ -47,8 +48,6 @@ while true; do
47
48
showHelp; exit 0;;
48
49
-d|--dashboard-gcp-uri)
49
50
dashboard_gcp_uri=$2 ; shift 2;;
50
- -j|--dashboard-newline-json)
51
- dashboard_newline_json=$2 ; shift 2;;
52
51
-s|--dashboard_schema)
53
52
dashboard_schema=$2 ; shift 2;;
54
53
-b|--gisaid-backup-dir)
@@ -71,6 +70,10 @@ while true; do
71
70
puerto_rico=$2 ; shift 2;;
72
71
-i|--input-tar-file)
73
72
input_tar_file=$2 ; shift 2;;
73
+ -k|--skip-bq-load)
74
+ skip_bq_load=$2 ; shift 2;;
75
+ -x|--helix)
76
+ helix=$2 ; shift 2;;
74
77
--) shift ; break ;;
75
78
* ) echo " Unexpected option: $1 -- this should not happen." ; exit 1;;
76
79
esac
@@ -100,7 +103,7 @@ make_directory ${output_dir}/backup_jsons
100
103
101
104
# echo the variables that were provided
102
105
echo -e " Dashboarding Automated System initiated at ${date_tag} \n" | tee ${output_dir} /automation_logs/dashboard-${date_tag} .log
103
- echo -e " Input variables:\ndashboard_gcp_uri: ${dashboard_gcp_uri} ,\ndashboard_newline_json: ${dashboard_newline_json} ,\ ndashboard_bq_load_schema: ${dashboard_schema} ,\ngisaid_backup_dir: ${gisaid_backup_dir} ,\nmounted_output_dir: ${output_dir} ,\ntrigger_bucket_gcp_uri: ${trigger_bucket} ,\nterra_gcp_uri: ${terra_gcp_uri} ,\nterra_table_root_entity: ${terra_table_root_entity} ,\nterra_project: ${terra_project} ,\nterra_workspace: ${terra_workspace} ,\nbig_query_table_name: ${big_query_table_name} \n" >> ${output_dir} /automation_logs/dashboard-${date_tag} .log
106
+ echo -e " Input variables:\ndashboard_gcp_uri: ${dashboard_gcp_uri} ,\ndashboard_bq_load_schema: ${dashboard_schema} ,\ngisaid_backup_dir: ${gisaid_backup_dir} ,\nmounted_output_dir: ${output_dir} ,\ntrigger_bucket_gcp_uri: ${trigger_bucket} ,\nterra_gcp_uri: ${terra_gcp_uri} ,\nterra_table_root_entity: ${terra_table_root_entity} ,\nterra_project: ${terra_project} ,\nterra_workspace: ${terra_workspace} ,\nbig_query_table_name: ${big_query_table_name} \n" >> ${output_dir} /automation_logs/dashboard-${date_tag} .log
104
107
105
108
# take in file as input from trigger
106
109
file=${trigger_bucket} /${input_tar_file}
@@ -131,17 +134,17 @@ if [[ "$file" == *"gisaid_auspice_input"*"tar" ]]; then
131
134
\n
132
135
# Create individual fasta files from GISAID multifasta
133
136
\n
134
- python3 /scripts/gisaid_multifasta_parser.py ${gisaid_dir} /*.sequences.fasta ${gisaid_dir} ${puerto_rico}
137
+ python3 /scripts/gisaid_multifasta_parser.py ${gisaid_dir} /*.sequences.fasta ${gisaid_dir} ${puerto_rico} ${helix}
135
138
\n
136
139
\n
137
140
# Deposit individual fasta files into Terra GCP bucket
138
141
\n
139
- gsutil -m cp ${gisaid_dir} /individual_gisaid_assemblies_$( date -I ) /*.fasta ${terra_gcp_uri} /uploads/gisaid_individual_assemblies_$( date -I ) /
142
+ gsutil -m cp ${gisaid_dir} /individual_gisaid_assemblies_${date_tag} /*.fasta ${terra_gcp_uri} /uploads/gisaid_individual_assemblies_${date_tag} /
140
143
\n
141
144
\n
142
145
# Create and import Terra Data table containing GCP pointers to deposited assemblies
143
146
\n
144
- /scripts/terra_table_from_gcp_assemblies.sh ${terra_gcp_uri} /uploads/gisaid_individual_assemblies_$( date -I ) ${terra_project} ${terra_workspace} ${terra_table_root_entity} ${gisaid_dir} \" .fasta\" $( date -I )
147
+ /scripts/terra_table_from_gcp_assemblies.sh ${terra_gcp_uri} /uploads/gisaid_individual_assemblies_${date_tag} ${terra_project} ${terra_workspace} ${terra_table_root_entity} ${gisaid_dir} \" .fasta\" ${date_tag}
145
148
\n
146
149
\n
147
150
# Capture, reformat, and prune GISAID metadata
@@ -154,6 +157,38 @@ if [[ "$file" == *"gisaid_auspice_input"*"tar" ]]; then
154
157
python3 /scripts/import_large_tsv/import_large_tsv.py --project ${terra_project} --workspace ${terra_workspace} --tsv ${gisaid_dir} /gisaid_metadata_${date_tag} .tsv
155
158
\n
156
159
\n
160
+ if ${skip_bq_load} ; then
161
+ \n
162
+ # Make a set table
163
+ \n
164
+ /scripts/make_set_table.sh ${terra_gcp_uri} /uploads/gisaid_individual_assemblies_${date_tag} ${terra_project} ${terra_workspace} ${terra_table_root_entity} ${gisaid_dir} \" .fasta\" ${date_tag}
165
+ \n
166
+ \n
167
+ # Run TheiaCoV_FASTA on the set
168
+ \n
169
+ TOKEN=` gcloud auth print-access-token`
170
+ \n
171
+ curl -X 'POST' \
172
+ 'https://api.firecloud.org/api/workspaces/${terra_project} /${terra_workspace} /submissions' \
173
+ -H 'accept: */*' \
174
+ -H " Authorization: Bearer ${TOKEN} " \
175
+ -H 'Content-Type: application/json' \
176
+ -d \" {
177
+ \" methodConfigurationNamespace\" : \" ${terra_project} \" ,
178
+ \" methodConfigurationName\" : \" TheiaCoV_FASTA_PHB\" ,
179
+ \" entityType\" : \" ${terra_table_root_entity} _set\" ,
180
+ \" entityName\" : \" ${date_tag} -set\" ,
181
+ \" expression\" : \" this.${terra_table_root_entity} s\" ,
182
+ \" useCallCache\" : true,
183
+ \" deleteIntermediateOutputFiles\" : false,
184
+ \" useReferenceDisks\" : false,
185
+ \" memoryRetryMultiplier\" : 1,
186
+ \" workflowFailureMode\" : \" NoNewCalls\" ,
187
+ \" userComment\" : \" ${date_tag} -set automatically launched\"
188
+ }\"
189
+ \n
190
+ \n
191
+ else
157
192
# Capture the entire Terra data table as a tsv
158
193
\n
159
194
python3 /scripts/export_large_tsv/export_large_tsv.py --project ${terra_project} --workspace ${terra_workspace} --entity_type ${terra_table_root_entity} --tsv_filename ${gisaid_dir} /full_${terra_table_root_entity} _terra_table_${date_tag} .tsv
@@ -175,6 +210,8 @@ if [[ "$file" == *"gisaid_auspice_input"*"tar" ]]; then
175
210
\n
176
211
bq load --ignore_unknown_values=true --replace=true --source_format=NEWLINE_DELIMITED_JSON ${big_query_table_name} ${dashboard_gcp_uri} /${terra_table_root_entity} .json ${dashboard_schema}
177
212
\n
213
+ fi
214
+ \n
178
215
\n
179
216
"
180
217
# write the commands that will be run to the automation log
0 commit comments