Skip to content

Commit 89d8dc0

Browse files
authored
Merge pull request #627 from broadinstitute/dp-norm
Upgrade to viral-core 2.5.20 with optimized BAM filtering
2 parents 5b3b9ea + 862af51 commit 89d8dc0

16 files changed

+465
-290
lines changed

CLAUDE.md

Lines changed: 47 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -188,3 +188,50 @@ Image versions are pinned in `requirements-modules.txt` and must be kept in sync
188188
## Dockstore Integration
189189

190190
Workflows are registered on Dockstore for easy import to Terra, DNAnexus, and other platforms. The `.dockstore.yml` file defines all published workflows and their test parameter files.
191+
192+
## Terra Performance Analysis
193+
194+
When analyzing workflow performance from Terra submissions, use the Terra MCP tools for structure/status queries and direct GCS access for log analysis.
195+
196+
### Timing Methodology for WDL Tasks
197+
198+
When measuring task execution time from Terra logs:
199+
200+
1. **Start time**: Use the first Python log timestamp in stderr
201+
- Pattern: `^(\d{4}-\d{2}-\d{2} \d{2}:\d{2}:\d{2}),\d+`
202+
203+
2. **End time**: Use the GCS file modification timestamp of the stderr file
204+
- Get via: `gcloud storage ls -l <path>/stderr`
205+
   - This captures ALL execution, including post-Python BAM I/O
206+
207+
3. **Why not use Python log end time?**
208+
- Many tasks run external tools (Java, pysam) after Python logging ends
209+
- Python logs don't capture full execution time
210+
211+
### Efficient GCS Queries with Wildcards
212+
213+
Use wildcards to batch GCS queries instead of iterating:
214+
```bash
215+
# Get all stderr files from a submission with timestamps in one query
216+
gcloud storage ls -l "gs://bucket/submissions/<sub_id>/classify_single/*/call-deplete/stderr"
217+
gcloud storage ls -l "gs://bucket/submissions/<sub_id>/classify_single/*/call-deplete/attempt-*/stderr"
218+
```
219+
220+
### Handling Preemption Retries
221+
222+
When a task is preempted, Cromwell creates `attempt-*` directories:
223+
```
224+
call-deplete/
225+
stderr # First attempt (may be incomplete)
226+
attempt-2/ # Second attempt
227+
stderr # Final successful run
228+
```
229+
230+
**Always use the final (highest-numbered) attempt** for performance analysis - preemption time shouldn't count against code performance.
231+
232+
### Sample Identification
233+
234+
To identify which workflow corresponds to which sample:
235+
1. Read the first few KB of stderr from each workflow
236+
2. Look for sample name in BAM file paths (e.g., `/S20.l1.xxxx.bam`)
237+
3. Cache the sample-to-workflow mapping for reuse

pipes/WDL/tasks/tasks_assembly.wdl

Lines changed: 50 additions & 18 deletions
Original file line numberDiff line numberDiff line change
@@ -60,7 +60,7 @@ task assemble {
6060

6161
Int disk_size = 375
6262

63-
command {
63+
command <<<
6464
set -ex -o pipefail
6565
6666
# find 90% memory
@@ -82,20 +82,28 @@ task assemble {
8282
--loglevel=DEBUG
8383
8484
samtools view -c ~{sample_name}.subsamp.bam | tee subsample_read_count >&2
85-
}
85+
86+
cat /proc/uptime | cut -f 1 -d ' ' > UPTIME_SEC
87+
cat /proc/loadavg | cut -f 3 -d ' ' > LOAD_15M
88+
set +o pipefail
89+
{ if [ -f /sys/fs/cgroup/memory.peak ]; then cat /sys/fs/cgroup/memory.peak; elif [ -f /sys/fs/cgroup/memory/memory.peak ]; then cat /sys/fs/cgroup/memory/memory.peak; elif [ -f /sys/fs/cgroup/memory/memory.max_usage_in_bytes ]; then cat /sys/fs/cgroup/memory/memory.max_usage_in_bytes; else echo "0"; fi; } > MEM_BYTES
90+
>>>
8691

8792
output {
8893
File contigs_fasta = "~{sample_name}.assembly1-spades.fasta"
8994
File subsampBam = "~{sample_name}.subsamp.bam"
9095
Int subsample_read_count = read_int("subsample_read_count")
96+
Int max_ram_gb = ceil(read_float("MEM_BYTES")/1000000000)
97+
Int runtime_sec = ceil(read_float("UPTIME_SEC"))
98+
Int cpu_load_15min = ceil(read_float("LOAD_15M"))
9199
String viralngs_version = read_string("VERSION")
92100
}
93101

94102
runtime {
95103
docker: docker
96104
memory: select_first([machine_mem_gb, 63]) + " GB"
97105
cpu: 4
98-
disks: "local-disk " + disk_size + " LOCAL"
106+
disks: "local-disk " + disk_size + " HDD"
99107
disk: disk_size + " GB" # TES
100108
dx_instance_type: "mem1_ssd1_v2_x8"
101109
maxRetries: 2
@@ -162,6 +170,11 @@ task select_references {
162170
# create top-hits output files
163171
cut -f 1 "~{contigs_basename}.refs_skani_dist.top.tsv" | tail +2 > TOP_FASTAS
164172
for f in $(cat TOP_FASTAS); do basename "$f" .fasta; done > TOP_FASTAS_BASENAMES
173+
174+
cat /proc/uptime | cut -f 1 -d ' ' > UPTIME_SEC
175+
cat /proc/loadavg | cut -f 3 -d ' ' > LOAD_15M
176+
set +o pipefail
177+
{ if [ -f /sys/fs/cgroup/memory.peak ]; then cat /sys/fs/cgroup/memory.peak; elif [ -f /sys/fs/cgroup/memory/memory.peak ]; then cat /sys/fs/cgroup/memory/memory.peak; elif [ -f /sys/fs/cgroup/memory/memory.max_usage_in_bytes ]; then cat /sys/fs/cgroup/memory/memory.max_usage_in_bytes; else echo "0"; fi; } > MEM_BYTES
165178
>>>
166179

167180
output {
@@ -171,13 +184,16 @@ task select_references {
171184
Array[File] top_matches_per_cluster_fastas = read_lines("TOP_FASTAS")
172185
File skani_dist_full_tsv = "~{contigs_basename}.refs_skani_dist.full.tsv"
173186
File skani_dist_top_tsv = "~{contigs_basename}.refs_skani_dist.top.tsv"
187+
Int max_ram_gb = ceil(read_float("MEM_BYTES")/1000000000)
188+
Int runtime_sec = ceil(read_float("UPTIME_SEC"))
189+
Int cpu_load_15min = ceil(read_float("LOAD_15M"))
174190
}
175191

176192
runtime {
177193
docker: docker
178194
memory: machine_mem_gb + " GB"
179195
cpu: cpu
180-
disks: "local-disk " + disk_size + " LOCAL"
196+
disks: "local-disk " + disk_size + " HDD"
181197
disk: disk_size + " GB" # TESs
182198
dx_instance_type: "mem1_ssd1_v2_x2"
183199
preemptible: 2
@@ -197,9 +213,9 @@ task scaffold {
197213
Int replace_length=55
198214
Boolean allow_incomplete_output = false
199215

200-
Int? skani_m
201-
Int? skani_s
202-
Int? skani_c
216+
Int? skani_m
217+
Int? skani_s
218+
Int? skani_c
203219

204220
Int? nucmer_max_gap
205221
Int? nucmer_min_match
@@ -387,6 +403,11 @@ task scaffold {
387403
~{'--aligner=' + aligner} \
388404
--loglevel=DEBUG
389405
fi
406+
407+
cat /proc/uptime | cut -f 1 -d ' ' > UPTIME_SEC
408+
cat /proc/loadavg | cut -f 3 -d ' ' > LOAD_15M
409+
set +o pipefail
410+
{ if [ -f /sys/fs/cgroup/memory.peak ]; then cat /sys/fs/cgroup/memory.peak; elif [ -f /sys/fs/cgroup/memory/memory.peak ]; then cat /sys/fs/cgroup/memory/memory.peak; elif [ -f /sys/fs/cgroup/memory/memory.max_usage_in_bytes ]; then cat /sys/fs/cgroup/memory/memory.max_usage_in_bytes; else echo "0"; fi; } > MEM_BYTES
390411
>>>
391412

392413
output {
@@ -406,14 +427,17 @@ task scaffold {
406427
Float skani_ani = read_float("SKANI_ANI")
407428
Float skani_ref_aligned_frac = read_float("SKANI_REF_AF")
408429
Float skani_contigs_aligned_frac = read_float("SKANI_CONTIGS_AF")
430+
Int max_ram_gb = ceil(read_float("MEM_BYTES")/1000000000)
431+
Int runtime_sec = ceil(read_float("UPTIME_SEC"))
432+
Int cpu_load_15min = ceil(read_float("LOAD_15M"))
409433
String viralngs_version = read_string("VERSION")
410434
}
411435

412436
runtime {
413437
docker: docker
414438
memory: select_first([machine_mem_gb, 63]) + " GB"
415439
cpu: 4
416-
disks: "local-disk " + disk_size + " LOCAL"
440+
disks: "local-disk " + disk_size + " HDD"
417441
disk: disk_size + " GB" # TES
418442
dx_instance_type: "mem1_ssd1_v2_x8"
419443
maxRetries: 2
@@ -498,7 +522,7 @@ task skani_triangle {
498522
docker: docker
499523
memory: machine_mem_gb + " GB"
500524
cpu: cpu
501-
disks: "local-disk " + disk_size + " LOCAL"
525+
disks: "local-disk " + disk_size + " SSD"
502526
disk: disk_size + " GB" # TES
503527
dx_instance_type: "mem1_ssd1_v2_x4"
504528
preemptible: 2
@@ -550,7 +574,7 @@ task ivar_trim {
550574
}
551575
}
552576

553-
command {
577+
command <<<
554578
ivar version | head -1 | tee VERSION
555579
if [ -f "~{trim_coords_bed}" ]; then
556580
ivar trim -e \
@@ -569,7 +593,7 @@ task ivar_trim {
569593
PCT=$(grep "Trimmed primers from" IVAR_OUT | perl -lape 's/Trimmed primers from (\S+)%.*/$1/')
570594
if [[ $PCT = -* ]]; then echo 0; else echo $PCT; fi > IVAR_TRIM_PCT
571595
grep "Trimmed primers from" IVAR_OUT | perl -lape 's/Trimmed primers from \S+% \((\d+)\).*/$1/' > IVAR_TRIM_COUNT
572-
}
596+
>>>
573597

574598
output {
575599
File aligned_trimmed_bam = "~{bam_basename}.trimmed.bam"
@@ -582,7 +606,7 @@ task ivar_trim {
582606
docker: docker
583607
memory: select_first([machine_mem_gb, 7]) + " GB"
584608
cpu: 4
585-
disks: "local-disk " + disk_size + " LOCAL"
609+
disks: "local-disk " + disk_size + " HDD"
586610
disk: disk_size + " GB" # TES
587611
dx_instance_type: "mem1_ssd1_v2_x4"
588612
maxRetries: 2
@@ -672,7 +696,7 @@ task align_reads {
672696

673697
Int? cpu
674698
Int? machine_mem_gb
675-
String docker = "quay.io/broadinstitute/viral-core:2.5.18"
699+
String docker = "quay.io/broadinstitute/viral-core:2.5.20"
676700

677701
String sample_name = basename(basename(basename(reads_unmapped_bam, ".bam"), ".taxfilt"), ".clean")
678702
}
@@ -787,7 +811,7 @@ task align_reads {
787811
docker: docker
788812
memory: machine_mem_gb_actual + " GB"
789813
cpu: cpu_actual
790-
disks: "local-disk " + disk_size + " LOCAL"
814+
disks: "local-disk " + disk_size + " SSD"
791815
disk: disk_size + " GB" # TES
792816
dx_instance_type: "mem1_ssd1_v2_x8"
793817
preemptible: 1
@@ -905,6 +929,11 @@ task refine_assembly_with_aligned_reads {
905929
set +o pipefail # grep will exit 1 if it fails to find the pattern
906930
grep -v '^>' trimmed.fasta | tr -d '\n' | wc -c | tee assembly_length
907931
grep -v '^>' trimmed.fasta | tr -d '\nNn' | wc -c | tee assembly_length_unambiguous
932+
933+
cat /proc/uptime | cut -f 1 -d ' ' > UPTIME_SEC
934+
cat /proc/loadavg | cut -f 3 -d ' ' > LOAD_15M
935+
set +o pipefail
936+
{ if [ -f /sys/fs/cgroup/memory.peak ]; then cat /sys/fs/cgroup/memory.peak; elif [ -f /sys/fs/cgroup/memory/memory.peak ]; then cat /sys/fs/cgroup/memory/memory.peak; elif [ -f /sys/fs/cgroup/memory/memory.max_usage_in_bytes ]; then cat /sys/fs/cgroup/memory/memory.max_usage_in_bytes; else echo "0"; fi; } > MEM_BYTES
908937
>>>
909938

910939
output {
@@ -914,14 +943,17 @@ task refine_assembly_with_aligned_reads {
914943
Int assembly_length_unambiguous = read_int("assembly_length_unambiguous")
915944
Int dist_to_ref_snps = read_int("num_snps")
916945
Int dist_to_ref_indels = read_int("num_indels")
946+
Int max_ram_gb = ceil(read_float("MEM_BYTES")/1000000000)
947+
Int runtime_sec = ceil(read_float("UPTIME_SEC"))
948+
Int cpu_load_15min = ceil(read_float("LOAD_15M"))
917949
String viralngs_version = read_string("VERSION")
918950
}
919951

920952
runtime {
921953
docker: docker
922954
memory: machine_mem_gb + " GB"
923955
cpu: 8
924-
disks: "local-disk " + disk_size + " LOCAL"
956+
disks: "local-disk " + disk_size + " SSD"
925957
disk: disk_size + " GB" # TES
926958
dx_instance_type: "mem1_ssd1_v2_x8"
927959
maxRetries: 2
@@ -940,7 +972,7 @@ task run_discordance {
940972
String out_basename = "run"
941973
Int min_coverage = 4
942974

943-
String docker = "quay.io/broadinstitute/viral-core:2.5.18"
975+
String docker = "quay.io/broadinstitute/viral-core:2.5.20"
944976
}
945977
parameter_meta {
946978
reads_aligned_bam: {
@@ -960,7 +992,7 @@ task run_discordance {
960992

961993
Int disk_size = 100
962994

963-
command {
995+
command <<<
964996
set -ex -o pipefail
965997
966998
read_utils.py --version | tee VERSION
@@ -1026,7 +1058,7 @@ task run_discordance {
10261058
echo 0 > num_discordant_snps
10271059
echo 0 > num_discordant_indels
10281060
fi
1029-
}
1061+
>>>
10301062

10311063
output {
10321064
File discordant_sites_vcf = "~{out_basename}.discordant.vcf"

pipes/WDL/tasks/tasks_demux.wdl

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -6,12 +6,12 @@ task merge_tarballs {
66
String out_filename
77

88
Int? machine_mem_gb
9-
String docker = "quay.io/broadinstitute/viral-core:2.5.18"
9+
String docker = "quay.io/broadinstitute/viral-core:2.5.20"
1010
}
1111

1212
Int disk_size = 2625
1313

14-
command {
14+
command <<<
1515
set -ex -o pipefail
1616
1717
if [ -z "$TMPDIR" ]; then
@@ -23,7 +23,7 @@ task merge_tarballs {
2323
file_utils.py merge_tarballs \
2424
~{out_filename} ~{sep=' ' tar_chunks} \
2525
--loglevel=DEBUG
26-
}
26+
>>>
2727

2828
output {
2929
File combined_tar = "~{out_filename}"
@@ -181,7 +181,7 @@ task illumina_demux {
181181
# --- options for VM shape ----------------------
182182
Int? machine_mem_gb
183183
Int disk_size = 2625
184-
String docker = "quay.io/broadinstitute/viral-core:2.5.18"
184+
String docker = "quay.io/broadinstitute/viral-core:2.5.20"
185185
}
186186

187187
parameter_meta {
@@ -823,7 +823,7 @@ task get_illumina_run_metadata {
823823
String? sequencing_center
824824

825825
Int? machine_mem_gb
826-
String docker = "quay.io/broadinstitute/viral-core:2.5.18"
826+
String docker = "quay.io/broadinstitute/viral-core:2.5.20"
827827
}
828828

829829
parameter_meta {
@@ -927,7 +927,7 @@ task demux_fastqs {
927927
Int? machine_mem_gb
928928
Int max_cpu = 32 # Maximum CPU cap for autoscaling (use 16 for 2-barcode, 64 for 3-barcode)
929929
Int disk_size = 750
930-
String docker = "quay.io/broadinstitute/viral-core:2.5.18"
930+
String docker = "quay.io/broadinstitute/viral-core:2.5.20"
931931
}
932932

933933
# Calculate total input size for autoscaling
@@ -1056,7 +1056,7 @@ task merge_demux_metrics {
10561056
input {
10571057
Array[File]+ metrics_files
10581058
String output_filename = "merged_demux_metrics.txt"
1059-
String docker = "quay.io/broadinstitute/viral-core:2.5.18"
1059+
String docker = "quay.io/broadinstitute/viral-core:2.5.20"
10601060
}
10611061

10621062
parameter_meta {

pipes/WDL/tasks/tasks_interhost.wdl

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -351,7 +351,7 @@ task index_ref {
351351
File? novocraft_license
352352

353353
Int? machine_mem_gb
354-
String docker = "quay.io/broadinstitute/viral-core:2.5.18"
354+
String docker = "quay.io/broadinstitute/viral-core:2.5.20"
355355
}
356356

357357
Int disk_size = 100

0 commit comments

Comments
 (0)