Skip to content

Commit 99df412

Browse files
authored
Merge pull request #147 from sanger-tol/dev
Dev
2 parents dcd6e07 + bc04469 commit 99df412

51 files changed

Lines changed: 1870 additions & 254 deletions

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

.nf-core.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -48,4 +48,4 @@ template:
4848
- seqera_platform
4949
- multiqc
5050
- rocrate
51-
version: 1.6.0
51+
version: 1.6.1

CHANGELOG.md

Lines changed: 24 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -3,6 +3,30 @@
33
The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/)
44
and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
55

6+
## [[1.6.1](https://github.com/sanger-tol/curationpretext/releases/tag/1.6.1)] - UNSC Trafalgar (H1) - [2025-03-13]
7+
8+
## Added and Fixed
9+
10+
- Update to add the `--run_ultra` parameter
11+
- Enum of ["yes", "no", "force"]
12+
- When run as 'yes', ultra resolution maps will be generated if the genome is > 4.Gb.
13+
- When run as 'ultra', an ultra resolution map will be generated regardless of genome size.
14+
- Update to `pretextmap` to a version that supports `--ultraRes`
15+
- Update to add the `--snapshot_order` now supported by `pretextsnapshot`
16+
- This is a `.txt` with a scaffold name per line.
17+
- Update the `repeat_density` subworkflow from local to `sanger-tol`
18+
- Update to config file to support the above fixes.
19+
- Addition of example params file `assets/example_params_file.yaml`
20+
21+
### Software Dependencies
22+
23+
Note, since the pipeline is using Nextflow DSL2, each process will be run with its own Biocontainer. This means that on occasion it is entirely possible for the pipeline to be using different versions of the same tool. However, the overall software dependency changes compared to the last release have been listed below for reference.
24+
25+
| Module | Old Version | New Versions |
26+
| ----------------- | ----------- | ------------ |
27+
| `PRETEXTMAP` | 0.1.9 | 0.2.4 |
28+
| `PRETEXTSNAPSHOT` | 0.0.5 | 0.0.7 |
29+
630
## [[1.6.0](https://github.com/sanger-tol/curationpretext/releases/tag/1.6.0)] - UNSC Trafalgar - [2025-02-19]
731

832
## Added and Fixed

README.md

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -77,6 +77,15 @@ Currently, the pipeline uses the following flags:
7777
- `--cram_chunk_size`
7878
- The number of records in a cram file should be chunked into, defaults to 10000.
7979

80+
- `--run_hires`
81+
- A boolean to run the pipeline in hires mode, i.e., generate hires resolution maps. Default is `true`
82+
83+
- `--run_ultra`
84+
- A string argument to run the pipeline in ultra resolution mode, i.e., generate ultra resolution maps. Options are: `yes`, `force`, `no`. Default is `yes`, this runs ultra resolution maps is the genome file is > 4.Gb.
85+
86+
- `--snapshot_order`
87+
- A path to a `genome`, `sizes` or `fai` file containing the scaffolds in the order required for the output snapshot png file.
88+
8089
Now, you can run the pipeline using:
8190

8291
```bash

assets/example_params_file.yaml

Lines changed: 14 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,14 @@
1+
sample: "CurationPretextTest_MIN"
2+
teloseq: "TTA"
3+
aligner: "bwamem2"
4+
all_output: false
5+
skip_tracks: "NONE"
6+
run_hires: false
7+
run_ultra: "force"
8+
split_telomere: true
9+
input: "https://tolit.cog.sanger.ac.uk/test-data/resources/treeval/TreeValTinyData/assembly/draft/grTriPseu1.fa"
10+
reads:
11+
- "https://tolit.cog.sanger.ac.uk/test-data/resources/treeval/TreeValTinyData/genomic_data/pacbio/seqkitPacbio50000.fasta.gz"
12+
cram:
13+
- "https://tolit.cog.sanger.ac.uk/test-data/resources/treeval/TreeValTinyData/genomic_data/hic-arima/SUBSET-1000.cram"
14+
- "https://tolit.cog.sanger.ac.uk/test-data/resources/treeval/TreeValTinyData/genomic_data/hic-arima/SUBSET-2000.cram"

assets/schema_input.json

Lines changed: 0 additions & 33 deletions
This file was deleted.

conf/base.config

Lines changed: 10 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -47,7 +47,7 @@ process {
4747

4848
withName: ".*:ALIGN_CRAM:CRAMALIGN_BWAMEM2ALIGNHIC" {
4949
cpus = { 16 * 1 }
50-
memory = { 1.GB * ( reference.size() < 2e9 ? 80 : Math.ceil( ( reference.size() / 1e+9 ) * 30 ) * Math.ceil( task.attempt * 1 ) ) }
50+
memory = { 1.GB * ( reference.size() < 2e9 ? 80 : Math.ceil( ( reference.size() / 1e+9 ) * 30 ) * task.attempt ) }
5151
}
5252

5353
withName: ".*:ALIGN_CRAM:CRAMALIGN_MINIMAP2ALIGNHIC" {
@@ -69,14 +69,20 @@ process {
6969
}
7070

7171
withName: ".*:CREATE_MAPS_STDRD:PRETEXTMAP" {
72-
cpus = { 8 * 1 }
72+
cpus = { 6 * 1 }
7373
memory = { 3.GB * task.attempt }
7474
time = { 1.h * ( ( fasta.size() < 4e9 ? 24 : 48 ) * task.attempt ) }
7575
}
7676

7777
withName: ".*:CREATE_MAPS_HIRES:PRETEXTMAP" {
78-
cpus = { 8 * task.attempt }
79-
memory = { 20.GB * Math.ceil( task.attempt * 2.6 ) }
78+
cpus = { 6 * task.attempt }
79+
memory = { 20.GB * task.attempt }
80+
time = { 1.h * ( ( fasta.size() < 4e9 ? 24 : 48 ) * Math.ceil( task.attempt * 1 ) ) }
81+
}
82+
83+
withName: ".*:CREATE_MAPS_ULTRA:PRETEXTMAP" {
84+
cpus = { 6 * task.attempt }
85+
memory = { 40.GB * task.attempt }
8086
time = { 1.h * ( ( fasta.size() < 4e9 ? 24 : 48 ) * Math.ceil( task.attempt * 1 ) ) }
8187
}
8288

conf/modules.config

Lines changed: 17 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ process {
1515
//
1616
// NOTE: GROUP THE PUBLISHDIR DIRECTIVES
1717
//
18-
withName: 'PRETEXT_INGEST_SNDRD|PRETEXT_INGEST_HIRES' {
18+
withName: 'PRETEXT_INGEST_SNDRD|PRETEXT_INGEST_HIRES|PRETEXT_INGEST_ULTRA' {
1919
publishDir = [
2020
[
2121
path: { "${params.outdir}/pretext_maps_processed" },
@@ -29,6 +29,12 @@ process {
2929
mode: params.publish_dir_mode,
3030
saveAs: { filename -> filename.equals('versions.yml') ? null : filename },
3131
],
32+
[
33+
path: { "${params.outdir}/pretext_maps_processed" },
34+
pattern: "*ultra.pretext",
35+
mode: params.publish_dir_mode,
36+
saveAs: { filename -> filename.equals('versions.yml') ? null : filename },
37+
],
3238
]
3339
}
3440

@@ -40,7 +46,7 @@ process {
4046
saveAs: { filename -> filename.equals('versions.yml') ? null : filename },
4147
]
4248
]
43-
ext.args = { "--sequences '=full' --resolution 1440 --memory ${task.memory}" }
49+
ext.args = { (order_file ? "" : "--sequences '=full'") + " --resolution 1440 --memory ${task.memory}" }
4450
ext.prefix = { "${meta.id}_normal" }
4551
}
4652

@@ -55,7 +61,7 @@ process {
5561
]
5662
}
5763

58-
withName: ".*:REPEAT_DENSITY:UCSC_BEDGRAPHTOBIGWIG" {
64+
withName: ".*:REPEAT_DENSITY:FEATURE_DENSITY:UCSC_BEDGRAPHTOBIGWIG" {
5965
ext.prefix = { "${meta.id}_repeat_density" }
6066
}
6167

@@ -84,7 +90,6 @@ process {
8490
}
8591

8692
withName: 'GAWK_RENAME_IDS' {
87-
ext.args2 = "'{ gsub(/\\./, \"0\"); print}'"
8893
ext.suffix = '_renamed.bed'
8994
}
9095

@@ -170,9 +175,9 @@ process {
170175
ext.prefix = { "${meta.id}_hr" }
171176
}
172177

173-
withName: "PRETEXTSNAPSHOT" {
174-
ext.args = { "--sequences '=full' --resolution 1440 --memory ${task.memory}" }
175-
ext.prefix = { "${meta.id}_normal" }
178+
withName: "PRETEXT_INGEST_ULTRA" {
179+
ext.args = { "--textureBuffer 1G" }
180+
ext.prefix = { "${meta.id}_ultra" }
176181
}
177182

178183
//
@@ -238,6 +243,11 @@ process {
238243
ext.prefix = { "${meta.id}_hr_pi" }
239244
}
240245

246+
withName: ".*:CREATE_MAPS_ULTRA:PRETEXTMAP" {
247+
ext.args = { "${meta.map_order.equals("length") ? "--sortby length": "--sortby nosort" } --ultraRes --mapq ${params.multi_mapping}" }
248+
ext.prefix = { "${meta.id}_ultra_pi" }
249+
}
250+
241251
withName: ".*:ALIGN_CRAM:CRAMALIGN_BWAMEM2ALIGNHIC" {
242252
ext.args = ""
243253
ext.args2 = "-F0xB00 -nt"

conf/test.config

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -32,5 +32,6 @@ params {
3232
all_output = false
3333
skip_tracks = "NONE"
3434
run_hires = false
35+
run_ultra = "no"
3536
split_telomere = true
3637
}

conf/test_full.config

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -29,6 +29,7 @@ params {
2929
all_output = true
3030
skip_tracks = "NONE"
3131
run_hires = true
32+
run_ultra = "force"
3233
split_telomere = true
3334

3435
}

conf/very_large_resources.config

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -73,4 +73,10 @@ process {
7373
memory = { 40.GB * task.attempt }
7474
time = { 20.h * task.attempt }
7575
}
76+
77+
withName: CRAMALIGN_BWAMEM2ALIGNHIC {
78+
cpus = { 16 * 1 }
79+
memory = { 100.GB * task.attempt }
80+
time = { 40.h * task.attempt }
81+
}
7682
}

0 commit comments

Comments
 (0)