-
Notifications
You must be signed in to change notification settings - Fork 88
Expand file tree
/
Copy pathmanipulate_damage.nf
More file actions
178 lines (149 loc) · 9.28 KB
/
manipulate_damage.nf
File metadata and controls
178 lines (149 loc) · 9.28 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
//
// Calculate PMD scores, trim, or rescale DNA damage from mapped reads.
//
include { addNewMetaFromAttributes } from '../../subworkflows/local/utils_nfcore_eager_pipeline/main'
include { BEDTOOLS_MASKFASTA } from '../../modules/nf-core/bedtools/maskfasta/main'
include { MAPDAMAGE2 } from '../../modules/nf-core/mapdamage2/main'
include { PMDTOOLS_FILTER } from '../../modules/nf-core/pmdtools/filter/main'
include { BAMUTIL_TRIMBAM } from '../../modules/nf-core/bamutil/trimbam/main'
include { SAMTOOLS_INDEX as SAMTOOLS_INDEX_DAMAGE_RESCALED } from '../../modules/nf-core/samtools/index/main'
include { SAMTOOLS_INDEX as SAMTOOLS_INDEX_DAMAGE_FILTERED } from '../../modules/nf-core/samtools/index/main'
include { SAMTOOLS_INDEX as SAMTOOLS_INDEX_DAMAGE_TRIMMED } from '../../modules/nf-core/samtools/index/main'
include { SAMTOOLS_FLAGSTAT as SAMTOOLS_FLAGSTAT_DAMAGE_FILTERED } from '../../modules/nf-core/samtools/flagstat/main'
// TODO: Add required channels and channel manipulations for reference-dependent bed masking before pmdtools. Requires multi-ref support before implementation.
workflow MANIPULATE_DAMAGE {
take:
ch_bam_bai // [ [ meta ], bam , bai ]
ch_fasta // [ [ meta ], fasta ]
ch_pmd_masking // [ [ meta ], masked_fasta, bed_for_masking ]
main:
ch_versions = Channel.empty()
ch_rescaled_bams = Channel.empty()
ch_pmd_filtered_bams = Channel.empty()
ch_trimmed_bams = Channel.empty()
ch_pmd_filtered_flagstat = Channel.empty() // Only run flagstat on pmd filtered bam, since rescaling and trimming does not change the number of reads
// Ensure correct reference is associated with each bam_bai pair
ch_refs = ch_fasta
.map {
// Prepend a new meta that contains the meta.id value as the new_meta.reference attribute
addNewMetaFromAttributes( it, "id" , "reference" , false )
}
ch_input_for_damage_manipulation = ch_bam_bai
.map {
// Prepend a new meta that contains the meta.reference value as the new_meta.reference attribute
addNewMetaFromAttributes( it, "reference" , "reference" , false )
}
.combine( ch_refs, by: 0 ) // [ [combine_meta], [meta], bam, bai, [ref_meta], fasta ]
if ( params.run_mapdamage_rescaling ) {
ch_mapdamage_prep = ch_input_for_damage_manipulation
.branch {
ignore_me, meta, bam, bai, ref_meta, fasta ->
skip: meta.damage_treatment == 'full'
no_skip: true
}
ch_skip_rescale = ch_mapdamage_prep.skip
.map {
ignore_me, meta, bam, bai, ref_meta, fasta ->
[ meta, bam, bai ]
}
ch_mapdamage_input = ch_mapdamage_prep.no_skip
.multiMap {
ignore_me, meta, bam, bai, ref_meta, fasta ->
bam: [ meta, bam ]
fasta: fasta
}
MAPDAMAGE2( ch_mapdamage_input.bam, ch_mapdamage_input.fasta )
ch_versions = ch_versions.mix( MAPDAMAGE2.out.versions.first() )
SAMTOOLS_INDEX_DAMAGE_RESCALED( MAPDAMAGE2.out.rescaled )
ch_versions = ch_versions.mix( SAMTOOLS_INDEX_DAMAGE_RESCALED.out.versions.first() )
ch_rescaled_index = params.fasta_largeref ? SAMTOOLS_INDEX_DAMAGE_RESCALED.out.csi : SAMTOOLS_INDEX_DAMAGE_RESCALED.out.bai
// TODO When adding library-level data merging pre-genotyping, make sure that rescaled bams are not merged in any way as the underlying damage model could differ between libraries
ch_rescaled_bams = MAPDAMAGE2.out.rescaled.join(ch_rescaled_index)
.mix(ch_skip_rescale) // Should these be mixed actually, or excluded? Might not make sense to take rescaled and non-rescaled bams togetehr for anything downstream.
}
if ( params.run_pmd_filtering ) {
ch_masking_prep = ch_pmd_masking
.combine( ch_fasta, by: 0 ) // [ [meta], masked_fasta, bed, fasta ]
.branch {
meta, masked_fasta, bed, fasta ->
alreadymasked: masked_fasta != ""
tobemasked: masked_fasta == "" && bed != ""
nomasking: masked_fasta == "" && bed == ""
}
ch_masking_input = ch_masking_prep.tobemasked
.multiMap{
meta, masked_fasta, bed, fasta ->
bed: [ meta, bed ]
fasta: fasta
}
BEDTOOLS_MASKFASTA( ch_masking_input.bed, ch_masking_input.fasta )
ch_masking_output = BEDTOOLS_MASKFASTA.out.fasta
ch_versions = ch_versions.mix( BEDTOOLS_MASKFASTA.out.versions.first() )
ch_already_masked = ch_masking_prep.alreadymasked
.map {
meta, masked_fasta, bed, fasta ->
[ meta, masked_fasta ]
}
ch_no_masking = ch_masking_prep.nomasking
.map {
meta, masked_fasta, bed, fasta ->
[ meta, fasta ]
}
ch_pmd_fastas = ch_masking_output.mix( ch_already_masked, ch_no_masking )
.map {
// Prepend a new meta that contains the meta.id value as the new_meta.reference attribute
addNewMetaFromAttributes( it, "id" , "reference" , false )
}
ch_pmdtools_input = ch_bam_bai
.map { addNewMetaFromAttributes( it, "reference" , "reference" , false ) }
.combine( ch_pmd_fastas, by: 0 ) // [ [combine_meta], [meta], bam, bai, [ref_meta] fasta ]
.multiMap {
combine_meta, meta, bam, bai, ref_meta, fasta ->
bam: [ meta, bam, bai ]
fasta: fasta
}
PMDTOOLS_FILTER( ch_pmdtools_input.bam, params.damage_manipulation_pmdtools_threshold, ch_pmdtools_input.fasta )
ch_versions = ch_versions.mix( PMDTOOLS_FILTER.out.versions.first() )
SAMTOOLS_INDEX_DAMAGE_FILTERED( PMDTOOLS_FILTER.out.bam )
ch_versions = ch_versions.mix( SAMTOOLS_INDEX_DAMAGE_FILTERED.out.versions.first() )
ch_filtered_index = params.fasta_largeref ? SAMTOOLS_INDEX_DAMAGE_FILTERED.out.csi : SAMTOOLS_INDEX_DAMAGE_FILTERED.out.bai
ch_pmd_filtered_bams = PMDTOOLS_FILTER.out.bam.join( ch_filtered_index )
SAMTOOLS_FLAGSTAT_DAMAGE_FILTERED( ch_pmd_filtered_bams )
ch_pmd_filtered_flagstat = SAMTOOLS_FLAGSTAT_DAMAGE_FILTERED.out.flagstat
ch_versions = ch_versions.mix( SAMTOOLS_FLAGSTAT_DAMAGE_FILTERED.out.versions.first() )
}
if ( params.run_trim_bam ) {
if ( params.run_pmd_filtering ) {
ch_to_trim = ch_pmd_filtered_bams
.map{
meta, bam, bai ->
[ meta, bam ]
}
} else {
ch_to_trim = ch_bam_bai
.map {
meta, bam, bai ->
[ meta, bam ]
}
}
ch_trimbam_input = ch_to_trim
.map {
meta, bam ->
def trim_left = meta.strandedness == 'single' ? ( meta.damage_treatment == 'none' ? params.damage_manipulation_bamutils_trim_single_stranded_none_udg_left : meta.damage_treatment == 'half' ? params.damage_manipulation_bamutils_trim_single_stranded_half_udg_left : 0 ) : ( meta.damage_treatment == 'none' ? params.damage_manipulation_bamutils_trim_double_stranded_none_udg_left : meta.damage_treatment == 'half' ? params.damage_manipulation_bamutils_trim_double_stranded_half_udg_left : 0 )
def trim_right = meta.strandedness == 'single' ? ( meta.damage_treatment == 'none' ? params.damage_manipulation_bamutils_trim_single_stranded_none_udg_right : meta.damage_treatment == 'half' ? params.damage_manipulation_bamutils_trim_single_stranded_half_udg_right : 0 ) : ( meta.damage_treatment == 'none' ? params.damage_manipulation_bamutils_trim_double_stranded_none_udg_right : meta.damage_treatment == 'half' ? params.damage_manipulation_bamutils_trim_double_stranded_half_udg_right : 0 )
[ meta, bam, trim_left, trim_right ]
}
BAMUTIL_TRIMBAM( ch_trimbam_input )
ch_versions = ch_versions.mix( BAMUTIL_TRIMBAM.out.versions.first() )
SAMTOOLS_INDEX_DAMAGE_TRIMMED( BAMUTIL_TRIMBAM.out.bam )
ch_versions = ch_versions.mix( SAMTOOLS_INDEX_DAMAGE_TRIMMED.out.versions.first() )
ch_trimmed_index = params.fasta_largeref ? SAMTOOLS_INDEX_DAMAGE_TRIMMED.out.csi : SAMTOOLS_INDEX_DAMAGE_TRIMMED.out.bai
ch_trimmed_bams = BAMUTIL_TRIMBAM.out.bam.join( ch_trimmed_index )
}
emit:
rescaled = ch_rescaled_bams // [ meta, bam, bai ]
filtered = ch_pmd_filtered_bams // [ meta, bam, bai ]
trimmed = ch_trimmed_bams // [ meta, bam, bai ]
flagstat = ch_pmd_filtered_flagstat // [ meta, flagstat ]
versions = ch_versions
}