@@ -14,12 +14,12 @@ include { TABIX_BGZIPTABIX as TABIX_BGZIPTABIX_INTERVAL_COMBINED } from '../../.
14
14
15
15
workflow PREPARE_INTERVALS {
16
16
take :
17
- fasta_fai // mandatory [ fasta_fai ]
18
- intervals // [ params.intervals ]
19
- no_intervals // [ params.no_intervals ]
20
- nucleotides_per_second
21
- outdir
22
- step
17
+ fasta_fai // mandatory [ params. fasta_fai ]
18
+ intervals // optional [ params.intervals ]
19
+ no_intervals // boolean [ params.no_intervals ]
20
+ nucleotides_per_second // mandatory [ params.nucleotides_per_second ]
21
+ outdir // mandatory [ params.outdir ]
22
+ step // mandatory [ params.step ]
23
23
24
24
main :
25
25
versions = Channel . empty()
@@ -69,10 +69,12 @@ workflow PREPARE_INTERVALS {
69
69
}
70
70
71
71
// Now for the intervals.bed the following operations are done:
72
- // 1. Intervals file is split up into multiple bed files for scatter/gather
73
- // 2. Each bed file is indexed
72
+ // 1/ Split up intervals bed file into multiple bed files for scatter/gather
73
+ // 2/ Tabix index each bed file
74
74
75
- // 1. Intervals file is split up into multiple bed files for scatter/gather & grouping together small intervals
75
+ // 1/ Split up intervals bed file into multiple bed files for scatter/gather
76
+ // Also group together small intervals
77
+ // And add the number of intervals to the channel
76
78
intervals_bed = intervals_bed
77
79
.flatten()
78
80
.map { intervals_ ->
@@ -100,7 +102,7 @@ workflow PREPARE_INTERVALS {
100
102
.map { intervals_ -> [intervals_, intervals_. size()] }
101
103
.transpose()
102
104
103
- // 2. Create bed.gz and bed.gz.tbi for each interval file. They are split by region (see above)
105
+ // 2/ Tabix index each bed file
104
106
TABIX_BGZIPTABIX_INTERVAL_SPLIT (intervals_bed. map { intervals_ , _num_intervals -> [[id : intervals_. baseName], intervals_] })
105
107
106
108
intervals_bed_gz_tbi = TABIX_BGZIPTABIX_INTERVAL_SPLIT . out. gz_tbi
0 commit comments