Skip to content

Commit cf7d718

Browse files
committed
change MarkDuplicatesSpark to MarkDuplicates
1 parent cab0df2 commit cf7d718

File tree

1 file changed

+18
-8
lines changed

1 file changed

+18
-8
lines changed

modules/02_mark_duplicates.nf

Lines changed: 18 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,5 @@
1-
params.mark_duplicates_cpus = 16
2-
params.mark_duplicates_memory = "64g"
1+
params.mark_duplicates_cpus = 2
2+
params.mark_duplicates_memory = "16g"
3 3
params.remove_duplicates = true
4 4
params.skip_metrics = false
5 5
params.output = 'output'
@@ -21,15 +21,25 @@ process MARK_DUPLICATES {
21 21
file("${name}.dedup_metrics.txt") optional true
22 22

23 23
script:
24-
dedup_metrics = params.skip_metrics ? "": "--metrics-file ${name}.dedup_metrics.txt"
25-
remove_duplicates = params.remove_duplicates ? "--remove-all-duplicates true" : "--remove-all-duplicates false"
24+
dedup_metrics = params.skip_metrics ? "": "--METRICS_FILE ${name}.dedup_metrics.txt"
25+
remove_duplicates = params.remove_duplicates ? "--REMOVE_DUPLICATES true" : "--REMOVE_DUPLICATES false"
26 26
"""
27 27
mkdir tmp
28 28
29-
gatk MarkDuplicatesSpark \
29+
gatk SortSam \
30+
--INPUT ${bam} \
31+
--OUTPUT ${name}.sorted.bam \
32+
--SORT_ORDER coordinate
33+
34+
gatk MarkDuplicates \
30 35
--java-options '-Xmx${params.mark_duplicates_memory} -Djava.io.tmpdir=tmp' \
31-
--input ${bam} \
32-
--output ${name}.dedup.bam \
33-
--conf 'spark.executor.cores=${task.cpus}' ${remove_duplicates} ${dedup_metrics}
36+
--INPUT ${name}.sorted.bam \
37+
--OUTPUT ${name}.dedup.bam \
38+
--ASSUME_SORT_ORDER coordinate \
39+
--CREATE_INDEX true ${remove_duplicates} ${dedup_metrics}
40+
41+
cp ${name}.dedup.bai ${name}.dedup.bam.bai
42+
43+
rm -f ${name}.sorted.bam
34 44
"""
35 45
}

0 commit comments

Comments
 (0)