#!/bin/bash -euo pipefail
gatk --java-options "-Xmx60620M -XX:-UsePerfData -XX:ParallelGCThreads=2" \
MarkDuplicates \
--INPUT aih-tih-sc-377071-R1_A23YTGFLT4_1.Aligned.sortedByCoord.out.bam \
--OUTPUT aih-tih-sc-377071-R1_A23YTGFLT4_1.md.bam \
--METRICS_FILE aih-tih-sc-377071-R1_A23YTGFLT4_1.md.bam.metrics \
--TMP_DIR . \
--CREATE_INDEX true \
--REFERENCE_SEQUENCE ref_genome.fa \
-REMOVE_DUPLICATES false -VALIDATION_STRINGENCY LENIENT
# If cram files are wished as output, the run samtools for conversion
if [[ aih-tih-sc-377071-R1_A23YTGFLT4_1.md.bam == *.cram ]]; then
samtools view -Ch -T ref_genome.fa -o aih-tih-sc-377071-R1_A23YTGFLT4_1.md.bam aih-tih-sc-377071-R1_A23YTGFLT4_1.md.bam
rm aih-tih-sc-377071-R1_A23YTGFLT4_1.md.bam
samtools index aih-tih-sc-377071-R1_A23YTGFLT4_1.md.bam
fi
cat <<-END_VERSIONS > versions.yml
"NFCORE_RNAFUSION:RNAFUSION:QC_WORKFLOW:GATK4_MARKDUPLICATES":
gatk4: $(echo $(gatk --version 2>&1) | sed 's/^.*(GATK) v//; s/ .*$//')
samtools: $(echo $(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*$//')
END_VERSIONS