#!/bin/bash -euo pipefail
gatk --java-options "-Xmx60620M -XX:-UsePerfData -XX:ParallelGCThreads=2" \
MarkDuplicates \
--INPUT tih_rna_sample_00582_B23MVV7LT4_1.Aligned.sortedByCoord.out.bam \
--OUTPUT tih_rna_sample_00582_B23MVV7LT4_1.md.bam \
--METRICS_FILE tih_rna_sample_00582_B23MVV7LT4_1.md.bam.metrics \
--TMP_DIR . \
--CREATE_INDEX true \
--REFERENCE_SEQUENCE ref_genome.fa \
-REMOVE_DUPLICATES false -VALIDATION_STRINGENCY LENIENT
# If cram files are wished as output, the run samtools for conversion
if [[ tih_rna_sample_00582_B23MVV7LT4_1.md.bam == *.cram ]]; then
samtools view -Ch -T ref_genome.fa -o tih_rna_sample_00582_B23MVV7LT4_1.md.bam tih_rna_sample_00582_B23MVV7LT4_1.md.bam
rm tih_rna_sample_00582_B23MVV7LT4_1.md.bam
samtools index tih_rna_sample_00582_B23MVV7LT4_1.md.bam
fi
cat <<-END_VERSIONS > versions.yml
"NFCORE_RNAFUSION:RNAFUSION:QC_WORKFLOW:GATK4_MARKDUPLICATES":
gatk4: $(echo $(gatk --version 2>&1) | sed 's/^.*(GATK) v//; s/ .*$//')
samtools: $(echo $(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*$//')
END_VERSIONS