#!/bin/bash
# Flag duplicate reads in a coordinate-sorted BAM with GATK MarkDuplicates
# (duplicates are marked, not removed: REMOVE_DUPLICATES is false), optionally
# convert the result to CRAM, and record the tool versions in versions.yml.
#
# Strict mode is enabled with `set` instead of on the shebang line: Linux hands
# everything after the interpreter path to bash as ONE argument, so
# "#!/bin/bash -euo pipefail" is not parsed as separate options when the script
# is executed directly.
set -euo pipefail

input_bam="BreastNP_FFPE_L02_RNA_01_B23LG7FLT4_2.Aligned.sortedByCoord.out.bam"
final_output="BreastNP_FFPE_L02_RNA_01_B23LG7FLT4_2.md.bam"
reference="ref_genome.fa"

# MarkDuplicates is always pointed at a BAM path. When the requested output is
# a CRAM, the BAM is only an intermediate and must have a different name than
# the final file, otherwise the conversion below would read and overwrite the
# same path and then delete its own result.
if [[ "$final_output" == *.cram ]]; then
    markdup_bam="${final_output%.cram}.bam"
else
    markdup_bam="$final_output"
fi

gatk --java-options "-Xmx60620M -XX:-UsePerfData -XX:ParallelGCThreads=2" \
    MarkDuplicates \
    --INPUT "$input_bam" \
    --OUTPUT "$markdup_bam" \
    --METRICS_FILE "${final_output}.metrics" \
    --TMP_DIR . \
    --CREATE_INDEX true \
    --REFERENCE_SEQUENCE "$reference" \
    -REMOVE_DUPLICATES false -VALIDATION_STRINGENCY LENIENT

# If CRAM files are wanted as output, then run samtools for the conversion,
# drop the intermediate BAM, and index the CRAM.
if [[ "$final_output" == *.cram ]]; then
    samtools view -Ch -T "$reference" -o "$final_output" "$markdup_bam"
    rm "$markdup_bam"
    samtools index "$final_output"
fi

# Write the tool versions as a mapping nested under the process name.
# The entries are indented with spaces on purpose: `<<-` strips leading TABs
# only, so the spaces survive and keep gatk4/samtools nested under the key.
cat <<-END_VERSIONS > versions.yml
"NFCORE_RNAFUSION:RNAFUSION:QC_WORKFLOW:GATK4_MARKDUPLICATES":
    gatk4: $(echo $(gatk --version 2>&1) | sed 's/^.*(GATK) v//; s/ .*$//')
    samtools: $(echo $(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*$//')
END_VERSIONS