File Info

Filename
.command.sh
Full Path
s3://natera-rnd-pltf-dev-nextflow-scratch-01/work/ab/3e4f7767ff443caa676188dd4df574/.command.sh
Size
1.1 KB
Attempt
#!/bin/bash -euo pipefail
gatk --java-options "-Xmx60620M -XX:-UsePerfData -XX:ParallelGCThreads=2" \
    MarkDuplicates \
    --INPUT aih-tih-sc-16054b-R1_B23WHYVLT4_1.Aligned.sortedByCoord.out.bam \
    --OUTPUT aih-tih-sc-16054b-R1_B23WHYVLT4_1.md.bam \
    --METRICS_FILE aih-tih-sc-16054b-R1_B23WHYVLT4_1.md.bam.metrics \
    --TMP_DIR . \
    --CREATE_INDEX true \
    --REFERENCE_SEQUENCE ref_genome.fa \
    -REMOVE_DUPLICATES false -VALIDATION_STRINGENCY LENIENT

# If cram files are wished as output, the run samtools for conversion
if [[ aih-tih-sc-16054b-R1_B23WHYVLT4_1.md.bam == *.cram ]]; then
    samtools view -Ch -T ref_genome.fa -o aih-tih-sc-16054b-R1_B23WHYVLT4_1.md.bam aih-tih-sc-16054b-R1_B23WHYVLT4_1.md.bam
    rm aih-tih-sc-16054b-R1_B23WHYVLT4_1.md.bam
    samtools index aih-tih-sc-16054b-R1_B23WHYVLT4_1.md.bam
fi

cat <<-END_VERSIONS > versions.yml
"NFCORE_RNAFUSION:RNAFUSION:QC_WORKFLOW:GATK4_MARKDUPLICATES":
    gatk4: $(echo $(gatk --version 2>&1) | sed 's/^.*(GATK) v//; s/ .*$//')
    samtools: $(echo $(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*$//')
END_VERSIONS