#!/bin/bash -Ceuo pipefail
INDEX=`find -L ./ -name "*.amb" | sed 's/\.amb$//'`
export bwt_max_mem=112G
sentieon bwa mem \
-K 100000000 -Y -R '@RG\tID:REGRESSION.HCC1395_tumor.L001\tPU:L001\tSM:HCC1395_tumor\tLB:HCC1395_tumor\tDS:s3://natera-platform-sandbox/pipeline-resources/ngi-igenomes/igenomes/Homo_sapiens/GATK/GRCh38/Sequence/WholeGenomeFasta/Homo_sapiens_assembly38.fasta\tPL:ILLUMINA' \
-t 31 \
$INDEX \
HCC1395_tumor_R1.fastq.gz HCC1395_tumor_R2.fastq.gz \
| sentieon util sort \
-r Homo_sapiens_assembly38.fasta \
-t 31 \
-o HCC1395_tumor.bam \
--sam2bam \
-
# When outputting CRAM, sentieon util sort may create a spurious .bai index.
# Remove it since CRAM uses .crai indices.
if [ "bam" = "cram" ] && [ -f "HCC1395_tumor.cram.bai" ]; then
rm -f HCC1395_tumor.cram.bai
fi
cat <<-END_VERSIONS > versions.yml
"DAQ:SENTIEON_BWAMEM":
sentieon: $(echo $(sentieon driver --version 2>&1) | sed -e "s/sentieon-genomics-//g")
END_VERSIONS