#!/bin/bash -euo pipefail
python -u /usr/local/src/CTAT-SPLICING/STAR_to_cancer_introns.py \
--SJ_tab_file 1173_RPX_T1_RNA_SLD_01_A23T55JLT4_1.SJ.out.tab \
--chimJ_file 1173_RPX_T1_RNA_SLD_01_A23T55JLT4_1.Chimeric.out.junction \
--bam_file 1173_RPX_T1_RNA_SLD_01_A23T55JLT4_1.Aligned.sortedByCoord.out.bam \
--output_prefix 1173_RPX_T1_RNA_SLD_01_A23T55JLT4_1 \
--ctat_genome_lib ctat_genome_lib_build_dir \
--vis --sample_name 1173_RPX_T1_RNA_SLD_01_A23T55JLT4_1
# Sort output files to ensure consistent ordering across runs while preserving headers
if [ -f 1173_RPX_T1_RNA_SLD_01_A23T55JLT4_1.cancer.introns ]; then
# Extract header (first line) and sort data lines by fourth column (uniq_mapped) descending, then by first column (intron)
head -n 1 1173_RPX_T1_RNA_SLD_01_A23T55JLT4_1.cancer.introns > 1173_RPX_T1_RNA_SLD_01_A23T55JLT4_1.cancer.introns.tmp
tail -n +2 1173_RPX_T1_RNA_SLD_01_A23T55JLT4_1.cancer.introns | LC_ALL=C sort -k4,4nr -k1,1 >> 1173_RPX_T1_RNA_SLD_01_A23T55JLT4_1.cancer.introns.tmp
mv 1173_RPX_T1_RNA_SLD_01_A23T55JLT4_1.cancer.introns.tmp 1173_RPX_T1_RNA_SLD_01_A23T55JLT4_1.cancer.introns
fi
cat <<-END_VERSIONS > versions.yml
"NFCORE_RNAFUSION:RNAFUSION:CTATSPLICING_STARTOCANCERINTRONS":
ctat-splicing: 0.0.3
END_VERSIONS