Downloading: s3://natera-platform-sandbox/pipeline-resources/AIH/rna/GRCh38/starfusion/ctat_genome_lib_build_dir/ref_genome.fa
Downloading: s3://natera-platform-sandbox/pipeline-resources/Homo_sapiens_assembly38.dbsnp138.vcf.gz
Downloading: s3://natera-rnd-pltf-dev-nextflow-scratch-01/work/9f/6c8761b462720edcfce388eded78f6/.command.sh
Downloading: s3://natera-rnd-pltf-dev-nextflow-scratch-01/work/e9/f448cb106b606b624da42b70ecc978/NTC_0001_0001_23H5VFLT4_s15.md.bam
Downloading: s3://natera-platform-sandbox/pipeline-resources/AIH/rna/GRCh38/starfusion/ctat_genome_lib_build_dir/ref_genome.dict
Downloading: s3://natera-rnd-pltf-dev-nextflow-scratch-01/work/e9/f448cb106b606b624da42b70ecc978/NTC_0001_0001_23H5VFLT4_s15.md.bai
Downloading: s3://natera-platform-sandbox/pipeline-resources/AIH/rna/GRCh38/gatk4/dbsnp_hg38_contam_sites.bed
Downloading: s3://natera-rnd-pltf-dev-nextflow-scratch-01/work/9f/6c8761b462720edcfce388eded78f6/.command.run
Downloading: s3://natera-platform-sandbox/pipeline-resources/AIH/rna/GRCh38/starfusion/ctat_genome_lib_build_dir/ref_genome.fa.fai
Downloading: s3://natera-platform-sandbox/pipeline-resources/beds/twist/Twist_rna_exome_AND_fusion_hg38.bed
Downloading: s3://natera-platform-sandbox/pipeline-resources/Homo_sapiens_assembly38.dbsnp138.vcf.gz.tbi
==> STAGING COMPLETE (11 inputs)
+ mkdir NTC_0001_0001_23H5VFLT4_s15
+ all_qc -bam NTC_0001_0001_23H5VFLT4_s15.md.bam -beds Twist_rna_exome_AND_fusion_hg38.bed -dbsnp_vcf Homo_sapiens_assembly38.dbsnp138.vcf.gz -contamination_bed dbsnp_hg38_contam_sites.bed -output_folder NTC_0001_0001_23H5VFLT4_s15 -reference ref_genome.fa -region chr20
mkdir -p NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/
cat Twist_rna_exome_AND_fusion_hg38.bed | cut -f 1-3 | bedtools sort -g ref_genome.fa.fai | bedtools merge > NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/full_bed.bed
seqtool depth -bam NTC_0001_0001_23H5VFLT4_s15.md.bam -bed NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/full_bed.bed -threads 4 -bam_threads 2 | bgzip -c > NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/NTC_0001_0001_23H5VFLT4_s15.md.depth.gz
saturation_plot -bams NTC_0001_0001_23H5VFLT4_s15.md.bam -region chr20 -output NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/saturation_plot.png -threads 1
seqtool saturation_metric -at 1000000 -region chr20 -bam_threads 1 NTC_0001_0001_23H5VFLT4_s15.md.bam > NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/saturation_qc.tsv
fragment_size -bams NTC_0001_0001_23H5VFLT4_s15.md.bam -region chr20 -output_prefix NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/fragsize -threads 1
samtools mpileup -B --min-MQ 60 --min-BQ 30 -f ref_genome.fa -l dbsnp_hg38_contam_sites.bed NTC_0001_0001_23H5VFLT4_s15.md.bam > NTC_0001_0001_23H5VFLT4_s15.md.mpileup && contamination -input NTC_0001_0001_23H5VFLT4_s15.md.mpileup -dbsnp_vcf Homo_sapiens_assembly38.dbsnp138.vcf.gz > NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/contamination.tsv
[mpileup] 1 samples in 1 input files
/opt/conda/lib/python3.9/site-packages/pyranges/__init__.py:8: UserWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html. The pkg_resources package is slated for removal as early as 2025-11-30. Refrain from using this package or pin to Setuptools<81.
import pkg_resources
/opt/conda/lib/python3.9/site-packages/pyranges/__init__.py:8: UserWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html. The pkg_resources package is slated for removal as early as 2025-11-30. Refrain from using this package or pin to Setuptools<81.
import pkg_resources
0it [00:00, ?it/s]
2600it [00:00, 1525628.20it/s]
[W::hts_idx_load3] The index file is older than the data file: Homo_sapiens_assembly38.dbsnp138.vcf.gz.tbi
tabix -s 1 -b 2 -e 2 NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/NTC_0001_0001_23H5VFLT4_s15.md.depth.gz
seqtool depth_hist -nbins 500 NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/NTC_0001_0001_23H5VFLT4_s15.md.depth.gz > NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/NTC_0001_0001_23H5VFLT4_s15.md.depth_hist.tsv
cat NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/NTC_0001_0001_23H5VFLT4_s15.md.depth_hist.tsv | plot -x 0 -xlabel Depth -ylabel "Number of Sites" -xlim 0 2000 -title NTC_0001_0001_23H5VFLT4_s15.md -output NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/NTC_0001_0001_23H5VFLT4_s15.md.depth.png
seqtool read_qc -bed Twist_rna_exome_AND_fusion_hg38.bed -n_threads 1 -bam_threads 2 NTC_0001_0001_23H5VFLT4_s15.md.bam > NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/read_qc.Twist_rna_exome_AND_fusion_hg38.bed.tsv
seqtool reads_per_target -bed Twist_rna_exome_AND_fusion_hg38.bed -threads 1 -bam_threads 2 NTC_0001_0001_23H5VFLT4_s15.md.bam > NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/reads_per_target.Twist_rna_exome_AND_fusion_hg38.bed.tsv
seqtool depth_stats -bed Twist_rna_exome_AND_fusion_hg38.bed NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/NTC_0001_0001_23H5VFLT4_s15.md.depth.gz> NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/depth_stats.Twist_rna_exome_AND_fusion_hg38.bed.tsv
seqtool gc_bias -reference ref_genome.fa -bed Twist_rna_exome_AND_fusion_hg38.bed -bin_size 0.05 -threads 1 -bam_threads 2 NTC_0001_0001_23H5VFLT4_s15.md.bam > NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/gc_bias_qc.Twist_rna_exome_AND_fusion_hg38.bed.tsv
cat NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/gc_bias_qc.Twist_rna_exome_AND_fusion_hg38.bed.tsv | plot -x 0 -header infer -ylim 0 2 -title "NTC_0001_0001_23H5VFLT4_s15.md" -suptitle "Twist_rna_exome_AND_fusion_hg38.bed" -output "NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/gc_bias.Twist_rna_exome_AND_fusion_hg38.bed.png" -ylabel "Fold enrichment / depletion" -xlabel "GC Quantile"
echo `date` > NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md/qc_complete.txt
+ merge_qc -folders NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15.md -output NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15_full_basic_stats.tsv
+ head -n1 NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15_full_basic_stats.tsv
++ basename Twist_rna_exome_AND_fusion_hg38.bed
+ grep -e Twist_rna_exome_AND_fusion_hg38.bed NTC_0001_0001_23H5VFLT4_s15/NTC_0001_0001_23H5VFLT4_s15_full_basic_stats.tsv