File Info

Filename
.command.sh
Full Path
s3://natera-rnd-pltf-dev-nextflow-scratch-01/work/b8/7bb1e22d77d59d8af6bfa28abd7022/.command.sh
Size
915 bytes
Attempt
#!/bin/bash -Ceuo pipefail
#
# Task script: normalize the probe counts of sample
# 1029_0I-N1-BDNA-1_B23KGCJLT4_1 and record the tool version in versions.yml.
#
# Files referenced relative to the working directory:
#   sex_calls.csv            read here; the 'specimen_id' and 'inferred_sex'
#                            columns are used
#   *_probes.tsv.gz          handed to normalize_sample.py via --counts
#   batch_reference.parquet  handed to normalize_sample.py via --batch-reference
#   *_normalized.parquet     path handed over via --output
#   *_gam_stats.json         path handed over via --feature-stats-output
#   versions.yml             written by the heredoc at the end of this script

# Re-apply the shebang options so they also hold when this file is started as
# `bash .command.sh`, in which case the shebang line is not consulted.
set -Ceuo pipefail

# Look up the inferred sex recorded for specimen 1029_0I. Only an exact
# 'female' value is kept; every other value -- including a specimen that is
# absent from the table, which falls back to 'unknown' -- is reported as 'male'.
SEX=$(python3 -c "
import pandas as pd
sex = pd.read_csv('sex_calls.csv')
lookup = dict(zip(sex['specimen_id'], sex['inferred_sex']))
s = lookup.get('1029_0I', 'unknown')
print('male' if s != 'female' else 'female')
")

# "$SEX" is quoted so that it always reaches the normalizer as exactly one
# argument and can never shift the options that follow it.
python /usr/local/bin/normalize_sample.py \
    --counts 1029_0I-N1-BDNA-1_B23KGCJLT4_1_probes.tsv.gz \
    --batch-reference batch_reference.parquet \
    --gc-reference /usr/local/share/probe_gc_content.tsv \
    --sex "$SEX" \
    --sample-id 1029_0I-N1-BDNA-1_B23KGCJLT4_1 \
    --specimen-id 1029_0I \
    --flowcell unknown \
    --sample-type normal \
    --output 1029_0I-N1-BDNA-1_B23KGCJLT4_1_normalized.parquet \
    --feature-stats-output 1029_0I-N1-BDNA-1_B23KGCJLT4_1_gam_stats.json

# Noclobber (-C) is active, so this redirect fails if versions.yml already
# exists. `<<-` strips leading tabs only; the body below is indented with
# spaces, so the four-space indent is written to the file unchanged.
cat <<-END_VERSIONS > versions.yml
"NFCORE_SAREK:SAREK:BAM_VARIANT_CALLING_SOMATIC_ALL:SOMATIC_CNV_CALLING:SOMA_CNV_NORMALIZE":
    soma-cnv: 20260604-9c39aac
END_VERSIONS