File Info

Filename
.command.sh
Full Path
s3://natera-rnd-pltf-dev-nextflow-scratch-01/work/aa/ff3fee6660880dd9ede93e027722a3/.command.sh
Size
751 bytes
Attempt
#!/bin/bash
# Strict mode is enabled with an explicit `set` instead of shebang flags:
# shebang options are ignored when the script is started as `bash <script>`,
# and the kernel hands everything after the interpreter path to bash as one
# single argument.
#   -C           refuse to overwrite existing files with `>`
#   -e           exit on an unhandled non-zero status
#   -u           treat unset variables as errors
#   -o pipefail  a pipeline fails if any stage fails
set -Ceuo pipefail

# Look up the inferred sex for this specimen in sex_calls.csv (columns used:
# specimen_id, inferred_sex) and store the result in SEX.
# The Python source is fed through a quoted heredoc so the shell performs no
# expansion on it, and the specimen ID is passed as an argument rather than
# being spliced into the program text.
SEX=$(python3 - '1029_16G' <<'PY'
import sys

import pandas as pd

sex = pd.read_csv('sex_calls.csv')
lookup = dict(zip(sex['specimen_id'], sex['inferred_sex']))
# A specimen that is absent from the table is treated as 'unknown'.
s = lookup.get(sys.argv[1], 'unknown')
# Only an exact 'female' is reported as female; every other value,
# including 'unknown', is reported as 'male'.
print('male' if s != 'female' else 'female')
PY
)

# Run normalize_sample.py on this sample's probe counts, writing the
# normalized table (parquet) and the feature statistics (JSON).
#
# SEX must already hold the value computed earlier in this script. It is
# quoted so it always stays a single argument, and the `:?` guard aborts with
# a message if it is unset or empty; otherwise `--sex` would consume the
# following `--sample-id` flag as its value.
#
# NOTE(review): --flowcell is B23KFCWLT4 while the sample ID embeds
# B23KGCJLT4 -- confirm this difference is intended.
# NOTE(review): this step runs `python` whereas the sex lookup uses
# `python3` -- confirm both resolve to the intended interpreter.
python /usr/local/bin/normalize_sample.py \
    --counts 1029_16G-N1-BDNA-1_B23KGCJLT4_1_probes.tsv.gz \
    --batch-reference batch_reference.parquet \
    --gc-reference /usr/local/share/probe_gc_content.tsv \
    --sex "${SEX:?SEX must be set to male or female before normalization}" \
    --sample-id 1029_16G-N1-BDNA-1_B23KGCJLT4_1 \
    --specimen-id 1029_16G \
    --flowcell B23KFCWLT4 \
    --sample-type normal \
    --output 1029_16G-N1-BDNA-1_B23KGCJLT4_1_normalized.parquet \
    --feature-stats-output 1029_16G-N1-BDNA-1_B23KGCJLT4_1_gam_stats.json