Skip to content

Commit e11a44c

Browse files
committed
check for constant gene impairments
1 parent 229e059 commit e11a44c

File tree

1 file changed

+15
-0
lines changed

1 file changed

+15
-0
lines changed

deeprvat/deeprvat/associate.py

+15
Original file line numberDiff line numberDiff line change
@@ -449,9 +449,19 @@ def make_regenie_input_(
449449
samples=list(sample_ids.astype(str)),
450450
metadata="Pseudovariants containing DeepRVAT gene impairment scores. One pseudovariant per gene.",
451451
) as f:
452+
skipped_genes = 0
452453
for i in trange(n_genes):
453454
varid = f"pseudovariant_gene_{ensgids[i]}"
454455
this_burdens = burdens[:, i]
456+
if np.all(this_burdens == this_burdens[0]):
457+
# burdens are constant, cannot perform association testing
458+
logger.warning(
459+
f"Gene impairment scores for gene {i} ({ensgids[i]}) "
460+
"are all constant. Gene will not be written to BGEN "
461+
"and will be skipped during association testing"
462+
)
463+
skipped_genes += 1
464+
continue
455465

456466
# Rescale scores to fill out range [0, 1] (making dosages in [0, 2])
457467
min_burden = np.min(this_burdens)
@@ -478,6 +488,11 @@ def make_regenie_input_(
478488
bit_depth=16,
479489
)
480490

491+
if skipped_genes > 0:
492+
logger.warning(
493+
f"Skipped {skipped_genes} with constant gene impairment scores"
494+
)
495+
481496

482497
@cli.command()
483498
@click.option("--debug", is_flag=True)

0 commit comments

Comments
 (0)