Skip to content

Commit 0bec9de

Browse files
committed
Fix splice_ai
1 parent 7bdfcb6 commit 0bec9de

File tree

1 file changed

+6
-0
lines changed

1 file changed

+6
-0
lines changed

v03_pipeline/lib/reference_datasets/splice_ai.py

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,6 @@
11
import hail as hl
22

3+
from v03_pipeline.lib.misc.io import checkpoint
34
from v03_pipeline.lib.model import ReferenceGenome
45
from v03_pipeline.lib.reference_datasets.misc import vcf_to_ht
56

@@ -10,6 +11,11 @@ def get_ht(
1011
) -> hl.Table:
1112
ht = vcf_to_ht(paths, reference_genome)
1213

14+
# NB: We ran into an issue on Dataproc where the job was running out
15+
# of file descriptors.
16+
ht, _ = checkpoint(ht)
17+
hl._set_flags(use_new_shuffle=None, no_whole_stage_codegen='1') # noqa: SLF001
18+
1319
# SpliceAI INFO field description from the VCF header: SpliceAIv1.3 variant annotation. These include
1420
# delta scores (DS) and delta positions (DP) for acceptor gain (AG), acceptor loss (AL), donor gain (DG), and
1521
# donor loss (DL). Format: ALLELE|SYMBOL|DS_AG|DS_AL|DS_DG|DS_DL|DP_AG|DP_AL|DP_DG|DP_DL

0 commit comments

Comments
 (0)