We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent cc50910, commit b3927c4 (Copy full SHA for b3927c4)
v03_pipeline/lib/misc/io.py
@@ -11,6 +11,7 @@
11
BIALLELIC = 2
12
B_PER_MB = 1 << 20 # 1024 * 1024
13
MB_PER_PARTITION = 128
14
+MAX_SAMPLES_SPLIT_MULTI_SHUFFLE = 100
15
16
MALE = 'Male'
17
FEMALE = 'Female'
@@ -54,7 +55,9 @@ def split_multi_hts(mt: hl.MatrixTable) -> hl.MatrixTable:
54
55
bi = bi.filter_rows(~bi.alleles.contains('*'))
56
bi = bi.annotate_rows(a_index=1, was_split=False)
57
multi = mt.filter_rows(hl.len(mt.alleles) > BIALLELIC)
- split = hl.split_multi_hts(multi)
58
+ split = hl.split_multi_hts(
59
+ multi, permit_shuffle=mt.count()[1] < MAX_SAMPLES_SPLIT_MULTI_SHUFFLE
60
+ )
61
mt = split.union_rows(bi)
62
return mt.distinct_by_row()
63
0 commit comments