Skip to content

Commit fadb07e

Browse files
committed
hrm
1 parent 04c000c commit fadb07e

File tree

1 file changed

+6
-1
lines changed

1 file changed

+6
-1
lines changed

v03_pipeline/bin/migration.py

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -99,7 +99,7 @@ def initialize_table(dataset_type: DatasetType, reference_genome: ReferenceGenom
9999
for dataset_type, reference_genome in MIGRATIONS:
100100
ht = initialize_table(dataset_type, reference_genome)
101101
sample_lookup_ht = hl.read_table(f'gs://seqr-hail-search-data/v03/{reference_genome.value}/{dataset_type.value}/lookup.ht')
102-
for project_guid in sample_lookup_ht.ref_samples:
102+
for project_guid in sample_lookup_ht.ref_samples[:3]:
103103
if project_guid in PROJECTS_EXCLUDED_FROM_LOOKUP:
104104
continue
105105
if project_guid not in sample_id_to_family_guid:
@@ -168,6 +168,11 @@ def initialize_table(dataset_type: DatasetType, reference_genome: ReferenceGenom
168168
project_lookup_ht = project_lookup_ht.select('project_stats')
169169
ht = join_lookup_hts(ht, project_lookup_ht)
170170
print(ht.count())
171+
print(ht.distinct().count())
172+
ht = ht.annotate_globals(
173+
updates=sample_lookup_ht.index_globals().updates
174+
)
175+
import pdb; pdb.set_trace()
171176
ht.write('gs://seqr-scratch-temp/benlasdkflookup.ht')
172177

173178

0 commit comments

Comments
 (0)