Skip to content

Commit a259804

Browse files
authored
make updating crdqs a dependency of updating vat (#912)
* make updating crdqs a dependency of updating vat
* remove from init
* fix import
1 parent 1ab1a25 commit a259804

8 files changed

66 additions and 32 deletions

v03_pipeline/bin/pipeline_worker.py

Lines changed: 0 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,6 @@
1313
project_remap_path,
1414
)
1515
from v03_pipeline.lib.tasks import (
16-
UpdateCachedReferenceDatasetQueries,
1716
UpdateVariantAnnotationsTableWithNewSamplesTask,
1817
WriteProjectFamilyTablesTask,
1918
)
@@ -50,10 +49,6 @@ def main():
5049
k: v for k, v in lpr.model_dump().items() if k != 'projects_to_run'
5150
}
5251
tasks = [
53-
UpdateCachedReferenceDatasetQueries(
54-
reference_genome=lpr.reference_genome,
55-
dataset_type=lpr.dataset_type,
56-
),
5752
UpdateVariantAnnotationsTableWithNewSamplesTask(
5853
project_guids=lpr.projects_to_run,
5954
project_remap_paths=project_remap_paths,

v03_pipeline/lib/tasks/__init__.py

Lines changed: 0 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -8,9 +8,6 @@
88
from v03_pipeline.lib.tasks.migrate_all_variant_annotations_tables import (
99
MigrateAllVariantAnnotationsTablesTask,
1010
)
11-
from v03_pipeline.lib.tasks.reference_data.update_cached_reference_dataset_queries import (
12-
UpdateCachedReferenceDatasetQueries,
13-
)
1411
from v03_pipeline.lib.tasks.update_lookup_table import (
1512
UpdateLookupTableTask,
1613
)
@@ -53,7 +50,6 @@
5350
'UpdateVariantAnnotationsTableWithNewSamplesTask',
5451
'UpdateVariantAnnotationsTableWithDeletedProjectTask',
5552
'UpdateVariantAnnotationsTableWithDeletedFamiliesTask',
56-
'UpdateCachedReferenceDatasetQueries',
5753
'WriteMetadataForRunTask',
5854
'WriteProjectFamilyTablesTask',
5955
]

v03_pipeline/lib/tasks/base/base_update_variant_annotations_table.py

Lines changed: 16 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -13,6 +13,9 @@
1313
)
1414
from v03_pipeline.lib.tasks.base.base_update import BaseUpdateTask
1515
from v03_pipeline.lib.tasks.files import GCSorLocalTarget
16+
from v03_pipeline.lib.tasks.reference_data.update_cached_reference_dataset_queries import (
17+
UpdateCachedReferenceDatasetQueries,
18+
)
1619
from v03_pipeline.lib.tasks.reference_data.updated_reference_dataset_collection import (
1720
UpdatedReferenceDatasetCollectionTask,
1821
)
@@ -32,19 +35,24 @@ def output(self) -> luigi.Target:
3235
)
3336

3437
def requires(self) -> list[luigi.Task]:
35-
return [
36-
(
37-
UpdatedReferenceDatasetCollectionTask(
38-
self.reference_genome,
39-
self.dataset_type,
40-
rdc,
41-
)
38+
requirements = [
39+
UpdateCachedReferenceDatasetQueries(
40+
reference_genome=self.reference_genome,
41+
dataset_type=self.dataset_type,
42+
),
43+
]
44+
requirements.extend(
45+
UpdatedReferenceDatasetCollectionTask(
46+
self.reference_genome,
47+
self.dataset_type,
48+
rdc,
4249
)
4350
for rdc in ReferenceDatasetCollection.for_reference_genome_dataset_type(
4451
self.reference_genome,
4552
self.dataset_type,
4653
)
47-
]
54+
)
55+
return requirements
4856

4957
def initialize_table(self) -> hl.Table:
5058
key_type = self.dataset_type.table_key_type(self.reference_genome)

v03_pipeline/lib/tasks/base/base_update_variant_annotations_table_test.py

Lines changed: 9 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -53,8 +53,16 @@ def setUp(self) -> None:
5353
@patch(
5454
'v03_pipeline.lib.tasks.base.base_update_variant_annotations_table.UpdatedReferenceDatasetCollectionTask',
5555
)
56-
def test_should_create_initialized_table(self, mock_update_rdc_task) -> None:
56+
@patch(
57+
'v03_pipeline.lib.tasks.base.base_update_variant_annotations_table.UpdateCachedReferenceDatasetQueries',
58+
)
59+
def test_should_create_initialized_table(
60+
self,
61+
mock_update_crdqs_task,
62+
mock_update_rdc_task,
63+
) -> None:
5764
mock_update_rdc_task.return_value = MockCompleteTask()
65+
mock_update_crdqs_task.return_value = MockCompleteTask()
5866
vat_task = BaseUpdateVariantAnnotationsTableTask(
5967
reference_genome=ReferenceGenome.GRCh38,
6068
dataset_type=DatasetType.SNV_INDEL,

v03_pipeline/lib/tasks/reference_data/update_variant_annotations_table_with_updated_reference_dataset_test.py

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -649,6 +649,9 @@
649649
@mock.patch(
650650
'v03_pipeline.lib.tasks.base.base_update_variant_annotations_table.UpdatedReferenceDatasetCollectionTask',
651651
)
652+
@mock.patch(
653+
'v03_pipeline.lib.tasks.base.base_update_variant_annotations_table.UpdateCachedReferenceDatasetQueries',
654+
)
652655
@mock.patch(
653656
'v03_pipeline.lib.tasks.base.base_update_variant_annotations_table.BaseUpdateVariantAnnotationsTableTask.initialize_table',
654657
)
@@ -719,9 +722,11 @@ def setUp(self) -> None:
719722
def test_update_vat_with_updated_rdc_snv_indel_38(
720723
self,
721724
mock_initialize_table,
725+
mock_update_crdqs_task,
722726
mock_update_rdc_task,
723727
):
724728
mock_update_rdc_task.return_value = MockCompleteTask()
729+
mock_update_crdqs_task.return_value = MockCompleteTask()
725730
mock_initialize_table.return_value = hl.Table.parallelize(
726731
[
727732
hl.Struct(
@@ -927,9 +932,11 @@ def test_update_vat_with_updated_rdc_snv_indel_38(
927932
def test_update_vat_with_updated_rdc_mito_38(
928933
self,
929934
mock_initialize_table,
935+
mock_update_crdqs_task,
930936
mock_update_rdc_task,
931937
):
932938
mock_update_rdc_task.return_value = MockCompleteTask()
939+
mock_update_crdqs_task.return_value = MockCompleteTask()
933940
mock_initialize_table.return_value = hl.Table.parallelize(
934941
[
935942
hl.Struct(
@@ -1075,9 +1082,11 @@ def test_update_vat_with_updated_rdc_mito_38(
10751082
def test_update_vat_with_updated_rdc_snv_indel_37(
10761083
self,
10771084
mock_initialize_table,
1085+
mock_update_crdqs_task,
10781086
mock_update_rdc_task,
10791087
):
10801088
mock_update_rdc_task.return_value = MockCompleteTask()
1089+
mock_update_crdqs_task.return_value = MockCompleteTask()
10811090
mock_initialize_table.return_value = hl.Table.parallelize(
10821091
[
10831092
hl.Struct(

v03_pipeline/lib/tasks/update_variant_annotations_table_with_new_samples_test.py

Lines changed: 19 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -88,6 +88,9 @@
8888
@patch(
8989
'v03_pipeline.lib.tasks.base.base_update_variant_annotations_table.UpdatedReferenceDatasetCollectionTask',
9090
)
91+
@patch(
92+
'v03_pipeline.lib.tasks.base.base_update_variant_annotations_table.UpdateCachedReferenceDatasetQueries',
93+
)
9194
class UpdateVariantAnnotationsTableWithNewSamplesTaskTest(MockedDatarootTestCase):
9295
def setUp(self) -> None:
9396
super().setUp()
@@ -154,9 +157,11 @@ def setUp(self) -> None:
154157
def test_missing_pedigree(
155158
self,
156159
mock_update_vat_with_rdc_task,
160+
mock_update_crdqs_task,
157161
mock_update_rdc_task,
158162
) -> None:
159163
mock_update_rdc_task.return_value = MockCompleteTask()
164+
mock_update_crdqs_task.return_value = MockCompleteTask()
160165
mock_update_vat_with_rdc_task.return_value = MockCompleteTask()
161166
uvatwns_task = UpdateVariantAnnotationsTableWithNewSamplesTask(
162167
reference_genome=ReferenceGenome.GRCh38,
@@ -180,9 +185,11 @@ def test_missing_pedigree(
180185
def test_missing_interval_reference(
181186
self,
182187
mock_update_vat_with_rdc_task,
188+
mock_update_crdqs_task,
183189
mock_update_rdc_task,
184190
) -> None:
185191
mock_update_rdc_task.return_value = MockCompleteTask()
192+
mock_update_crdqs_task.return_value = MockCompleteTask()
186193
mock_update_vat_with_rdc_task.return_value = MockCompleteTask()
187194
shutil.rmtree(
188195
valid_reference_dataset_collection_path(
@@ -233,10 +240,12 @@ def test_multiple_update_vat(
233240
mock_updated_cached_reference_dataset_query,
234241
mock_env: Mock,
235242
mock_register_alleles: Mock,
243+
mock_update_crdqs_task,
236244
mock_update_rdc_task: Mock,
237245
) -> None:
238246
mock_updated_cached_reference_dataset_query.return_value = MockCompleteTask()
239247
mock_update_rdc_task.return_value = MockCompleteTask()
248+
mock_update_crdqs_task.return_value = MockCompleteTask()
240249
mock_update_vat_with_rdc_task.return_value = (
241250
BaseUpdateVariantAnnotationsTableTask(
242251
reference_genome=ReferenceGenome.GRCh38,
@@ -679,9 +688,11 @@ def test_update_vat_grch37(
679688
mock_vep: Mock,
680689
mock_update_vat_with_rdc_task: Mock,
681690
mock_register_alleles: Mock,
691+
mock_update_crdqs_task,
682692
mock_update_rdc_task: Mock,
683693
) -> None:
684694
mock_update_rdc_task.return_value = MockCompleteTask()
695+
mock_update_crdqs_task.return_value = MockCompleteTask()
685696
mock_update_vat_with_rdc_task.return_value = (
686697
BaseUpdateVariantAnnotationsTableTask(
687698
reference_genome=ReferenceGenome.GRCh37,
@@ -845,12 +856,14 @@ def test_update_vat_without_accessing_private_datasets(
845856
mock_rdc_env: Mock,
846857
mock_update_vat_with_rdc_task: Mock,
847858
mock_register_alleles: Mock,
859+
mock_update_crdqs_task,
848860
mock_update_rdc_task: Mock,
849861
) -> None:
850862
mock_load_gencode_ensembl_to_refseq_id.return_value = hl.dict(
851863
{'ENST00000327044': 'NM_015658.4'},
852864
)
853865
mock_update_rdc_task.return_value = MockCompleteTask()
866+
mock_update_crdqs_task.return_value = MockCompleteTask()
854867
mock_update_vat_with_rdc_task.return_value = (
855868
BaseUpdateVariantAnnotationsTableTask(
856869
reference_genome=ReferenceGenome.GRCh38,
@@ -913,9 +926,11 @@ def test_mito_update_vat(
913926
self,
914927
mock_update_vat_with_rdc_task: Mock,
915928
mock_register_alleles: Mock,
929+
mock_update_crdqs_task,
916930
mock_update_rdc_task: Mock,
917931
) -> None:
918932
mock_update_rdc_task.return_value = MockCompleteTask()
933+
mock_update_crdqs_task.return_value = MockCompleteTask()
919934
mock_update_vat_with_rdc_task.return_value = (
920935
BaseUpdateVariantAnnotationsTableTask(
921936
reference_genome=ReferenceGenome.GRCh38,
@@ -1198,9 +1213,11 @@ def test_mito_update_vat(
11981213
def test_sv_update_vat(
11991214
self,
12001215
mock_load_gencode: Mock,
1216+
mock_update_crdqs_task,
12011217
mock_update_rdc_task: Mock,
12021218
) -> None:
12031219
mock_update_rdc_task.return_value = MockCompleteTask()
1220+
mock_update_crdqs_task.return_value = MockCompleteTask()
12041221
mock_load_gencode.return_value = GENE_ID_MAPPING
12051222
worker = luigi.worker.Worker()
12061223
update_variant_annotations_task = (
@@ -1778,9 +1795,11 @@ def test_sv_update_vat(
17781795

17791796
def test_gcnv_update_vat(
17801797
self,
1798+
mock_update_crdqs_task,
17811799
mock_update_rdc_task,
17821800
) -> None:
17831801
mock_update_rdc_task.return_value = MockCompleteTask()
1802+
mock_update_crdqs_task.return_value = MockCompleteTask()
17841803
worker = luigi.worker.Worker()
17851804
update_variant_annotations_task = (
17861805
UpdateVariantAnnotationsTableWithNewSamplesTask(

v03_pipeline/lib/tasks/write_relatedness_check_table.py

Lines changed: 7 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,7 @@
33
import luigi.util
44

55
from v03_pipeline.lib.methods.relatedness import call_relatedness
6-
from v03_pipeline.lib.model import CachedReferenceDatasetQuery, Env
6+
from v03_pipeline.lib.model import CachedReferenceDatasetQuery
77
from v03_pipeline.lib.paths import (
88
relatedness_check_table_path,
99
)
@@ -27,21 +27,14 @@ def output(self) -> luigi.Target:
2727
),
2828
)
2929

30-
def requires(self) -> luigi.Task:
31-
requirements = [
30+
def requires(self):
31+
return [
3232
self.clone(ValidateCallsetTask),
33+
self.clone(
34+
UpdatedCachedReferenceDatasetQuery,
35+
crdq=CachedReferenceDatasetQuery.GNOMAD_QC,
36+
),
3337
]
34-
if Env.ACCESS_PRIVATE_REFERENCE_DATASETS:
35-
requirements = [
36-
*requirements,
37-
(
38-
self.clone(
39-
UpdatedCachedReferenceDatasetQuery,
40-
crdq=CachedReferenceDatasetQuery.GNOMAD_QC,
41-
)
42-
),
43-
]
44-
return requirements
4538

4639
def create_table(self) -> hl.Table:
4740
callset_mt = hl.read_matrix_table(self.input()[0].path)

v03_pipeline/lib/tasks/write_variant_annotations_vcf_test.py

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -10,6 +10,7 @@
1010
from v03_pipeline.lib.tasks.write_variant_annotations_vcf import (
1111
WriteVariantAnnotationsVCF,
1212
)
13+
from v03_pipeline.lib.test.mock_complete_task import MockCompleteTask
1314
from v03_pipeline.lib.test.mocked_dataroot_testcase import MockedDatarootTestCase
1415

1516
TEST_SV_VCF = 'v03_pipeline/var/test/callsets/sv_1.vcf'
@@ -39,11 +40,16 @@ class WriteVariantAnnotationsVCFTest(MockedDatarootTestCase):
3940
@patch(
4041
'v03_pipeline.lib.tasks.write_new_variants_table.load_gencode_gene_symbol_to_gene_id',
4142
)
43+
@patch(
44+
'v03_pipeline.lib.tasks.base.base_update_variant_annotations_table.UpdateCachedReferenceDatasetQueries',
45+
)
4246
def test_sv_export_vcf(
4347
self,
48+
mock_update_crdqs_task: Mock,
4449
mock_load_gencode: Mock,
4550
) -> None:
4651
mock_load_gencode.return_value = GENE_ID_MAPPING
52+
mock_update_crdqs_task.return_value = MockCompleteTask()
4753
worker = luigi.worker.Worker()
4854
update_variant_annotations_task = (
4955
UpdateVariantAnnotationsTableWithNewSamplesTask(

0 commit comments

Comments
 (0)