Skip to content

Commit 1987548

Browse files
authored
Merge pull request #711 from broadinstitute/benb/prefer_env_vars_for_vep_path
prefer env vars for vep path
2 parents ffdb18d + 1ff8e92 commit 1987548

File tree

5 files changed

+9
-18
lines changed

5 files changed

+9
-18
lines changed

v03_pipeline/lib/annotations/fields_test.py

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -41,7 +41,6 @@ def test_get_formatting_fields(self, mock_vep: Mock, mock_validate: Mock) -> Non
4141
ht,
4242
DatasetType.SNV_INDEL,
4343
ReferenceGenome.GRCh38,
44-
None,
4544
)
4645
ht = ht.annotate(rsid='abcd')
4746
for reference_genome, expected_fields in [

v03_pipeline/lib/annotations/shared_test.py

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -40,7 +40,6 @@ def test_sorted_transcript_consequences(
4040
ht,
4141
DatasetType.SNV_INDEL,
4242
ReferenceGenome.GRCh38,
43-
None,
4443
)
4544
ht = ht.select(
4645
sorted_transcript_consequences=sorted_transcript_consequences(ht),

v03_pipeline/lib/model/environment.py

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -18,6 +18,8 @@
1818
'REFERENCE_DATASETS',
1919
'/seqr-reference-data',
2020
)
21+
VEP_CONFIG_PATH = os.environ.get('VEP_CONFIG_PATH', None)
22+
VEP_CONFIG_URI = os.environ.get('VEP_CONFIG_URI', None)
2123

2224

2325
@dataclass
@@ -30,3 +32,5 @@ class Env:
3032
LOADING_DATASETS: str = LOADING_DATASETS
3133
PRIVATE_REFERENCE_DATASETS: str = PRIVATE_REFERENCE_DATASETS
3234
REFERENCE_DATASETS: str = REFERENCE_DATASETS
35+
VEP_CONFIG_PATH: str | None = VEP_CONFIG_PATH
36+
VEP_CONFIG_URI: str | None = VEP_CONFIG_URI

v03_pipeline/lib/tasks/update_variant_annotations_table_with_new_samples.py

Lines changed: 0 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -52,10 +52,6 @@ class UpdateVariantAnnotationsTableWithNewSamplesTask(BaseVariantAnnotationsTabl
5252
default='gs://hail-common/references/grch38_to_grch37.over.chain.gz',
5353
description='Path to GRCh38 to GRCh37 coordinates file',
5454
)
55-
vep_config_json_path = luigi.OptionalParameter(
56-
default=None,
57-
description='Path of hail vep config .json file',
58-
)
5955

6056
@property
6157
def other_annotation_dependencies(self) -> dict[str, hl.Table]:
@@ -216,7 +212,6 @@ def update_table(self, ht: hl.Table) -> hl.Table:
216212
new_variants_ht,
217213
self.dataset_type,
218214
self.reference_genome,
219-
self.vep_config_json_path,
220215
)
221216

222217
# 2) Select down to the formatting annotations fields and

v03_pipeline/lib/vep.py

Lines changed: 5 additions & 11 deletions
Original file line number | Diff line number | Diff line change
@@ -1,10 +1,10 @@
11
import hail as hl
22

3-
from v03_pipeline.lib.model import DatasetType, ReferenceGenome
3+
from v03_pipeline.lib.model import DatasetType, Env, ReferenceGenome
44

55

6-
def validate_vep_config_reference_genome(reference_genome, config: str) -> None:
7-
with open(config) as f:
6+
def validate_vep_config_reference_genome(reference_genome) -> None:
7+
with open(Env.VEP_CONFIG_PATH) as f:
88
if reference_genome.value not in f.read():
99
msg = f'Vep config does not match supplied reference genome {reference_genome.value}'
1010
raise ValueError(msg)
@@ -14,19 +14,13 @@ def run_vep(
1414
ht: hl.Table,
1515
dataset_type: DatasetType,
1616
reference_genome: ReferenceGenome,
17-
vep_config_json_path: str | None,
1817
) -> hl.Table:
1918
if not dataset_type.veppable:
2019
return ht
21-
config = (
22-
vep_config_json_path
23-
if vep_config_json_path is not None
24-
else f'file:///vep_data/vep-{reference_genome.value}-gcloud.json'
25-
)
26-
validate_vep_config_reference_genome(reference_genome, config)
20+
validate_vep_config_reference_genome(reference_genome)
2721
return hl.vep(
2822
ht,
29-
config=config,
23+
config=Env.VEP_CONFIG_URI,
3024
name='vep',
3125
block_size=1000,
3226
tolerate_parse_error=True,

0 commit comments

Comments
 (0)