Skip to content

Commit cdc5a8b

Browse files
bpblanken and jklugherz authored
Run ruff format during CI. (#697)
* Run ruff format
* commas
* one more format
* Delete v03_pipeline/lib/tasks/reference_data/updated_cached_reference_dataset_query_test.py

---------

Co-authored-by: Julia Klugherz <juliaklugherz@gmail.com>
1 parent 408a3db commit cdc5a8b

File tree

9 files changed

+49
-13
lines changed

9 files changed

+49
-13
lines changed

.github/workflows/unit-tests.yml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -30,6 +30,8 @@ jobs:
3030
python -m pip install --upgrade pip
3131
pip install -r requirements.txt
3232
pip install -r requirements-dev.txt
33+
- name: Check Ruff Format
34+
run: ruff format --check v03_pipeline --diff
3335
- name: Check Ruff
3436
run: ruff . --output-format github
3537
- name: Unit Tests

v03_pipeline/lib/logger.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -27,8 +27,9 @@
2727

2828
_CONFIGURED = False
2929

30+
3031
def get_logger(name: str):
31-
global _CONFIGURED # noqa: PLW0603
32+
global _CONFIGURED # noqa: PLW0603
3233
if not _CONFIGURED:
3334
logging.config.dictConfig(LOG_CONFIG)
3435
_CONFIGURED = True

v03_pipeline/lib/reference_data/clinvar.py

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -38,6 +38,7 @@
3838

3939
logger = get_logger(__name__)
4040

41+
4142
def safely_move_to_gcs(tmp_file_name, gcs_tmp_file_name):
4243
try:
4344
subprocess.run(
@@ -106,7 +107,10 @@ def download_and_import_latest_clinvar_vcf(
106107

107108
with tempfile.NamedTemporaryFile(suffix='.vcf.gz', delete=False) as tmp_file:
108109
urllib.request.urlretrieve(clinvar_url, tmp_file.name) # noqa: S310
109-
gcs_tmp_file_name = os.path.join(Env.HAIL_TMPDIR, os.path.basename(tmp_file.name))
110+
gcs_tmp_file_name = os.path.join(
111+
Env.HAIL_TMPDIR,
112+
os.path.basename(tmp_file.name),
113+
)
110114
safely_move_to_gcs(tmp_file.name, gcs_tmp_file_name)
111115
mt = hl.import_vcf(
112116
gcs_tmp_file_name,

v03_pipeline/lib/reference_data/compare_globals.py

Lines changed: 12 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -51,8 +51,12 @@ def from_dataset_configs(
5151
),
5252
)
5353
enums[dataset] = dataset_config.get('enum_select', {})
54-
dataset_ht = dataset_ht.select(**get_all_select_fields(dataset_ht, dataset_config))
55-
dataset_ht = dataset_ht.transmute(**get_enum_select_fields(dataset_ht, dataset_config))
54+
dataset_ht = dataset_ht.select(
55+
**get_all_select_fields(dataset_ht, dataset_config),
56+
)
57+
dataset_ht = dataset_ht.transmute(
58+
**get_enum_select_fields(dataset_ht, dataset_config),
59+
)
5660
selects[dataset] = set(dataset_ht.row) - set(dataset_ht.key)
5761
return cls(paths, versions, enums, selects)
5862

@@ -67,13 +71,17 @@ def from_ht(
6771
paths = dict(rdc_globals_struct.paths)
6872
versions = dict(rdc_globals_struct.versions)
6973
# enums are nested structs
70-
enums = {k: dict(v) for k,v in rdc_globals_struct.enums.items()}
74+
enums = {k: dict(v) for k, v in rdc_globals_struct.enums.items()}
7175

7276
selects = {}
7377
for dataset in rdc.datasets(dataset_type):
7478
if dataset in ht.row:
7579
# NB: handle an edge case (mito high constraint) where we annotate a bool from the reference dataset collection
76-
selects[dataset] = set(ht[dataset]) if isinstance(ht[dataset], hl.StructExpression) else set()
80+
selects[dataset] = (
81+
set(ht[dataset])
82+
if isinstance(ht[dataset], hl.StructExpression)
83+
else set()
84+
)
7785
return cls(paths, versions, enums, selects)
7886

7987

v03_pipeline/lib/reference_data/compare_globals_test.py

Lines changed: 12 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -22,15 +22,21 @@ class CompareGlobalsTest(unittest.TestCase):
2222
'38': {
2323
'custom_import': None,
2424
'source_path': 'a_path', # 'a' has a custom import
25-
'select': {'test_select': 'info.test_select', 'test_enum': 'test_enum'},
25+
'select': {
26+
'test_select': 'info.test_select',
27+
'test_enum': 'test_enum',
28+
},
2629
'version': 'a_version',
2730
'enum_select': {'test_enum': ['A', 'B']},
2831
},
2932
},
3033
'b': { # b is missing version
3134
'38': {
3235
'path': 'b_path',
33-
'select': {'test_select': 'info.test_select', 'test_enum': 'test_enum'},
36+
'select': {
37+
'test_select': 'info.test_select',
38+
'test_enum': 'test_enum',
39+
},
3440
'enum_select': {'test_enum': ['C', 'D']},
3541
'custom_select': lambda ht: {'field2': ht.info.test_select_2},
3642
},
@@ -93,7 +99,10 @@ def test_create_globals_from_dataset_ht_configs(
9399
)
94100
self.assertTrue(
95101
dataset_config_globals.selects
96-
== {'a': {'test_select', 'test_enum_id'}, 'b': {'test_select', 'field2', 'test_enum_id'}},
102+
== {
103+
'a': {'test_select', 'test_enum_id'},
104+
'b': {'test_select', 'field2', 'test_enum_id'},
105+
},
97106
)
98107

99108
def test_from_rdc_or_annotations_ht(self):

v03_pipeline/lib/reference_data/dataset_table_operations_test.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -583,4 +583,3 @@ def test_update_or_create_joined_ht_drop_a_dataset(
583583
),
584584
],
585585
)
586-

v03_pipeline/lib/tasks/base/base_hail_table_task.py

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,7 @@
77

88
logger = get_logger(__name__)
99

10+
1011
class BaseHailTableTask(luigi.Task):
1112
reference_genome = luigi.EnumParameter(enum=ReferenceGenome)
1213
dataset_type = luigi.EnumParameter(enum=DatasetType)
@@ -25,24 +26,29 @@ def init_hail(self):
2526
# Interval ref data join causes shuffle death, this prevents it
2627
hl._set_flags(use_new_shuffle='1', no_whole_stage_codegen='1') # noqa: SLF001
2728

29+
2830
# NB: these are defined over luigi.Task instead of the BaseHailTableTask so that
2931
# they work on file dependencies.
3032
@luigi.Task.event_handler(luigi.Event.DEPENDENCY_MISSING)
3133
def dependency_missing(task):
3234
logger.info(f'{task} dependency_missing')
3335

36+
3437
@luigi.Task.event_handler(luigi.Event.DEPENDENCY_PRESENT)
3538
def dependency_present(task):
3639
logger.info(f'{task} dependency_present')
3740

41+
3842
@luigi.Task.event_handler(luigi.Event.START)
3943
def start(task):
4044
logger.info(f'{task} start')
4145

46+
4247
@luigi.Task.event_handler(luigi.Event.FAILURE)
4348
def failure(task, _):
4449
logger.exception(f'{task} failure')
4550

51+
4652
@luigi.Task.event_handler(luigi.Event.SUCCESS)
4753
def success(task):
4854
logger.info(f'{task} success')

v03_pipeline/lib/tasks/reference_data/update_variant_annotations_table_with_updated_reference_dataset.py

Lines changed: 7 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,6 @@
1414
class UpdateVariantAnnotationsTableWithUpdatedReferenceDataset(
1515
BaseVariantAnnotationsTableTask,
1616
):
17-
1817
def __init__(self, *args, **kwargs):
1918
super().__init__(*args, **kwargs)
2019
self._datasets_to_update = []
@@ -66,7 +65,13 @@ def update_table(self, ht: hl.Table) -> hl.Table:
6665
if dataset in ht.row:
6766
ht = ht.drop(dataset)
6867
if rdc.requires_annotation:
69-
formatting_fn = next(x for x in self.dataset_type.formatting_annotation_fns(self.reference_genome) if x.__name__ == dataset)
68+
formatting_fn = next(
69+
x
70+
for x in self.dataset_type.formatting_annotation_fns(
71+
self.reference_genome,
72+
)
73+
if x.__name__ == dataset
74+
)
7075
ht = ht.annotate(
7176
**get_fields(
7277
ht,

v03_pipeline/lib/tasks/reference_data/updated_reference_dataset_collection.py

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -54,7 +54,9 @@ def complete(self) -> bool:
5454
self.dataset_type,
5555
),
5656
)
57-
logger.info(f'Datasets to update: {self._datasets_to_update} for {self.reference_dataset_collection}')
57+
logger.info(
58+
f'Datasets to update: {self._datasets_to_update} for {self.reference_dataset_collection}',
59+
)
5860
return not self._datasets_to_update
5961

6062
def output(self) -> luigi.Target:

0 commit comments

Comments
 (0)