File tree Expand file tree Collapse file tree 2 files changed +28
-1
lines changed
nextstrain_profiles/nextstrain-gisaid Expand file tree Collapse file tree 2 files changed +28
-1
lines changed Original file line number Diff line number Diff line change @@ -2,6 +2,7 @@ auspice_json_prefix: ncov_gisaid
2
2
3
3
# Define custom rules for pre- or post-standard workflow processing of data.
4
4
custom_rules:
5
+ - workflow/snakemake_rules/prefilter.smk
5
6
- workflow/snakemake_rules/export_for_nextstrain.smk
6
7
7
8
# These parameters are only used by the `export_for_nextstrain` rule and shouldn't need to be modified.
25
26
26
27
inputs:
27
28
- name: gisaid
28
- metadata: "s3://nextstrain-ncov-private/metadata.tsv.zst"
29
+ metadata: "data/prefiltered_metadata.tsv"
29
30
aligned: "s3://nextstrain-ncov-private/aligned.fasta.zst"
30
31
skip_sanitize_metadata: true
31
32
Original file line number Diff line number Diff line change
1
# Copy the zstd-compressed metadata table from its S3 location
# (`params.metadata_url`) to a local file with the AWS CLI.
rule download_metadata:
    output:
        # Local copy; the same path is declared as the input of `filter_metadata`.
        metadata="data/metadata.tsv.zst",
    params:
        metadata_url="s3://nextstrain-ncov-private/metadata.tsv.zst",
    shell:
        """
        aws s3 cp {params.metadata_url} {output.metadata}
        """
10
+
11
# Subsample the downloaded metadata with `augur filter`: keep at most
# `params.max_sequences` records, grouped by the columns in `params.group_by`,
# and write the result to an uncompressed TSV.
rule filter_metadata:
    input:
        metadata="data/metadata.tsv.zst",
    params:
        # Space-separated column names; interpolated unquoted below so the
        # shell passes each column to --group-by as a separate argument.
        group_by="division year month",
        max_sequences=500000,
    output:
        metadata="data/prefiltered_metadata.tsv",
    shell:
        """
        augur filter \
            --metadata {input.metadata} \
            --subsample-max-sequences {params.max_sequences} \
            --group-by {params.group_by} \
            --output-metadata {output.metadata}
        """
You can’t perform that action at this time.
0 commit comments