File tree Expand file tree Collapse file tree 5 files changed +22
-14
lines changed Expand file tree Collapse file tree 5 files changed +22
-14
lines changed Original file line number Diff line number Diff line change 52
52
gcc -Wall -Werror -O2 /vep.c -o /vep
53
53
chmod u+s /vep
54
54
55
- gcloud storage cp gs://seqr-luigi/releases/$ENVIRONMENT /latest/bin/download_vep_data .bash /download_vep_data .bash
56
- chmod +x /download_vep_data .bash
57
- ./download_vep_data .bash $REFERENCE_GENOME
55
+ gcloud storage cp gs://seqr-luigi/releases/$ENVIRONMENT /latest/bin/download_vep_reference_data .bash /download_vep_reference_data .bash
56
+ chmod +x /download_vep_reference_data .bash
57
+ ./download_vep_reference_data .bash $REFERENCE_GENOME
58
58
59
59
gcloud storage cp gs://seqr-luigi/releases/$ENVIRONMENT /latest/bin/vep /vep.bash
60
60
chmod +x /vep.bash
Original file line number Diff line number Diff line change 3
3
set -eux
4
4
5
5
REFERENCE_GENOME=$1
6
- VEP_DATA= /seqr/vep_data
6
+ VEP_REFERENCE_DATASETS_DIR= ${VEP_REFERENCE_DATASETS_DIR :- / seqr/ vep-reference-data}
7
7
8
8
case $REFERENCE_GENOME in
9
9
GRCh38)
@@ -43,20 +43,20 @@ case $REFERENCE_GENOME in
43
43
exit 1
44
44
esac
45
45
46
- if [ -f $VEP_DATA /$REFERENCE_GENOME /_SUCCESS ]; then
46
+ if [ -f $VEP_REFERENCE_DATASETS_DIR /$REFERENCE_GENOME /_SUCCESS ]; then
47
47
echo " Skipping download because already successful"
48
48
exit 0;
49
49
fi
50
50
51
- mkdir -p $VEP_DATA /$REFERENCE_GENOME ;
51
+ mkdir -p $VEP_REFERENCE_DATASETS_DIR /$REFERENCE_GENOME ;
52
52
for vep_reference_data_file in ${VEP_REFERENCE_DATA_FILES[@]} ; do
53
53
if [[ $vep_reference_data_file == * .tar.gz ]]; then
54
54
echo " Downloading and extracting" $vep_reference_data_file ;
55
- gsutil cat $vep_reference_data_file | tar -xzf - -C $VEP_DATA /$REFERENCE_GENOME / &
55
+ gsutil cat $vep_reference_data_file | tar -xzf - -C $VEP_REFERENCE_DATASETS_DIR /$REFERENCE_GENOME / &
56
56
else
57
57
echo " Downloading" $vep_reference_data_file ;
58
- gsutil cat $vep_reference_data_file $VEP_DATA /$REFERENCE_GENOME / &
58
+ gsutil cat $vep_reference_data_file $VEP_REFERENCE_DATASETS_DIR /$REFERENCE_GENOME / &
59
59
fi
60
60
done ;
61
61
wait
62
- touch $VEP_DATA /$REFERENCE_GENOME /_SUCCESS
62
+ touch $VEP_REFERENCE_DATASETS_DIR /$REFERENCE_GENOME /_SUCCESS
Original file line number Diff line number Diff line change 3
3
set -eux
4
4
5
5
REFERENCE_GENOME=$1
6
- VEP_DATA= /seqr/vep_data
6
+ VEP_REFERENCE_DATASETS_DIR= ${VEP_REFERENCE_DATASETS_DIR :- / seqr/ vep-reference-data}
7
7
VEP_DOCKER_IMAGE=" gcr.io/seqr-project/vep-docker-image"
8
8
9
9
case $REFERENCE_GENOME in
@@ -17,5 +17,5 @@ case $REFERENCE_GENOME in
17
17
esac
18
18
19
19
shift # Remove the REFERENCE_GENOME arg.
20
- docker run --platform linux/amd64 -i -v $VEP_DATA /$REFERENCE_GENOME :/opt/vep/.vep/:ro $VEP_DOCKER_IMAGE :$REFERENCE_GENOME \
20
+ docker run --platform linux/amd64 -i -v $VEP_REFERENCE_DATASETS_DIR /$REFERENCE_GENOME :/opt/vep/.vep/:ro $VEP_DOCKER_IMAGE :$REFERENCE_GENOME \
21
21
/opt/vep/src/ensembl-vep/vep $@
Original file line number Diff line number Diff line change 21
21
'REFERENCE_DATASETS_DIR' ,
22
22
'/seqr/seqr-reference-data' ,
23
23
)
24
+ VEP_REFERENCE_DATASETS_DIR = os .environ .get (
25
+ 'VEP_REFERENCE_DATASETS_DIR' ,
26
+ '/seqr/vep-reference-data' ,
27
+ )
24
28
25
29
# Allele registry secrets :/
26
30
ALLELE_REGISTRY_SECRET_NAME = os .environ .get ('ALLELE_REGISTRY_SECRET_NAME' , None )
@@ -50,3 +54,4 @@ class Env:
50
54
PROJECT_ID : str | None = PROJECT_ID
51
55
REFERENCE_DATASETS_DIR : str = REFERENCE_DATASETS_DIR
52
56
SHOULD_REGISTER_ALLELES : bool = SHOULD_REGISTER_ALLELES
57
+ VEP_REFERENCE_DATASETS_DIR : str = VEP_REFERENCE_DATASETS_DIR
Original file line number Diff line number Diff line change 2
2
3
3
import hail as hl
4
4
5
- from v03_pipeline .lib .model import DatasetType , ReferenceGenome
5
+ from v03_pipeline .lib .model import DatasetType , Env , ReferenceGenome
6
6
7
7
VEP_CONFIG_URI = Template (
8
- 'file:///seqr/vep_data /$reference_genome/vep-$reference_genome.json' ,
8
+ 'file://$vep_reference_datasets_dir /$reference_genome/vep-$reference_genome.json' ,
9
9
)
10
10
11
11
@@ -18,7 +18,10 @@ def run_vep(
18
18
return ht
19
19
return hl .vep (
20
20
ht ,
21
- config = VEP_CONFIG_URI .substitute (reference_genome = reference_genome .value ),
21
+ config = VEP_CONFIG_URI .substitute (
22
+ vep_reference_datasets_dir = Env .VEP_REFERENCE_DATASETS_DIR ,
23
+ reference_genome = reference_genome .value ,
24
+ ),
22
25
name = 'vep' ,
23
26
block_size = 1000 ,
24
27
tolerate_parse_error = True ,
You can’t perform that action at this time.
0 commit comments