@@ -48,9 +48,9 @@ FROM builder as builder-75
48
48
49
49
RUN if [ $VERTEX = "true" ]; \
50
50
then \
51
- CUDA_COMPUTE_CAP=75 cargo chef cook --release --features google --features candle-cuda-turing --no-default-features --recipe-path recipe.json && sccache -s; \
51
+ CUDA_COMPUTE_CAP=75 cargo chef cook --release --features google --features candle-cuda-turing --features http --no-default-features --recipe-path recipe.json && sccache -s; \
52
52
else \
53
- CUDA_COMPUTE_CAP=75 cargo chef cook --release --features candle-cuda-turing --no-default-features --recipe-path recipe.json && sccache -s; \
53
+ CUDA_COMPUTE_CAP=75 cargo chef cook --release --features candle-cuda-turing --no-default-features --features http --recipe-path recipe.json && sccache -s; \
54
54
fi;
55
55
56
56
COPY backends backends
@@ -70,9 +70,9 @@ FROM builder as builder-80
70
70
71
71
RUN if [ $VERTEX = "true" ]; \
72
72
then \
73
- CUDA_COMPUTE_CAP=80 cargo chef cook --release --features google --features candle-cuda-turing --no-default-features --recipe-path recipe.json && sccache -s; \
73
+ CUDA_COMPUTE_CAP=80 cargo chef cook --release --features google --features candle-cuda --features http --no-default-features --recipe-path recipe.json && sccache -s; \
74
74
else \
75
- CUDA_COMPUTE_CAP=80 cargo chef cook --release --features candle-cuda-turing --no-default-features --recipe-path recipe.json && sccache -s; \
75
+ CUDA_COMPUTE_CAP=80 cargo chef cook --release --features candle-cuda --no-default-features --features http --recipe-path recipe.json && sccache -s; \
76
76
fi;
77
77
78
78
COPY backends backends
@@ -83,18 +83,18 @@ COPY Cargo.lock ./
83
83
84
84
RUN if [ $VERTEX = "true" ]; \
85
85
then \
86
- CUDA_COMPUTE_CAP=80 cargo build --release --bin text-embeddings-router -F candle-cuda-turing -F http -F google --no-default-features && sccache -s; \
86
+ CUDA_COMPUTE_CAP=80 cargo build --release --bin text-embeddings-router -F candle-cuda -F http -F google --no-default-features && sccache -s; \
87
87
else \
88
- CUDA_COMPUTE_CAP=80 cargo build --release --bin text-embeddings-router -F candle-cuda-turing -F http --no-default-features && sccache -s; \
88
+ CUDA_COMPUTE_CAP=80 cargo build --release --bin text-embeddings-router -F candle-cuda -F http --no-default-features && sccache -s; \
89
89
fi;
90
90
91
91
FROM builder as builder-90
92
92
93
93
RUN if [ $VERTEX = "true" ]; \
94
94
then \
95
- CUDA_COMPUTE_CAP=90 cargo chef cook --release --features google --features candle-cuda-turing --no-default-features --recipe-path recipe.json && sccache -s; \
95
+ CUDA_COMPUTE_CAP=90 cargo chef cook --release --features google --features candle-cuda --features http --no-default-features --recipe-path recipe.json && sccache -s; \
96
96
else \
97
- CUDA_COMPUTE_CAP=90 cargo chef cook --release --features candle-cuda-turing --no-default-features --recipe-path recipe.json && sccache -s; \
97
+ CUDA_COMPUTE_CAP=90 cargo chef cook --release --features candle-cuda --features http --no-default-features --recipe-path recipe.json && sccache -s; \
98
98
fi;
99
99
100
100
COPY backends backends
@@ -105,9 +105,9 @@ COPY Cargo.lock ./
105
105
106
106
RUN if [ $VERTEX = "true" ]; \
107
107
then \
108
- CUDA_COMPUTE_CAP=90 cargo build --release --bin text-embeddings-router -F candle-cuda-turing -F http -F google --no-default-features && sccache -s; \
108
+ CUDA_COMPUTE_CAP=90 cargo build --release --bin text-embeddings-router -F candle-cuda -F http -F google --no-default-features && sccache -s; \
109
109
else \
110
- CUDA_COMPUTE_CAP=90 cargo build --release --bin text-embeddings-router -F candle-cuda-turing -F http --no-default-features && sccache -s; \
110
+ CUDA_COMPUTE_CAP=90 cargo build --release --bin text-embeddings-router -F candle-cuda -F http --no-default-features && sccache -s; \
111
111
fi;
112
112
113
113
FROM nvidia/cuda:12.2.0-runtime-ubuntu22.04 as base
0 commit comments