File tree Expand file tree Collapse file tree 2 files changed +7
-1
lines changed Expand file tree Collapse file tree 2 files changed +7
-1
lines changed Original file line number Diff line number Diff line change @@ -111,6 +111,11 @@ ARG DEFAULT_USE_FLASH_ATTENTION=True
111
111
COPY backends/python/Makefile-flash-att-v2 Makefile-flash-att-v2
112
112
RUN make -f Makefile-flash-att-v2 install-flash-attention-v2-rocm
113
113
114
+ # Install python backend
115
+ COPY backends/python/server /tei_backends/python/server
116
+ COPY backends/proto /tei_backends/proto
117
+ RUN make -C /tei_backends/python/server install
118
+
114
119
ENV HUGGINGFACE_HUB_CACHE=/data \
115
120
PORT=80 \
116
121
USE_FLASH_ATTENTION=$DEFAULT_USE_FLASH_ATTENTION
Original file line number Diff line number Diff line change @@ -15,12 +15,13 @@ grpcio-status = "^1.51.1"
15
15
grpcio-reflection = "^1.51.1"
16
16
grpc-interceptor = "^0.15.0"
17
17
typer = "^0.6.1"
18
- safetensors = "^0.3.2"
18
+ safetensors = "^0.4.0"
19
19
loguru = "^0.6.0"
20
20
opentelemetry-api = "^1.15.0"
21
21
opentelemetry-exporter-otlp = "^1.15.0"
22
22
opentelemetry-instrumentation-grpc = "^0.36b0"
23
23
torch = { version = "==2.3.1" }
24
+ transformers = { version = "^4.39.0" }
24
25
25
26
[tool.poetry.extras]
26
27
You can’t perform that action at this time.
0 commit comments