@@ -76,10 +76,8 @@ COPY backends backends
76
76
COPY backends/python/server/text_embeddings_server/models/__init__.py backends/python/server/text_embeddings_server/models/__init__.py
77
77
COPY backends/python/server/pyproject.toml backends/python/server/pyproject.toml
78
78
79
- RUN python -m pip install torch==2.6.0 torchvision torchaudio==2.6.0 --index-url https://download.pytorch.org/whl/cpu --no-cache-dir
80
-
81
79
RUN cd backends/python/server && \
82
- make install
80
+ make install-cpu
83
81
84
82
FROM vault.habana.ai/gaudi-docker/1.19.0/ubuntu22.04/habanalabs/pytorch-installer-2.5.1:latest AS hpu
85
83
ENV HUGGINGFACE_HUB_CACHE=/data \
@@ -99,7 +97,10 @@ COPY backends/python/server/text_embeddings_server/models/__init__.py backends/p
99
97
COPY backends/python/server/pyproject.toml backends/python/server/pyproject.toml
100
98
101
99
RUN cd backends/python/server && \
102
- make install
100
+ pip install -U pip uv && \
101
+ uv venv && \
102
+ cp -r /usr/local/lib/python3.10/dist-packages/* /usr/src/backends/python/server/.venv/lib/python3.10/site-packages/ && \
103
+ make install-hpu
103
104
104
105
FROM intel/intel-extension-for-pytorch:2.6.10-xpu AS xpu
105
106
@@ -115,9 +116,6 @@ RUN wget -O- https://apt.repos.intel.com/intel-gpg-keys/GPG-PUB-KEY-INTEL-SW-PRO
115
116
116
117
RUN apt-get update && apt install -y intel-basekit cmake python3-dev ninja-build pciutils
117
118
WORKDIR /usr/src
118
- RUN pip install torch==2.6.0 torchvision torchaudio --index-url https://download.pytorch.org/whl/xpu --no-cache-dir
119
- RUN pip install intel-extension-for-pytorch==2.6.10+xpu oneccl_bind_pt==2.6.0+xpu --extra-index-url https://pytorch-extension.intel.com/release-whl/stable/xpu/us/ --no-cache-dir
120
-
121
119
ENV CCL_ROOT=/opt/intel/oneapi/ccl/latest
122
120
ENV I_MPI_ROOT=/opt/intel/oneapi/mpi/latest
123
121
ENV FI_PROVIDER_PATH=/opt/intel/oneapi/mpi/latest/opt/mpi/libfabric/lib/prov:/usr/lib/x86_64-linux-gnu/libfabric
@@ -132,7 +130,7 @@ COPY backends backends
132
130
COPY backends/python/server/text_embeddings_server/models/__init__.py backends/python/server/text_embeddings_server/models/__init__.py
133
131
COPY backends/python/server/pyproject.toml backends/python/server/pyproject.toml
134
132
RUN cd backends/python/server && \
135
- make install
133
+ make install-xpu
136
134
137
135
FROM ${PLATFORM} AS grpc
138
136
@@ -144,6 +142,8 @@ CMD ["--json-output"]
144
142
FROM ${PLATFORM}
145
143
146
144
COPY --from=http-builder /usr/src/target/release/text-embeddings-router /usr/local/bin/text-embeddings-router
145
+ ENV VIRTUAL_ENV=/usr/src/backends/python/server/.venv
146
+ ENV PATH=$VIRTUAL_ENV/bin/:$PATH
147
147
148
148
ENTRYPOINT ["text-embeddings-router"]
149
149
CMD ["--json-output"]
0 commit comments