Skip to content

Commit f0071be

Browse files
Add HF token and timeout for TEI Server
Signed-off-by: cogniware-devops <ambarish.desai@cogniware.ai>
1 parent eae282e commit f0071be

1 file changed

Lines changed: 8 additions & 3 deletions

File tree

CogniwareIms/docker_compose/intel/cpu/xeon/compose.yaml

Lines changed: 8 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -56,6 +56,7 @@ services:
5656
MODEL_ID: ${EMBEDDING_MODEL_ID:-BAAI/bge-base-en-v1.5}
5757
PORT: 80
5858
MAX_BATCH_TOKENS: 16384
59+
HF_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
5960
# Intel Xeon optimizations
6061
OMP_NUM_THREADS: 4
6162
KMP_AFFINITY: "granularity=fine,compact,1,0"
@@ -67,7 +68,8 @@ services:
6768
test: ["CMD", "curl", "-f", "http://localhost:80/health"]
6869
interval: 30s
6970
timeout: 10s
70-
retries: 3
71+
retries: 10
72+
start_period: 120s
7173

7274
# Embedding Microservice
7375
embedding:
@@ -125,14 +127,16 @@ services:
125127
environment:
126128
MODEL_ID: ${RERANK_MODEL_ID:-BAAI/bge-reranker-base}
127129
PORT: 80
130+
HF_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
128131
http_proxy: ${http_proxy}
129132
https_proxy: ${https_proxy}
130133
no_proxy: ${no_proxy}
131134
healthcheck:
132135
test: ["CMD", "curl", "-f", "http://localhost:80/health"]
133136
interval: 30s
134137
timeout: 10s
135-
retries: 3
138+
retries: 10
139+
start_period: 120s
136140

137141
# Reranking Microservice
138142
reranking:
@@ -179,7 +183,8 @@ services:
179183
test: ["CMD", "curl", "-f", "http://localhost:80/health"]
180184
interval: 30s
181185
timeout: 10s
182-
retries: 3
186+
retries: 10
187+
start_period: 180s
183188

184189
# LLM Microservice
185190
llm-tgi:

0 commit comments

Comments
 (0)