File tree Expand file tree Collapse file tree
ChatQnA/docker_compose/intel Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -96,6 +96,7 @@ services:
9696 HF_TOKEN : ${HUGGINGFACEHUB_API_TOKEN}
9797 LLM_MODEL_ID : ${LLM_MODEL_ID}
9898 VLLM_TORCH_PROFILER_DIR : " /mnt"
99+ VLLM_CPU_KVCACHE_SPACE : 40
99100 healthcheck :
100101 test : ["CMD-SHELL", "curl -f http://$host_ip:9009/health || exit 1"]
101102 interval : 10s
@@ -124,7 +125,7 @@ services:
124125 - RERANK_SERVER_HOST_IP=tei-reranking-service
125126 - RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80}
126127 - LLM_SERVER_HOST_IP=vllm-service
127- - LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
128+ - LLM_SERVER_PORT=80
128129 - LLM_MODEL=${LLM_MODEL_ID}
129130 - LOGFLAG=${LOGFLAG}
130131 ipc : host
Original file line number Diff line number Diff line change @@ -183,7 +183,7 @@ services:
183183 - RERANK_SERVER_HOST_IP=tei-reranking-service
184184 - RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80}
185185 - LLM_SERVER_HOST_IP=vllm-service
186- - LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
186+ - LLM_SERVER_PORT=80
187187 - LLM_MODEL=${LLM_MODEL_ID}
188188 - LOGFLAG=${LOGFLAG}
189189 ipc : host
Original file line number Diff line number Diff line change @@ -107,7 +107,7 @@ services:
107107 - RERANK_SERVER_HOST_IP=tei-reranking-service
108108 - RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80}
109109 - LLM_SERVER_HOST_IP=vllm-service
110- - LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
110+ - LLM_SERVER_PORT=80
111111 - LOGFLAG=${LOGFLAG}
112112 - LLM_MODEL=${LLM_MODEL_ID}
113113 ipc : host
Original file line number Diff line number Diff line change @@ -113,7 +113,7 @@ services:
113113 - RERANK_SERVER_HOST_IP=tei-reranking-service
114114 - RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80}
115115 - LLM_SERVER_HOST_IP=vllm-service
116- - LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
116+ - LLM_SERVER_PORT=80
117117 - LLM_MODEL=${LLM_MODEL_ID}
118118 - LOGFLAG=${LOGFLAG}
119119 ipc : host
Original file line number Diff line number Diff line change @@ -113,7 +113,7 @@ services:
113113 - RERANK_SERVER_HOST_IP=tei-reranking-service
114114 - RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80}
115115 - LLM_SERVER_HOST_IP=tgi-service
116- - LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
116+ - LLM_SERVER_PORT=80
117117 - LLM_MODEL=${LLM_MODEL_ID}
118118 - LOGFLAG=${LOGFLAG}
119119 ipc : host
Original file line number Diff line number Diff line change @@ -94,7 +94,7 @@ services:
9494 - EMBEDDING_SERVER_PORT=${EMBEDDING_SERVER_PORT:-80}
9595 - RETRIEVER_SERVICE_HOST_IP=retriever
9696 - LLM_SERVER_HOST_IP=vllm-service
97- - LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
97+ - LLM_SERVER_PORT=80
9898 - LLM_MODEL=${LLM_MODEL_ID}
9999 - LOGFLAG=${LOGFLAG}
100100 - CHATQNA_TYPE=${CHATQNA_TYPE:-CHATQNA_NO_RERANK}
Original file line number Diff line number Diff line change @@ -133,7 +133,7 @@ services:
133133 - RERANK_SERVER_HOST_IP=tei-reranking-service
134134 - RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80}
135135 - LLM_SERVER_HOST_IP=vllm-service
136- - LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
136+ - LLM_SERVER_PORT=80
137137 - LLM_MODEL=${LLM_MODEL_ID}
138138 - LOGFLAG=${LOGFLAG}
139139 ipc : host
Original file line number Diff line number Diff line change @@ -166,7 +166,7 @@ services:
166166 - RERANK_SERVER_HOST_IP=tei-reranking-service
167167 - RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80}
168168 - LLM_SERVER_HOST_IP=vllm-service
169- - LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
169+ - LLM_SERVER_PORT=80
170170 - LLM_MODEL=${LLM_MODEL_ID}
171171 - LOGFLAG=${LOGFLAG}
172172 - CHATQNA_TYPE=${CHATQNA_TYPE:-CHATQNA_GUARDRAILS}
Original file line number Diff line number Diff line change @@ -127,7 +127,7 @@ services:
127127 - RERANK_SERVER_HOST_IP=tei-reranking-service
128128 - RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80}
129129 - LLM_SERVER_HOST_IP=tgi-service
130- - LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
130+ - LLM_SERVER_PORT=80
131131 - LLM_MODEL=${LLM_MODEL_ID}
132132 - LOGFLAG=${LOGFLAG}
133133 ipc : host
Original file line number Diff line number Diff line change @@ -99,7 +99,7 @@ services:
9999 - EMBEDDING_SERVER_PORT=${EMBEDDING_SERVER_PORT:-80}
100100 - RETRIEVER_SERVICE_HOST_IP=retriever
101101 - LLM_SERVER_HOST_IP=vllm-service
102- - LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
102+ - LLM_SERVER_PORT=80
103103 - LLM_MODEL=${LLM_MODEL_ID}
104104 - LOGFLAG=${LOGFLAG}
105105 - CHATQNA_TYPE=${CHATQNA_TYPE:-CHATQNA_NO_RERANK}
You can’t perform that action at this time.
0 commit comments