Skip to content

Commit 18261c0

Browse files
Merge branch 'main' into videoqna-bug
2 parents (5ea8491 + 7b7728c), commit 18261c0

10 files changed

Lines changed: 11 additions & 10 deletions

ChatQnA/docker_compose/intel/cpu/xeon/compose.yaml

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -96,6 +96,7 @@ services:
9696
HF_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
9797
LLM_MODEL_ID: ${LLM_MODEL_ID}
9898
VLLM_TORCH_PROFILER_DIR: "/mnt"
99+
VLLM_CPU_KVCACHE_SPACE: 40
99100
healthcheck:
100101
test: ["CMD-SHELL", "curl -f http://$host_ip:9009/health || exit 1"]
101102
interval: 10s
@@ -124,7 +125,7 @@ services:
124125
- RERANK_SERVER_HOST_IP=tei-reranking-service
125126
- RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80}
126127
- LLM_SERVER_HOST_IP=vllm-service
127-
- LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
128+
- LLM_SERVER_PORT=80
128129
- LLM_MODEL=${LLM_MODEL_ID}
129130
- LOGFLAG=${LOGFLAG}
130131
ipc: host

ChatQnA/docker_compose/intel/cpu/xeon/compose_milvus.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -183,7 +183,7 @@ services:
183183
- RERANK_SERVER_HOST_IP=tei-reranking-service
184184
- RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80}
185185
- LLM_SERVER_HOST_IP=vllm-service
186-
- LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
186+
- LLM_SERVER_PORT=80
187187
- LLM_MODEL=${LLM_MODEL_ID}
188188
- LOGFLAG=${LOGFLAG}
189189
ipc: host

ChatQnA/docker_compose/intel/cpu/xeon/compose_pinecone.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -107,7 +107,7 @@ services:
107107
- RERANK_SERVER_HOST_IP=tei-reranking-service
108108
- RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80}
109109
- LLM_SERVER_HOST_IP=vllm-service
110-
- LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
110+
- LLM_SERVER_PORT=80
111111
- LOGFLAG=${LOGFLAG}
112112
- LLM_MODEL=${LLM_MODEL_ID}
113113
ipc: host

ChatQnA/docker_compose/intel/cpu/xeon/compose_qdrant.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -113,7 +113,7 @@ services:
113113
- RERANK_SERVER_HOST_IP=tei-reranking-service
114114
- RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80}
115115
- LLM_SERVER_HOST_IP=vllm-service
116-
- LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
116+
- LLM_SERVER_PORT=80
117117
- LLM_MODEL=${LLM_MODEL_ID}
118118
- LOGFLAG=${LOGFLAG}
119119
ipc: host

ChatQnA/docker_compose/intel/cpu/xeon/compose_tgi.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -113,7 +113,7 @@ services:
113113
- RERANK_SERVER_HOST_IP=tei-reranking-service
114114
- RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80}
115115
- LLM_SERVER_HOST_IP=tgi-service
116-
- LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
116+
- LLM_SERVER_PORT=80
117117
- LLM_MODEL=${LLM_MODEL_ID}
118118
- LOGFLAG=${LOGFLAG}
119119
ipc: host

ChatQnA/docker_compose/intel/cpu/xeon/compose_without_rerank.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -94,7 +94,7 @@ services:
9494
- EMBEDDING_SERVER_PORT=${EMBEDDING_SERVER_PORT:-80}
9595
- RETRIEVER_SERVICE_HOST_IP=retriever
9696
- LLM_SERVER_HOST_IP=vllm-service
97-
- LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
97+
- LLM_SERVER_PORT=80
9898
- LLM_MODEL=${LLM_MODEL_ID}
9999
- LOGFLAG=${LOGFLAG}
100100
- CHATQNA_TYPE=${CHATQNA_TYPE:-CHATQNA_NO_RERANK}

ChatQnA/docker_compose/intel/hpu/gaudi/compose.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -133,7 +133,7 @@ services:
133133
- RERANK_SERVER_HOST_IP=tei-reranking-service
134134
- RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80}
135135
- LLM_SERVER_HOST_IP=vllm-service
136-
- LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
136+
- LLM_SERVER_PORT=80
137137
- LLM_MODEL=${LLM_MODEL_ID}
138138
- LOGFLAG=${LOGFLAG}
139139
ipc: host

ChatQnA/docker_compose/intel/hpu/gaudi/compose_guardrails.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -166,7 +166,7 @@ services:
166166
- RERANK_SERVER_HOST_IP=tei-reranking-service
167167
- RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80}
168168
- LLM_SERVER_HOST_IP=vllm-service
169-
- LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
169+
- LLM_SERVER_PORT=80
170170
- LLM_MODEL=${LLM_MODEL_ID}
171171
- LOGFLAG=${LOGFLAG}
172172
- CHATQNA_TYPE=${CHATQNA_TYPE:-CHATQNA_GUARDRAILS}

ChatQnA/docker_compose/intel/hpu/gaudi/compose_tgi.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -127,7 +127,7 @@ services:
127127
- RERANK_SERVER_HOST_IP=tei-reranking-service
128128
- RERANK_SERVER_PORT=${RERANK_SERVER_PORT:-80}
129129
- LLM_SERVER_HOST_IP=tgi-service
130-
- LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
130+
- LLM_SERVER_PORT=80
131131
- LLM_MODEL=${LLM_MODEL_ID}
132132
- LOGFLAG=${LOGFLAG}
133133
ipc: host

ChatQnA/docker_compose/intel/hpu/gaudi/compose_without_rerank.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -99,7 +99,7 @@ services:
9999
- EMBEDDING_SERVER_PORT=${EMBEDDING_SERVER_PORT:-80}
100100
- RETRIEVER_SERVICE_HOST_IP=retriever
101101
- LLM_SERVER_HOST_IP=vllm-service
102-
- LLM_SERVER_PORT=${LLM_SERVER_PORT:-80}
102+
- LLM_SERVER_PORT=80
103103
- LLM_MODEL=${LLM_MODEL_ID}
104104
- LOGFLAG=${LOGFLAG}
105105
- CHATQNA_TYPE=${CHATQNA_TYPE:-CHATQNA_NO_RERANK}

0 commit comments

Comments
 (0)