Skip to content

Commit caa3f3c

Browse files
committed
fixed deploy issues.
1 parent a0bdf8e commit caa3f3c

2 files changed

Lines changed: 10 additions & 1 deletion

File tree

DocSum/docker_compose/intel/hpu/gaudi/README.md

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -47,6 +47,9 @@ Some HuggingFace resources, such as some models, are only accessible if you have
4747
To set up environment variables for deploying DocSum services, source the _set_env.sh_ script in this directory:
4848

4949
```
50+
# Please set your HUGGINGFACEHUB_API_TOKEN.
51+
export HUGGINGFACEHUB_API_TOKEN="Your_HuggingFace_API_Token"
52+
5053
source ./set_env.sh
5154
```
5255

DocSum/docker_compose/set_env.sh

Lines changed: 7 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6,14 +6,20 @@ pushd "../../" > /dev/null
66
source .set_env.sh
77
popd > /dev/null
88

9+
export host_ip=$(hostname -I | awk '{print $1}') # Example: host_ip="192.168.1.1"
910
export no_proxy="${no_proxy},${host_ip}" # Example: no_proxy="localhost, 127.0.0.1, 192.168.1.1"
1011
export http_proxy=$http_proxy
1112
export https_proxy=$https_proxy
12-
export host_ip=$(hostname -I | awk '{print $1}') # Example: host_ip="192.168.1.1"
1313
export HUGGINGFACEHUB_API_TOKEN=${HUGGINGFACEHUB_API_TOKEN}
1414

1515
export LLM_ENDPOINT_PORT=8008
1616
export LLM_MODEL_ID="Intel/neural-chat-7b-v3-3"
17+
18+
export BLOCK_SIZE=128
19+
export MAX_NUM_SEQS=256
20+
export MAX_SEQ_LEN_TO_CAPTURE=2048
21+
export NUM_CARDS=1
22+
1723
export MAX_INPUT_TOKENS=1024
1824
export MAX_TOTAL_TOKENS=2048
1925

0 commit comments

Comments
 (0)