Skip to content

Commit afb46bd

Browse files
authored
update default model to resolve the vllm/model_executor issue (#1985)
Signed-off-by: chensuyue <[email protected]>
1 parent d1a500f commit afb46bd

File tree

5 files changed: 5 additions (+5) and 1 deletion (-1) in lines changed

5 files changed: 5 additions (+5) and 1 deletion (-1) in lines changed

DocSum/docker_compose/intel/cpu/xeon/compose.yaml

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -40,6 +40,7 @@ services:
40 | 40 |   LLM_ENDPOINT: ${LLM_ENDPOINT}
41 | 41 |   LLM_MODEL_ID: ${LLM_MODEL_ID}
42 | 42 |   HUGGINGFACEHUB_API_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
   | 43 | + HF_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
43 | 44 |   MAX_INPUT_TOKENS: ${MAX_INPUT_TOKENS}
44 | 45 |   MAX_TOTAL_TOKENS: ${MAX_TOTAL_TOKENS}
45 | 46 |   DocSum_COMPONENT_NAME: ${DocSum_COMPONENT_NAME}

DocSum/docker_compose/intel/cpu/xeon/compose_tgi.yaml

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -40,6 +40,7 @@ services:
40 | 40 |   LLM_ENDPOINT: ${LLM_ENDPOINT}
41 | 41 |   LLM_MODEL_ID: ${LLM_MODEL_ID}
42 | 42 |   HUGGINGFACEHUB_API_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
   | 43 | + HF_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
43 | 44 |   MAX_INPUT_TOKENS: ${MAX_INPUT_TOKENS}
44 | 45 |   MAX_TOTAL_TOKENS: ${MAX_TOTAL_TOKENS}
45 | 46 |   DocSum_COMPONENT_NAME: ${DocSum_COMPONENT_NAME}

DocSum/docker_compose/intel/hpu/gaudi/compose.yaml

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -45,6 +45,7 @@ services:
45 | 45 |   http_proxy: ${http_proxy}
46 | 46 |   https_proxy: ${https_proxy}
47 | 47 |   HUGGINGFACEHUB_API_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
   | 48 | + HF_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
48 | 49 |   MAX_INPUT_TOKENS: ${MAX_INPUT_TOKENS}
49 | 50 |   MAX_TOTAL_TOKENS: ${MAX_TOTAL_TOKENS}
50 | 51 |   LLM_ENDPOINT: ${LLM_ENDPOINT}

DocSum/docker_compose/intel/hpu/gaudi/compose_tgi.yaml

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -49,6 +49,7 @@ services:
49 | 49 |   http_proxy: ${http_proxy}
50 | 50 |   https_proxy: ${https_proxy}
51 | 51 |   HUGGINGFACEHUB_API_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
   | 52 | + HF_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
52 | 53 |   MAX_INPUT_TOKENS: ${MAX_INPUT_TOKENS}
53 | 54 |   MAX_TOTAL_TOKENS: ${MAX_TOTAL_TOKENS}
54 | 55 |   LLM_ENDPOINT: ${LLM_ENDPOINT}

DocSum/docker_compose/intel/set_env.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -13,7 +13,7 @@ export https_proxy=$https_proxy
13 | 13 |   export HUGGINGFACEHUB_API_TOKEN=${HUGGINGFACEHUB_API_TOKEN}
14 | 14 |
15 | 15 |   export LLM_ENDPOINT_PORT=8008
16 |    | - export LLM_MODEL_ID="Intel/neural-chat-7b-v3-3"
   | 16 | + export LLM_MODEL_ID="meta-llama/Meta-Llama-3-8B-Instruct"
17 | 17 |   export MAX_INPUT_TOKENS=1024
18 | 18 |   export MAX_TOTAL_TOKENS=2048
19 | 19 |
0 commit comments

Comments
 (0)