File tree Expand file tree Collapse file tree 6 files changed +20
-12
lines changed
Expand file tree Collapse file tree 6 files changed +20
-12
lines changed Original file line number Diff line number Diff line change 33# Copyright (C) 2024 Intel Corporation
44# SPDX-License-Identifier: Apache-2.0
55
6- FROM langchain/langchain:latest
6+ FROM python:3.11-slim
77
88RUN apt-get update -y && apt-get install -y --no-install-recommends --fix-missing \
99 libgl1-mesa-glx \
1010 libjemalloc-dev \
11- vim
11+ vim \
12+ git
1213
1314RUN useradd -m -s /bin/bash user && \
1415 mkdir -p /home/user && \
Original file line number Diff line number Diff line change 33# Copyright (C) 2024 Intel Corporation
44# SPDX-License-Identifier: Apache-2.0
55
6- FROM langchain/langchain:latest
6+ FROM python:3.11-slim
77
88
99RUN apt-get update -y && apt-get install -y --no-install-recommends --fix-missing \
1010 libgl1-mesa-glx \
1111 libjemalloc-dev \
12- vim
12+ vim \
13+ git
1314
1415RUN useradd -m -s /bin/bash user && \
1516 mkdir -p /home/user && \
Original file line number Diff line number Diff line change 1313# limitations under the License.
1414
1515
16- FROM langchain/langchain:latest
16+ FROM python:3.11-slim
1717
1818RUN apt-get update -y && apt-get install -y --no-install-recommends --fix-missing \
1919 libgl1-mesa-glx \
Original file line number Diff line number Diff line change @@ -11,7 +11,15 @@ services:
1111 http_proxy : ${http_proxy}
1212 https_proxy : ${https_proxy}
1313 TGI_LLM_ENDPOINT : ${TGI_LLM_ENDPOINT}
14- HUGGINGFACEHUB_API_TOKEN : ${HUGGINGFACEHUB_API_TOKEN}
14+ HF_TOKEN : ${HUGGINGFACEHUB_API_TOKEN}
15+ HF_HUB_DISABLE_PROGRESS_BARS : 1
16+ HF_HUB_ENABLE_HF_TRANSFER : 0
17+ HABANA_VISIBLE_DEVICES : all
18+ OMPI_MCA_btl_vader_single_copy_mechanism : none
19+ runtime : habana
20+ cap_add :
21+ - SYS_NICE
22+ ipc : host
1523 volumes :
1624 - " ./data:/data"
1725 command : --model-id ${LLM_MODEL_ID} --max-input-length 1024 --max-total-tokens 2048
Original file line number Diff line number Diff line change @@ -47,7 +47,7 @@ function start_services() {
4747 if grep -q Connected ${LOG_PATH} /tgi_service_start.log; then
4848 break
4949 fi
50- sleep 5s
50+ sleep 10s
5151 n=$(( n+ 1 ))
5252 done
5353}
@@ -84,8 +84,7 @@ function validate_services() {
8484
8585function validate_microservices() {
8686 # Check if the microservices are running correctly.
87- # TODO: Any results check required??
88- sleep 3m
87+
8988 # tgi gaudi service
9089 validate_services \
9190 " ${ip_address} :8008/generate" \
Original file line number Diff line number Diff line change @@ -47,7 +47,7 @@ function start_services() {
4747 if grep -q Connected ${LOG_PATH} /tgi_service_start.log; then
4848 break
4949 fi
50- sleep 5s
50+ sleep 10s
5151 n=$(( n+ 1 ))
5252 done
5353}
@@ -82,8 +82,7 @@ function validate_services() {
8282
8383function validate_microservices() {
8484 # Check if the microservices are running correctly.
85- # TODO: Any results check required??
86- sleep 3m
85+
8786 # tgi for llm service
8887 validate_services \
8988 " ${ip_address} :8008/generate" \
You can’t perform that action at this time.
0 commit comments