File tree Expand file tree Collapse file tree 4 files changed +7
-7
lines changed
Expand file tree Collapse file tree 4 files changed +7
-7
lines changed Original file line number Diff line number Diff line change 1515 TGI_LLM_ENDPOINT : http://llm-dependency-svc.default.svc.cluster.local:9009
1616 REDIS_URL : redis://vector-db.default.svc.cluster.local:6379
1717 INDEX_NAME : rag-redis
18- HUGGINGFACEHUB_API_TOKEN : {HF_TOKEN}
18+ HUGGINGFACEHUB_API_TOKEN : ${HF_TOKEN}
1919 EMBEDDING_SERVICE_HOST_IP : embedding-svc
2020 RETRIEVER_SERVICE_HOST_IP : retriever-svc
2121 RERANK_SERVICE_HOST_IP : reranking-svc
Original file line number Diff line number Diff line change 3535 - --model-id
3636 - $(LLM_MODEL_ID)
3737 - --max-input-length
38- - '2048'
38+ - '1024'
3939 - --max-total-tokens
40- - '4096'
40+ - '2048'
4141 - --max-batch-total-tokens
4242 - '65536'
4343 - --max-batch-prefill-tokens
Original file line number Diff line number Diff line change 3535 - --model-id
3636 - $(LLM_MODEL_ID)
3737 - --max-input-length
38- - '2048'
38+ - '1024'
3939 - --max-total-tokens
40- - '4096'
40+ - '2048'
4141 - --max-batch-total-tokens
4242 - '65536'
4343 - --max-batch-prefill-tokens
Original file line number Diff line number Diff line change 3535 - --model-id
3636 - $(LLM_MODEL_ID)
3737 - --max-input-length
38- - '2048'
38+ - '1024'
3939 - --max-total-tokens
40- - '4096'
40+ - '2048'
4141 - --max-batch-total-tokens
4242 - '65536'
4343 - --max-batch-prefill-tokens
You can’t perform that action at this time.
0 commit comments