From 01bfa66a5614172716e508b02574e3830e45a902 Mon Sep 17 00:00:00 2001
From: dolpher
Date: Fri, 8 Nov 2024 10:31:13 +0800
Subject: [PATCH] Update helm-charts/chatqna/gaudi-values.yaml

Co-authored-by: Eero Tamminen
---
 helm-charts/chatqna/gaudi-values.yaml | 1 +
 1 file changed, 1 insertion(+)

diff --git a/helm-charts/chatqna/gaudi-values.yaml b/helm-charts/chatqna/gaudi-values.yaml
index 6867fbef4..203e1afae 100644
--- a/helm-charts/chatqna/gaudi-values.yaml
+++ b/helm-charts/chatqna/gaudi-values.yaml
@@ -13,6 +13,7 @@ tgi:
   resources:
     limits:
       habana.ai/gaudi: 1
+  # higher limits are needed with extra input tokens added by rerank
   MAX_INPUT_LENGTH: "2048"
   MAX_TOTAL_TOKENS: "4096"
   CUDA_GRAPHS: ""