Skip to content
Merged
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion helm-charts/agentqna/gaudi-values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -8,7 +8,7 @@ tgi:
accelDevice: "gaudi"
image:
repository: ghcr.io/huggingface/tgi-gaudi
tag: "2.0.5"
tag: "2.0.6"
resources:
limits:
habana.ai/gaudi: 4
Expand Down
2 changes: 1 addition & 1 deletion helm-charts/audioqna/gaudi-values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@ tgi:
accelDevice: "gaudi"
image:
repository: ghcr.io/huggingface/tgi-gaudi
tag: "2.0.5"
tag: "2.0.6"
resources:
limits:
habana.ai/gaudi: 1
Expand Down
2 changes: 1 addition & 1 deletion helm-charts/chatqna/gaudi-values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@ tgi:
accelDevice: "gaudi"
image:
repository: ghcr.io/huggingface/tgi-gaudi
tag: "2.0.5"
tag: "2.0.6"
resources:
limits:
habana.ai/gaudi: 1
Expand Down
4 changes: 2 additions & 2 deletions helm-charts/chatqna/guardrails-gaudi-values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -49,7 +49,7 @@ tgi:
accelDevice: "gaudi"
image:
repository: ghcr.io/huggingface/tgi-gaudi
tag: "2.0.5"
tag: "2.0.6"
resources:
limits:
habana.ai/gaudi: 1
Expand Down Expand Up @@ -81,7 +81,7 @@ tgi-guardrails:
LLM_MODEL_ID: "meta-llama/Meta-Llama-Guard-2-8B"
image:
repository: ghcr.io/huggingface/tgi-gaudi
tag: "2.0.5"
tag: "2.0.6"
resources:
limits:
habana.ai/gaudi: 1
Expand Down
2 changes: 1 addition & 1 deletion helm-charts/codegen/gaudi-values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@ tgi:
accelDevice: "gaudi"
image:
repository: ghcr.io/huggingface/tgi-gaudi
tag: "2.0.5"
tag: "2.0.6"
resources:
limits:
habana.ai/gaudi: 1
Expand Down
2 changes: 1 addition & 1 deletion helm-charts/codetrans/gaudi-values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@ tgi:
accelDevice: "gaudi"
image:
repository: ghcr.io/huggingface/tgi-gaudi
tag: "2.0.5"
tag: "2.0.6"
resources:
limits:
habana.ai/gaudi: 1
Expand Down
2 changes: 1 addition & 1 deletion helm-charts/common/agent/gaudi-values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@ tgi:
accelDevice: "gaudi"
image:
repository: ghcr.io/huggingface/tgi-gaudi
tag: "2.0.5"
tag: "2.0.6"
resources:
limits:
habana.ai/gaudi: 4
Expand Down
2 changes: 1 addition & 1 deletion helm-charts/common/tgi/gaudi-values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@ accelDevice: "gaudi"

image:
repository: ghcr.io/huggingface/tgi-gaudi
tag: "2.0.5"
tag: "2.0.6"

MAX_INPUT_LENGTH: "1024"
MAX_TOTAL_TOKENS: "2048"
Expand Down
2 changes: 1 addition & 1 deletion helm-charts/docsum/gaudi-values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@ tgi:
accelDevice: "gaudi"
image:
repository: ghcr.io/huggingface/tgi-gaudi
tag: "2.0.5"
tag: "2.0.6"
resources:
limits:
habana.ai/gaudi: 1
Expand Down
2 changes: 1 addition & 1 deletion helm-charts/faqgen/gaudi-values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@ tgi:
accelDevice: "gaudi"
image:
repository: ghcr.io/huggingface/tgi-gaudi
tag: "2.0.5"
tag: "2.0.6"
resources:
limits:
habana.ai/gaudi: 1
Expand Down
2 changes: 1 addition & 1 deletion helm-charts/visualqna/gaudi-values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@ tgi:
accelDevice: "gaudi"
image:
repository: ghcr.io/huggingface/tgi-gaudi
tag: "2.0.5"
tag: "2.0.6"
resources:
limits:
habana.ai/gaudi: 1
Expand Down
2 changes: 1 addition & 1 deletion microservices-connector/config/manifests/tgi_gaudi.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -88,7 +88,7 @@ spec:
optional: true
securityContext:
{}
image: "ghcr.io/huggingface/tgi-gaudi:2.0.5"
image: "ghcr.io/huggingface/tgi-gaudi:2.0.6"
imagePullPolicy: IfNotPresent
volumeMounts:
- mountPath: /data
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,7 @@ Should you desire to use the Gaudi accelerator, two alternate images are used fo
For Gaudi:

- tei-embedding-service: ghcr.io/huggingface/tei-gaudi:1.5.0
- tgi-service: ghcr.io/huggingface/tgi-gaudi:2.0.5
- tgi-service: ghcr.io/huggingface/tgi-gaudi:2.0.6

## Deploy ChatQnA pipeline

Expand Down