Skip to content

Commit

Permalink
helm: upgrade tgi chart
Browse files Browse the repository at this point in the history
- upgrade tgi version to 2.1.0
- upgrade tgi-gaudi version to 2.0.1
- change default model to Intel/neural-chat-7b-v3-3

Signed-off-by: Lianhao Lu <[email protected]>
  • Loading branch information
lianhao authored and leslieluyu committed Jul 18, 2024
1 parent fbdb1da commit c3a1c1a
Show file tree
Hide file tree
Showing 5 changed files with 15 additions and 17 deletions.
2 changes: 1 addition & 1 deletion helm-charts/common/tgi/Chart.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -7,4 +7,4 @@ description: The Helm chart for HuggingFace Text Generation Inference Server
type: application
version: 0.8.0
# The HF TGI version
-appVersion: "1.4"
+appVersion: "2.1.0"
5 changes: 2 additions & 3 deletions helm-charts/common/tgi/gaudi-values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -13,7 +13,7 @@ image:
repository: ghcr.io/huggingface/tgi-gaudi
pullPolicy: IfNotPresent
# Overrides the image tag whose default is the chart appVersion.
-tag: "1.2.1"
+tag: "2.0.1"

imagePullSecrets: []
nameOverride: ""
Expand Down Expand Up @@ -48,8 +48,7 @@ tolerations: []

affinity: {}

-LLM_MODEL_ID: ise-uiuc/Magicoder-S-DS-6.7B
-# LLM_MODEL_ID: /data/Magicoder-S-DS-6.7B
+LLM_MODEL_ID: Intel/neural-chat-7b-v3-3

global:
http_proxy: ""
Expand Down
5 changes: 2 additions & 3 deletions helm-charts/common/tgi/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -13,7 +13,7 @@ image:
repository: ghcr.io/huggingface/text-generation-inference
pullPolicy: IfNotPresent
# Overrides the image tag whose default is the chart appVersion.
-tag: "1.4"
+tag: "2.1.0"

imagePullSecrets: []
nameOverride: ""
Expand Down Expand Up @@ -56,8 +56,7 @@ tolerations: []

affinity: {}

-LLM_MODEL_ID: bigscience/bloom-560m
-# LLM_MODEL_ID: /data/OpenCodeInterpreter-DS-6.7B
+LLM_MODEL_ID: Intel/neural-chat-7b-v3-3

global:
http_proxy: ""
Expand Down
10 changes: 5 additions & 5 deletions manifests/common/tgi.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -11,10 +11,10 @@ metadata:
helm.sh/chart: tgi-0.8.0
app.kubernetes.io/name: tgi
app.kubernetes.io/instance: tgi
-app.kubernetes.io/version: "1.4"
+app.kubernetes.io/version: "2.1.0"
app.kubernetes.io/managed-by: Helm
data:
-MODEL_ID: "bigscience/bloom-560m"
+MODEL_ID: "Intel/neural-chat-7b-v3-3"
PORT: "2080"
HUGGING_FACE_HUB_TOKEN: "insert-your-huggingface-token-here"
HF_TOKEN: "insert-your-huggingface-token-here"
Expand All @@ -40,7 +40,7 @@ metadata:
helm.sh/chart: tgi-0.8.0
app.kubernetes.io/name: tgi
app.kubernetes.io/instance: tgi
-app.kubernetes.io/version: "1.4"
+app.kubernetes.io/version: "2.1.0"
app.kubernetes.io/managed-by: Helm
spec:
type: ClusterIP
Expand All @@ -65,7 +65,7 @@ metadata:
helm.sh/chart: tgi-0.8.0
app.kubernetes.io/name: tgi
app.kubernetes.io/instance: tgi
-app.kubernetes.io/version: "1.4"
+app.kubernetes.io/version: "2.1.0"
app.kubernetes.io/managed-by: Helm
spec:
replicas: 1
Expand All @@ -91,7 +91,7 @@ spec:
optional: true
securityContext:
{}
-image: "ghcr.io/huggingface/text-generation-inference:1.4"
+image: "ghcr.io/huggingface/text-generation-inference:2.1.0"
imagePullPolicy: IfNotPresent
volumeMounts:
- mountPath: /data
Expand Down
10 changes: 5 additions & 5 deletions manifests/common/tgi_gaudi.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -11,10 +11,10 @@ metadata:
helm.sh/chart: tgi-0.8.0
app.kubernetes.io/name: tgi
app.kubernetes.io/instance: tgi
-app.kubernetes.io/version: "1.4"
+app.kubernetes.io/version: "2.1.0"
app.kubernetes.io/managed-by: Helm
data:
-MODEL_ID: "ise-uiuc/Magicoder-S-DS-6.7B"
+MODEL_ID: "Intel/neural-chat-7b-v3-3"
PORT: "2080"
HUGGING_FACE_HUB_TOKEN: "insert-your-huggingface-token-here"
HF_TOKEN: "insert-your-huggingface-token-here"
Expand All @@ -40,7 +40,7 @@ metadata:
helm.sh/chart: tgi-0.8.0
app.kubernetes.io/name: tgi
app.kubernetes.io/instance: tgi
-app.kubernetes.io/version: "1.4"
+app.kubernetes.io/version: "2.1.0"
app.kubernetes.io/managed-by: Helm
spec:
type: ClusterIP
Expand All @@ -65,7 +65,7 @@ metadata:
helm.sh/chart: tgi-0.8.0
app.kubernetes.io/name: tgi
app.kubernetes.io/instance: tgi
-app.kubernetes.io/version: "1.4"
+app.kubernetes.io/version: "2.1.0"
app.kubernetes.io/managed-by: Helm
spec:
replicas: 1
Expand All @@ -91,7 +91,7 @@ spec:
optional: true
securityContext:
{}
-image: "ghcr.io/huggingface/tgi-gaudi:1.2.1"
+image: "ghcr.io/huggingface/tgi-gaudi:2.0.1"
imagePullPolicy: IfNotPresent
volumeMounts:
- mountPath: /data
Expand Down

0 comments on commit c3a1c1a

Please sign in to comment.