Skip to content

Commit

Permalink
helm: Update tei/teirerank version and args
Browse files Browse the repository at this point in the history
- Upgrade image version to cpu-1.5

- Add the `--auto-truncate` argument to handle long retrievals

Fixes issue #233. Partially addresses #231.

Signed-off-by: Lianhao Lu <[email protected]>
  • Loading branch information
lianhao committed Aug 6, 2024
1 parent d39b315 commit db29443
Show file tree
Hide file tree
Showing 11 changed files with 27 additions and 17 deletions.
2 changes: 1 addition & 1 deletion helm-charts/common/tei/Chart.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -7,4 +7,4 @@ description: The Helm chart for HuggingFace Text Embedding Inference Server
type: application
version: 0.8.0
# The HF TEI version
appVersion: "1.2"
appVersion: "cpu-1.5"
2 changes: 1 addition & 1 deletion helm-charts/common/tei/README.md
Original file line number Diff line number Diff line change
Expand Up @@ -40,4 +40,4 @@ curl http://localhost:2081/embed -X POST -d '{"inputs":"What is Deep Learning?"}
| EMBEDDING_MODEL_ID | string | `"BAAI/bge-base-en-v1.5"` | Model ID from https://huggingface.co/, or a pre-downloaded model directory |
| global.modelUseHostPath | string | `"/mnt/opea-models"` | Cached models directory; tei will not download the model if it is already cached here. The host path "modelUseHostPath" will be mounted into the container as the /data directory. Setting this to null/empty forces the model to be downloaded. |
| image.repository | string | `"ghcr.io/huggingface/text-embeddings-inference"` | |
| image.tag | string | `"cpu-1.2"` | |
| image.tag | string | `"cpu-1.5"` | |
2 changes: 2 additions & 0 deletions helm-charts/common/tei/templates/deployment.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -45,6 +45,8 @@ spec:
{{- end }}
image: "{{ .Values.image.repository }}:{{ .Values.image.tag | default .Chart.AppVersion }}"
imagePullPolicy: {{ .Values.image.pullPolicy }}
args:
- "--auto-truncate"
volumeMounts:
- mountPath: /data
name: model-volume
Expand Down
2 changes: 1 addition & 1 deletion helm-charts/common/tei/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,7 @@ image:
repository: ghcr.io/huggingface/text-embeddings-inference
pullPolicy: IfNotPresent
# Overrides the image tag whose default is the chart appVersion.
tag: "cpu-1.2"
tag: "cpu-1.5"

imagePullSecrets: []
nameOverride: ""
Expand Down
2 changes: 1 addition & 1 deletion helm-charts/common/teirerank/Chart.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -7,4 +7,4 @@ description: The Helm chart for HuggingFace Text Embedding Inference Server
type: application
version: 0.8.0
# The HF TEI version
appVersion: "1.2"
appVersion: "cpu-1.5"
2 changes: 1 addition & 1 deletion helm-charts/common/teirerank/README.md
Original file line number Diff line number Diff line change
Expand Up @@ -43,4 +43,4 @@ curl http://localhost:2082/rerank \
| RERANK_MODEL_ID | string | `"BAAI/bge-reranker-base"` | Model ID from https://huggingface.co/, or a pre-downloaded model directory |
| global.modelUseHostPath | string | `"/mnt/opea-models"` | Cached models directory; teirerank will not download the model if it is already cached here. The host path "modelUseHostPath" will be mounted into the container as the /data directory. Setting this to null/empty forces the model to be downloaded. |
| image.repository | string | `"ghcr.io/huggingface/text-embeddings-inference"` | |
| image.tag | string | `"cpu-1.2"` | |
| image.tag | string | `"cpu-1.5"` | |
2 changes: 2 additions & 0 deletions helm-charts/common/teirerank/templates/deployment.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -45,6 +45,8 @@ spec:
{{- end }}
image: "{{ .Values.image.repository }}:{{ .Values.image.tag | default .Chart.AppVersion }}"
imagePullPolicy: {{ .Values.image.pullPolicy }}
args:
- "--auto-truncate"
volumeMounts:
- mountPath: /data
name: model-volume
Expand Down
2 changes: 1 addition & 1 deletion helm-charts/common/teirerank/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,7 @@ image:
repository: ghcr.io/huggingface/text-embeddings-inference
pullPolicy: IfNotPresent
# Overrides the image tag whose default is the chart appVersion.
tag: "cpu-1.2"
tag: "cpu-1.5"

imagePullSecrets: []
nameOverride: ""
Expand Down
10 changes: 6 additions & 4 deletions microservices-connector/config/manifests/tei.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@ metadata:
helm.sh/chart: tei-0.8.0
app.kubernetes.io/name: tei
app.kubernetes.io/instance: tei
app.kubernetes.io/version: "1.2"
app.kubernetes.io/version: "cpu-1.5"
app.kubernetes.io/managed-by: Helm
data:
MODEL_ID: "BAAI/bge-base-en-v1.5"
Expand All @@ -36,7 +36,7 @@ metadata:
helm.sh/chart: tei-0.8.0
app.kubernetes.io/name: tei
app.kubernetes.io/instance: tei
app.kubernetes.io/version: "1.2"
app.kubernetes.io/version: "cpu-1.5"
app.kubernetes.io/managed-by: Helm
spec:
type: ClusterIP
Expand All @@ -61,7 +61,7 @@ metadata:
helm.sh/chart: tei-0.8.0
app.kubernetes.io/name: tei
app.kubernetes.io/instance: tei
app.kubernetes.io/version: "1.2"
app.kubernetes.io/version: "cpu-1.5"
app.kubernetes.io/managed-by: Helm
spec:
replicas: 1
Expand All @@ -87,8 +87,10 @@ spec:
optional: true
securityContext:
{}
image: "ghcr.io/huggingface/text-embeddings-inference:cpu-1.2"
image: "ghcr.io/huggingface/text-embeddings-inference:cpu-1.5"
imagePullPolicy: IfNotPresent
args:
- "--auto-truncate"
volumeMounts:
- mountPath: /data
name: model-volume
Expand Down
8 changes: 5 additions & 3 deletions microservices-connector/config/manifests/tei_gaudi.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@ metadata:
helm.sh/chart: tei-0.8.0
app.kubernetes.io/name: tei
app.kubernetes.io/instance: tei
app.kubernetes.io/version: "1.2"
app.kubernetes.io/version: "cpu-1.5"
app.kubernetes.io/managed-by: Helm
data:
MODEL_ID: "BAAI/bge-base-en-v1.5"
Expand All @@ -36,7 +36,7 @@ metadata:
helm.sh/chart: tei-0.8.0
app.kubernetes.io/name: tei
app.kubernetes.io/instance: tei
app.kubernetes.io/version: "1.2"
app.kubernetes.io/version: "cpu-1.5"
app.kubernetes.io/managed-by: Helm
spec:
type: ClusterIP
Expand All @@ -61,7 +61,7 @@ metadata:
helm.sh/chart: tei-0.8.0
app.kubernetes.io/name: tei
app.kubernetes.io/instance: tei
app.kubernetes.io/version: "1.2"
app.kubernetes.io/version: "cpu-1.5"
app.kubernetes.io/managed-by: Helm
spec:
replicas: 1
Expand Down Expand Up @@ -89,6 +89,8 @@ spec:
{}
image: "ghcr.io/huggingface/tei-gaudi:synapse_1.16"
imagePullPolicy: IfNotPresent
args:
- "--auto-truncate"
volumeMounts:
- mountPath: /data
name: model-volume
Expand Down
10 changes: 6 additions & 4 deletions microservices-connector/config/manifests/teirerank.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@ metadata:
helm.sh/chart: teirerank-0.8.0
app.kubernetes.io/name: teirerank
app.kubernetes.io/instance: teirerank
app.kubernetes.io/version: "1.2"
app.kubernetes.io/version: "cpu-1.5"
app.kubernetes.io/managed-by: Helm
data:
MODEL_ID: "BAAI/bge-reranker-base"
Expand All @@ -35,7 +35,7 @@ metadata:
helm.sh/chart: teirerank-0.8.0
app.kubernetes.io/name: teirerank
app.kubernetes.io/instance: teirerank
app.kubernetes.io/version: "1.2"
app.kubernetes.io/version: "cpu-1.5"
app.kubernetes.io/managed-by: Helm
spec:
type: ClusterIP
Expand All @@ -60,7 +60,7 @@ metadata:
helm.sh/chart: teirerank-0.8.0
app.kubernetes.io/name: teirerank
app.kubernetes.io/instance: teirerank
app.kubernetes.io/version: "1.2"
app.kubernetes.io/version: "cpu-1.5"
app.kubernetes.io/managed-by: Helm
spec:
replicas: 1
Expand All @@ -86,8 +86,10 @@ spec:
optional: true
securityContext:
{}
image: "ghcr.io/huggingface/text-embeddings-inference:cpu-1.2"
image: "ghcr.io/huggingface/text-embeddings-inference:cpu-1.5"
imagePullPolicy: IfNotPresent
args:
- "--auto-truncate"
volumeMounts:
- mountPath: /data
name: model-volume
Expand Down

0 comments on commit db29443

Please sign in to comment.