Skip to content

Commit

Permalink
Remove tgi
Browse files Browse the repository at this point in the history
  • Loading branch information
lakinduakash committed Oct 30, 2024
1 parent 0086360 commit eccb0c2
Show file tree
Hide file tree
Showing 8 changed files with 2 additions and 268 deletions.
23 changes: 0 additions & 23 deletions helm/h2ogpt-chart/README.md
Original file line number Diff line number Diff line change
Expand Up @@ -135,29 +135,6 @@ A Helm chart for h2oGPT
| h2ogpt.updateStrategy.type | string | `"RollingUpdate"` | |
| nameOverride | string | `""` | |
| namespaceOverride | string | `""` | |
| tgi.containerArgs | string | `nil` | |
| tgi.enabled | bool | `false` | Enable tgi |
| tgi.env | object | `{}` | |
| tgi.hfSecret | string | `nil` | |
| tgi.image.pullPolicy | string | `"IfNotPresent"` | |
| tgi.image.repository | string | `"ghcr.io/huggingface/text-generation-inference"` | |
| tgi.image.tag | string | `"0.9.3"` | |
| tgi.nodeSelector | string | `nil` | |
| tgi.overrideConfig | string | `nil` | |
| tgi.podAffinity | string | `nil` | Set hostname and zone to true for pod affinity rules based on hostname and zone. |
| tgi.podAnnotations | object | `{}` | |
| tgi.podLabels | object | `{}` | |
| tgi.podSecurityContext | string | `nil` | |
| tgi.replicaCount | int | `1` | |
| tgi.resources | string | `nil` | |
| tgi.securityContext | string | `nil` | |
| tgi.service.port | int | `8080` | |
| tgi.service.type | string | `"ClusterIP"` | |
| tgi.storage.class | string | `nil` | |
| tgi.storage.size | string | `"512Gi"` | |
| tgi.storage.useEphemeral | bool | `true` | |
| tgi.tolerations | string | `nil` | |
| tgi.updateStrategy.type | string | `"RollingUpdate"` | |
| vllm.containerArgs[0] | string | `"--model"` | |
| vllm.containerArgs[1] | string | `"h2oai/h2ogpt-4096-llama2-7b-chat"` | |
| vllm.containerArgs[2] | string | `"--tokenizer"` | |
Expand Down
17 changes: 1 addition & 16 deletions helm/h2ogpt-chart/templates/h2ogpt-deployment.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -87,18 +87,7 @@ spec:
python3 /workspace/generate.py
{{- end }}
{{- if and .Values.tgi.enabled (not .Values.global.externalLLM.modelLock) }}
args:
- >
until wget -O- http://{{ include "h2ogpt.fullname" . }}-tgi-inference:{{ .Values.tgi.service.port }}/ >/dev/null 2>&1;
do
echo "Waiting for inference service to become ready...";
sleep 5;
done
python3 /workspace/generate.py
{{- end }}
{{- if and .Values.h2ogpt.enabled (not (or .Values.vllm.enabled .Values.tgi.enabled )) }}
{{- if and .Values.h2ogpt.enabled (not .Values.vllm.enabled ) }}
args:
- >
python3 /workspace/generate.py
Expand Down Expand Up @@ -146,10 +135,6 @@ spec:
name: {{ include "h2ogpt.fullname" . }}-external-llm-secret
{{- end }}
env:
{{- if and .Values.tgi.enabled (not .Values.global.externalLLM.enabled) }}
- name: h2ogpt_inference_server
value: "http://{{ include "h2ogpt.fullname" . }}-tgi-inference:{{ .Values.tgi.service.port }}"
{{- end }}
{{- if and .Values.vllm.enabled (not .Values.global.externalLLM.enabled) }}
- name: h2ogpt_inference_server
value: "vllm:{{ include "h2ogpt.fullname" . }}-vllm-inference:{{ .Values.vllm.service.port }}"
Expand Down
13 changes: 0 additions & 13 deletions helm/h2ogpt-chart/templates/tgi-configmap.yaml

This file was deleted.

141 changes: 0 additions & 141 deletions helm/h2ogpt-chart/templates/tgi-deployment.yaml

This file was deleted.

14 changes: 0 additions & 14 deletions helm/h2ogpt-chart/templates/tgi-pvc.yaml

This file was deleted.

15 changes: 0 additions & 15 deletions helm/h2ogpt-chart/templates/tgi-service.yaml

This file was deleted.

Original file line number Diff line number Diff line change
@@ -1,6 +1,3 @@
{{- if and .Values.vllm.enabled .Values.tgi.enabled }}
{{- fail "Both TGI and vLLM cannot be enabled at the same time. Enable only one and try again" }}
{{- end }}
{{- /* Abort rendering when the agents embedded in h2oGPT (h2ogpt.enabled with h2ogpt.agents.enabled) and the standalone agents (agents.enabled) are all switched on; only one of the two agent modes may be enabled. */ -}}
{{- if and ( and .Values.h2ogpt.enabled .Values.h2ogpt.agents.enabled) .Values.agents.enabled }}
  {{- fail "Both h2ogpt.agents.enabled and agents.enabled cannot be true at the same time. Enable only one and try again" }}
{{- end }}
44 changes: 1 addition & 43 deletions helm/h2ogpt-chart/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -140,7 +140,7 @@ agents:
# -- Enable agents, this must be `false` if `h2ogpt.agents.enabled` is `true`
enabled: false
autoscaling:
# Enable autoscaling for agents
# Enable autoscaling (HPA) for agents
enabled: false
minReplicas: 1
maxReplicas: 2
Expand Down Expand Up @@ -239,48 +239,6 @@ agents:
podAnnotations: {}
podLabels: {}

tgi:
# -- Enable tgi
enabled: false
replicaCount: 1

image:
repository: ghcr.io/huggingface/text-generation-inference
tag: 0.9.3
pullPolicy: IfNotPresent
# -- Set hostname and zone to true for pod affinity rules based on hostname and zone.
podAffinity:
# hostname:
# zone:

storage:
size: 512Gi
class:
useEphemeral: true

overrideConfig:
hfSecret:
containerArgs:

service:
type: ClusterIP
port: 8080

updateStrategy:
type: RollingUpdate

podSecurityContext:
securityContext:

resources:
nodeSelector:
tolerations:

env: {}

podAnnotations: {}
podLabels: {}

vllm:
# -- Enable vllm
enabled: false
Expand Down

0 comments on commit eccb0c2

Please sign in to comment.