From b883f9c1f6e70fb1f040fed50e1b19f13b864a9e Mon Sep 17 00:00:00 2001
From: chantu
Date: Sun, 22 Oct 2023 22:57:16 +0800
Subject: [PATCH] chore: add baichuan replit-code codeshell (#5575)

---
Review notes (free text between the three-dash separator and the first
"diff --git" line; it is not part of the commit message or of the diff):

* Adds three ClusterVersion documents that reference the "ggml"
  ClusterDefinition: ggml-baichuan2-13b-q4, ggml-replit-code-3b-f16 and
  ggml-codeshell-7b-chat-q4.
* In each document the "download" init container copies one .gguf file
  from /models into /models-target, where the "models" volume is mounted.
  /models is not a mounted volume in that container, so the file is
  presumably shipped inside the model image - confirm.
* The "ggml" container mounts the same "models" volume at /models and
  receives the copied file's path in the MODEL environment variable.
* The baichuan2 and replit-code versions take the runtime image tag from
  .Values.imageDev.tagNew; codeshell uses .Values.imageDev.tagCodeShell.
  Both fall back to .Chart.AppVersion when the value is empty or unset.
* NOTE(review): the line breaks of this patch had been lost, so the YAML
  indentation below was rebuilt from the Kubernetes / KubeBlocks object
  structure. Confirm the context lines against the target tree before
  applying.

 deploy/llm/templates/clusterversion.yaml | 84 ++++++++++++++++++++++++
 deploy/llm/values.yaml                   |  2 +
 2 files changed, 86 insertions(+)

diff --git a/deploy/llm/templates/clusterversion.yaml b/deploy/llm/templates/clusterversion.yaml
index 6514a05b2a8..fd3b5cd7fc8 100644
--- a/deploy/llm/templates/clusterversion.yaml
+++ b/deploy/llm/templates/clusterversion.yaml
@@ -187,3 +187,87 @@ spec:
             volumeMounts:
               - name: models
                 mountPath: /models
+---
+apiVersion: apps.kubeblocks.io/v1alpha1
+kind: ClusterVersion
+metadata:
+  name: ggml-baichuan2-13b-q4
+  labels:
+    {{- include "llm.labels" . | nindent 4 }}
+spec:
+  clusterDefinitionRef: ggml
+  componentVersions:
+    - componentDefRef: ggml
+      versionsContext:
+        initContainers:
+          - name: download
+            image: infracreate-registry.cn-zhangjiakou.cr.aliyuncs.com/apecloud/baichuan2-13b-gguf:ggml-model-q4
+            command: ["sh", "-c", "cp /models/ggml-model-q4.gguf /models-target/"]
+            volumeMounts:
+              - name: models
+                mountPath: /models-target
+        containers:
+          - name: ggml
+            image: {{ .Values.imageDev.registry | default "docker.io" }}/{{ .Values.imageDev.repository}}:{{ default .Chart.AppVersion .Values.imageDev.tagNew }}
+            env:
+              - name: MODEL
+                value: /models/ggml-model-q4.gguf
+            volumeMounts:
+              - name: models
+                mountPath: /models
+---
+apiVersion: apps.kubeblocks.io/v1alpha1
+kind: ClusterVersion
+metadata:
+  name: ggml-replit-code-3b-f16
+  labels:
+    {{- include "llm.labels" . | nindent 4 }}
+spec:
+  clusterDefinitionRef: ggml
+  componentVersions:
+    - componentDefRef: ggml
+      versionsContext:
+        initContainers:
+          - name: download
+            image: infracreate-registry.cn-zhangjiakou.cr.aliyuncs.com/apecloud/replit-code-3b:ggml-model-f16
+            command: ["sh", "-c", "cp /models/ggml-model-f16.gguf /models-target/"]
+            volumeMounts:
+              - name: models
+                mountPath: /models-target
+        containers:
+          - name: ggml
+            image: {{ .Values.imageDev.registry | default "docker.io" }}/{{ .Values.imageDev.repository}}:{{ default .Chart.AppVersion .Values.imageDev.tagNew }}
+            env:
+              - name: MODEL
+                value: /models/ggml-model-f16.gguf
+            volumeMounts:
+              - name: models
+                mountPath: /models
+---
+apiVersion: apps.kubeblocks.io/v1alpha1
+kind: ClusterVersion
+metadata:
+  name: ggml-codeshell-7b-chat-q4
+  labels:
+    {{- include "llm.labels" . | nindent 4 }}
+spec:
+  clusterDefinitionRef: ggml
+  componentVersions:
+    - componentDefRef: ggml
+      versionsContext:
+        initContainers:
+          - name: download
+            image: infracreate-registry.cn-zhangjiakou.cr.aliyuncs.com/apecloud/codeshell-7b-chat:codeshell-chat-q4_0
+            command: ["sh", "-c", "cp /models/codeshell-chat-q4_0.gguf /models-target/"]
+            volumeMounts:
+              - name: models
+                mountPath: /models-target
+        containers:
+          - name: ggml
+            image: {{ .Values.imageDev.registry | default "docker.io" }}/{{ .Values.imageDev.repository}}:{{ default .Chart.AppVersion .Values.imageDev.tagCodeShell }}
+            env:
+              - name: MODEL
+                value: /models/codeshell-chat-q4_0.gguf
+            volumeMounts:
+              - name: models
+                mountPath: /models
diff --git a/deploy/llm/values.yaml b/deploy/llm/values.yaml
index 9178bc4eac2..6e7ba8d12eb 100644
--- a/deploy/llm/values.yaml
+++ b/deploy/llm/values.yaml
@@ -10,3 +10,5 @@ imageDev:
   registry: infracreate-registry.cn-zhangjiakou.cr.aliyuncs.com
   # Overrides the image tag whose default is the chart appVersion.
   tag: latest
+  tagNew: latest-new
+  tagCodeShell: latest-codeshell