-
Notifications
You must be signed in to change notification settings - Fork 29
/
zarf.yaml
68 lines (64 loc) · 2.12 KB
/
zarf.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
# yaml-language-server: $schema=https://raw.githubusercontent.com/defenseunicorns/uds-cli/v0.16.0/zarf.schema.json
# Zarf package definition for the text-embeddings model.
kind: ZarfPackageConfig
metadata:
  name: text-embeddings
  # Must stay quoted: an unquoted value beginning with '#' would be read as a
  # YAML comment, leaving the key empty. The ###ZARF_PKG_TMPL_*### token is a
  # package-template placeholder that is substituted when the package is built.
  version: "###ZARF_PKG_TMPL_IMAGE_VERSION###"
  description: >
    text embeddings model
# Package constants: IMAGE_VERSION carries the same templated version string
# that metadata.version uses.
constants:
  - name: IMAGE_VERSION
    # Quoted for the same reason as metadata.version (leading '#').
    value: "###ZARF_PKG_TMPL_IMAGE_VERSION###"
# Package variables. Each entry has a default; where a `pattern` is given it
# is a regular expression describing the accepted values.
variables:
  - name: GPU_LIMIT
    description: The GPU limit for the model inferencing.
    # Kept as a string so the digits-only pattern applies to the literal text.
    default: "0"
    pattern: "^[0-9]+$"
  - name: GPU_RUNTIME
    description: The GPU class name for the model inferencing. Leave blank for CPU-only.
    default: ""
    # Matches only the empty string or exactly "nvidia".
    pattern: "^(nvidia)?$"
  - name: PVC_SIZE
    description: Size of the PVC used for model storage.
    default: "15Gi"
    # One or more digits followed by one or more letters (e.g. "15Gi").
    pattern: "^[0-9]+[a-zA-Z]+$"
  - name: PVC_ACCESS_MODE
    description: Access mode of the PVC used for model storage.
    default: "ReadWriteOnce"
    pattern: "^(ReadWriteOnce|ReadOnlyMany|ReadWriteMany)$"
  - name: PVC_STORAGE_CLASS
    description: Storage class of the PVC used for model storage.
    # No pattern is declared for this variable, so its value is not constrained here.
    default: "local-path"
# Single required component: the chart, the images it needs, the model data
# injection, and the create-time action that fetches the model.
components:
  - name: text-embeddings-model
    required: true
    # Restricts this component to the "upstream" flavor.
    only:
      flavor: upstream
    charts:
      - name: text-embeddings-model
        namespace: leapfrogai
        localPath: chart
        releaseName: text-embeddings-model
        # x-release-please-start-version
        version: 0.14.0
        # x-release-please-end
        valuesFiles:
          - "values/upstream-values.yaml"
    images:
      # Quoted for consistency with the other templated values in this file.
      - "ghcr.io/defenseunicorns/leapfrogai/text-embeddings:###ZARF_PKG_TMPL_IMAGE_VERSION###"
      # NOTE(review): `latest` is a mutable tag, so rebuilt packages may pick up
      # a different image. Pinning needs a matching change wherever the chart
      # references this image, so it is left unchanged here.
      - cgr.dev/chainguard/bash:latest
    dataInjections:
      # Copies the local .model/ directory to /data/.model in the `data-loader`
      # container of pods matching the selector below.
      # NOTE(review): presumably .model/ is produced by the model_download.py
      # action further down - confirm against the script.
      - source: .model/
        target:
          namespace: leapfrogai
          selector: app=lfai-text-embeddings
          container: data-loader
          path: /data/.model
        compress: true
    actions:
      onCreate:
        before:
          # NOTE: This assumes python is installed and in $PATH and 'huggingface_hub[cli,hf_transfer]' has been installed
          - cmd: python scripts/model_download.py
            # REVISION pins the model repository to a specific commit hash.
            env:
              - REPO_ID=hkunlp/instructor-xl
              - REVISION=ce48b213095e647a6c3536364b9fa00daf57f436