-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy path.drone.yml
143 lines (133 loc) · 3.52 KB
/
.drone.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
# Pipeline 1 of 3: builds Dockerfile.runner with no build_args and tags the
# result with the "-empty" suffix in the registry.helix.ml/helix/runner-base
# repository.
kind: pipeline
type: docker
name: build-runner-base-empty

# Host Docker socket, mounted into the build step below.
volumes:
  - name: dockersocket
    host:
      path: /var/run/docker.sock

steps:
  - name: publish-runner
    image: plugins/docker
    pull: always
    environment:
      HF_TOKEN:
        from_secret: HF_TOKEN
    volumes:
      - name: dockersocket
        path: /var/run/docker.sock
    settings:
      daemon_off: true
      dockerfile: Dockerfile.runner
      registry: registry.helix.ml
      repo: registry.helix.ml/helix/runner-base
      username: admin
      password:
        from_secret: helix_registry_password
      # Build secret "HF_TOKEN", sourced from the HF_TOKEN environment
      # variable defined on this step.
      secret: id=HF_TOKEN,env=HF_TOKEN
      tags:
        - "${DRONE_TAG:-main}-empty"  # falls back to the branch name (main)
        - "latest-empty"
    when:
      branch:
        - main
      event:
        # Tag events only: the usual "merge to main, then tag immediately"
        # flow would otherwise kick off two huge builds at the same time.
        # NOTE: this filter is repeated in all 3 pipelines in this file;
        # keep them in sync when changing it.
        - tag
        # - push
---
# Pipeline 2 of 3: builds Dockerfile.runner with a single small Ollama model
# baked in and tags the result with the "-small" suffix.
kind: pipeline
type: docker
name: build-runner-base-small

# Starts only after the "empty" pipeline has run.
depends_on:
  - build-runner-base-empty

# Host Docker socket, mounted into the build step below.
volumes:
  - name: dockersocket
    host:
      path: /var/run/docker.sock

steps:
  - name: publish-runner
    image: plugins/docker
    pull: always
    environment:
      HF_TOKEN:
        from_secret: HF_TOKEN
    volumes:
      - name: dockersocket
        path: /var/run/docker.sock
    settings:
      daemon_off: true
      dockerfile: Dockerfile.runner
      registry: registry.helix.ml
      repo: registry.helix.ml/helix/runner-base
      username: admin
      password:
        from_secret: helix_registry_password
      # Build secret "HF_TOKEN", sourced from the HF_TOKEN environment
      # variable defined on this step.
      secret: id=HF_TOKEN,env=HF_TOKEN
      build_args:
        # Small models only
        - PULL_OLLAMA_MODELS=llama3.1:8b-instruct-q8_0
      tags:
        - "${DRONE_TAG:-main}-small"  # falls back to the branch name (main)
        - "latest-small"
    when:
      branch:
        - main
      event:
        # Tag events only: the usual "merge to main, then tag immediately"
        # flow would otherwise kick off two huge builds at the same time.
        - tag
        # - push
---
# Pipeline 3 of 3: builds Dockerfile.runner with the full set of Ollama models
# plus the Flux diffusers model, and tags the result with the "-large" suffix.
kind: pipeline
type: docker
name: build-runner-base-large

# Starts only after the "small" pipeline has run.
depends_on:
  - build-runner-base-small

# Host Docker socket, mounted into the build step below.
volumes:
  - name: dockersocket
    host:
      path: /var/run/docker.sock

steps:
  - name: publish-runner
    image: plugins/docker
    pull: always
    environment:
      HF_TOKEN:
        from_secret: HF_TOKEN
    volumes:
      - name: dockersocket
        path: /var/run/docker.sock
    settings:
      daemon_off: true
      dockerfile: Dockerfile.runner
      registry: registry.helix.ml
      repo: registry.helix.ml/helix/runner-base
      username: admin
      password:
        from_secret: helix_registry_password
      # Build secret "HF_TOKEN", sourced from the HF_TOKEN environment
      # variable defined on this step.
      secret: id=HF_TOKEN,env=HF_TOKEN
      build_args:
        # Models we are confident in keeping for a long time go into one big
        # base layer. Models that may change more often get smaller layers
        # (the PHASE_n args) on top, so they can be added to without churning
        # the 100GB base.
        - PULL_OLLAMA_MODELS=llama3.1:8b-instruct-q8_0;llama3.3:70b-instruct-q4_K_M;llama3.2:1b-instruct-q8_0;llama3.2:3b-instruct-q8_0
        - PULL_OLLAMA_MODELS_PHASE_2=phi3.5:3.8b-mini-instruct-q8_0
        - PULL_OLLAMA_MODELS_PHASE_3=qwen2.5:7b-instruct-q8_0
        - PULL_OLLAMA_MODELS_PHASE_4=aya:8b-23-q8_0;aya:35b-23-q4_0
        # Stable Diffusion is disabled for now: it is not better than Flux and
        # we are trying to minimize disk usage.
        # - PULL_DIFFUSERS_MODELS_STABLEDIFFUSION=true
        - PULL_DIFFUSERS_MODELS_FLUX=true
      tags:
        - "${DRONE_TAG:-main}-large"
        - "latest-large"
    when:
      branch:
        - main
      event:
        # Tag events only: the usual "merge to main, then tag immediately"
        # flow would otherwise kick off two huge builds at the same time.
        - tag
        # - push