Skip to content

Commit

Permalink
Zarf-native create time model download
Browse files Browse the repository at this point in the history
  • Loading branch information
justinthelaw committed Sep 16, 2024
1 parent e19f892 commit 6ab0434
Show file tree
Hide file tree
Showing 2 changed files with 17 additions and 6 deletions.
10 changes: 10 additions & 0 deletions packages/vllm/zarf-config.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,10 @@
package:  # Zarf package configuration for the vLLM package
  create:  # options used when the package is created
    set:  # each key fills the matching ###ZARF_PKG_TMPL_<KEY>### placeholder in zarf.yaml
      # x-release-please-start-version
      image_version: "0.12.2"
      # x-release-please-end

      model_repo_id: "TheBloke/Synthia-7B-v2.0-GPTQ"  # HuggingFace repository ID
      model_revision: "gptq-4bit-32g-actorder_True"  # HuggingFace git branch or commit hash
      model_path: "/data/.model/"  # location of the Zarf-injected model files in the vLLM container
13 changes: 7 additions & 6 deletions packages/vllm/zarf.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -11,12 +11,13 @@ constants:
value: "###ZARF_PKG_TMPL_IMAGE_VERSION###"
- name: MODEL_REPO_ID
description: "The HuggingFace repository ID"
value: "TheBloke/Synthia-7B-v2.0-GPTQ"
value: "###ZARF_PKG_TMPL_MODEL_REPO_ID###"
- name: MODEL_REVISION
value: "gptq-4bit-32g-actorder_True"
description: "The HuggingFace git branch or commit hash"
value: "###ZARF_PKG_TMPL_MODEL_REVISION###"
- name: MODEL_PATH
description: "Location of the Zarf Injected model files"
value: "/data/.model/"
description: "Defines the location of the Zarf Injected model files in the vLLM container"
value: "###ZARF_PKG_TMPL_MODEL_PATH###"

variables:
# vLLM runtime configuration (usually influenced by .env in local development)
Expand Down Expand Up @@ -132,5 +133,5 @@ components:
# NOTE: This assumes python is installed and in $PATH and 'huggingface_hub[cli,hf_transfer]' has been installed
- cmd: "python src/model_download.py"
env:
- LFAI_REPO_ID="###ZARF_CONST_MODEL_REPO_ID###"
- LFAI_REVISION="###ZARF_CONST_MODEL_REVISION###"
- LFAI_REPO_ID=###ZARF_PKG_TMPL_MODEL_REPO_ID###
- LFAI_REVISION=###ZARF_PKG_TMPL_MODEL_REVISION###

0 comments on commit 6ab0434

Please sign in to comment.