Skip to content

Commit

Permalink
update worker-config
Browse files (browse the repository at this point in the history)
Signed-off-by: Ubuntu <azureuser@marut-dev-machine.zb0qmvlxdhvujimyzdkawhuxph.bx.internal.cloudapp.net>
  • Loading branch information
Ubuntu committed Jan 2, 2025
1 parent 28b54c5 commit 93d7dd7
Show file tree
Hide file tree
Showing 2 changed files with 69 additions and 1 deletion.
3 changes: 2 additions & 1 deletion builder/requirements.txt
Original file line number Diff line number Diff line change
Expand Up @@ -7,4 +7,5 @@ packaging
typing-extensions==4.7.1
pydantic
pydantic-settings
-hf-transfer
+hf-transfer
+transformers
67 changes: 67 additions & 0 deletions worker-config.json
Original file line number Diff line number Diff line change
@@ -1,5 +1,72 @@
{
"versions": {
"0.4.1": {
"imageName": "runpod/worker-sglang:v0.4.1stable",
"minimumCudaVersion": "12.1",
"categories": [
{
"title": "Model Settings",
"settings": [
"TOKENIZER_PATH",
"CONTEXT_LENGTH",
"QUANTIZATION",
"LOAD_FORMAT",
"DTYPE",
"CHAT_TEMPLATE",
"SERVED_MODEL_NAME"
]
},
{
"title": "Server Configuration",
"settings": [
"HOST",
"PORT",
"ADDITIONAL_PORTS",
"API_KEY",
"LOG_LEVEL",
"LOG_LEVEL_HTTP",
"FILE_STORAGE_PTH"
]
},
{
"title": "Performance Settings",
"settings": [
"MEM_FRACTION_STATIC",
"MAX_RUNNING_REQUESTS",
"MAX_NUM_REQS",
"MAX_TOTAL_TOKENS",
"MAX_PREFILL_TOKENS",
"CHUNKED_PREFILL_SIZE",
"STREAM_INTERVAL"
]
},
{
"title": "Parallelization Settings",
"settings": [
"TENSOR_PARALLEL_SIZE",
"DATA_PARALLEL_SIZE",
"NNODES",
"NODE_RANK",
"NCCL_INIT_ADDR"
]
},
{
"title": "Scheduling Settings",
"settings": [
"SCHEDULE_POLICY",
"SCHEDULE_CONSERVATIVENESS",
"LOAD_BALANCE_METHOD"
]
},
{
"title": "Tokenizer Settings",
"settings": [
"TOKENIZER_MODE",
"RANDOM_SEED"
]
}
]
},
"0.3.3": {
"imageName": "runpod/worker-sglang:v0.3.3stable",
"minimumCudaVersion": "12.1",
Expand Down

0 comments on commit 93d7dd7

Please sign in to comment.