Skip to content

Commit

Permalink
first commit
Browse files Browse the repository at this point in the history
  • Loading branch information
jorgeantonio21 committed Dec 26, 2024
1 parent 4d01ecb commit 327fe58
Showing 1 changed file with 6 additions and 6 deletions.
12 changes: 6 additions & 6 deletions docker-compose.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -127,7 +127,7 @@ services:
profiles: [chat_completions_vllm]
image: vllm/vllm-openai:v0.6.5
ports:
- - "${CHAT_COMPLETIONS_SERVER_PORT}:8000"
+ - "127.0.0.1:${CHAT_COMPLETIONS_SERVER_PORT}:8000"
ipc: host
command: ${VLLM_ENGINE_ARGS}

Expand All @@ -139,7 +139,7 @@ services:
context: https://github.com/atoma-network/vllm.git#main
dockerfile: Dockerfile.cpu
ports:
- - "${CHAT_COMPLETIONS_SERVER_PORT}:8000"
+ - "127.0.0.1:${CHAT_COMPLETIONS_SERVER_PORT}:8000"
command: --model ${CHAT_COMPLETIONS_MODEL} --max-model-len ${CHAT_COMPLETIONS_MAX_MODEL_LEN}

vllm-rocm:
Expand All @@ -150,7 +150,7 @@ services:
context: https://github.com/atoma-network/vllm.git#main
dockerfile: Dockerfile.rocm
ports:
- - "${CHAT_COMPLETIONS_SERVER_PORT}:8000"
+ - "127.0.0.1:${CHAT_COMPLETIONS_SERVER_PORT}:8000"
command: --model ${CHAT_COMPLETIONS_MODEL} --max-model-len ${CHAT_COMPLETIONS_MAX_MODEL_LEN} --tensor-parallel-size ${VLLM_TENSOR_PARALLEL_SIZE}

mistralrs-cpu:
Expand All @@ -161,7 +161,7 @@ services:
context: https://github.com/EricLBuehler/mistral.rs.git
dockerfile: Dockerfile
ports:
- - "${CHAT_COMPLETIONS_SERVER_PORT}:80"
+ - "127.0.0.1:${CHAT_COMPLETIONS_SERVER_PORT}:80"
command: plain -m ${CHAT_COMPLETIONS_MODEL}

tei:
Expand All @@ -170,7 +170,7 @@ services:
profiles: [embeddings_tei]
image: ${TEI_IMAGE}
ports:
- - "${EMBEDDINGS_SERVER_PORT}:80"
+ - "127.0.0.1:${EMBEDDINGS_SERVER_PORT}:80"
command: --model-id ${EMBEDDINGS_MODEL} --huggingface-hub-cache /root/.cache/huggingface/hub

mistralrs:
Expand All @@ -179,7 +179,7 @@ services:
profiles: [image_generations_mistralrs]
image: ${MISTRALRS_IMAGE}
ports:
- - "${IMAGE_GENERATIONS_SERVER_PORT}:80"
+ - "127.0.0.1:${IMAGE_GENERATIONS_SERVER_PORT}:80"
command: diffusion-plain -m ${IMAGE_GENERATIONS_MODEL} --arch ${IMAGE_GENERATIONS_ARCHITECTURE}

networks:
Expand Down

0 comments on commit 327fe58

Please sign in to comment.