Skip to content

Commit

Permalink
add docker compose vllm
Browse files Browse the repository at this point in the history
  • Loading branch information
hitpoint6 committed Oct 2, 2024
1 parent 9aefad8 commit 7e6c0c5
Showing 1 changed file with 35 additions and 0 deletions.
35 changes: 35 additions & 0 deletions docker-compose-vllm.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,35 @@
# Compose stack with two services: `letta` (lettaai/letta image) and the
# `vllm` model server (vllm/vllm-openai image) that letta is pointed at.
#
# The model name appears twice (LETTA_LLM_MODEL and vLLM's --model) and the
# context size appears twice (LETTA_LLM_CONTEXT_WINDOW and --max-model-len);
# change each pair together.
version: '3.8'

services:
  letta:
    image: lettaai/letta:latest
    ports:
      - "8083:8083"
    environment:
      # Addresses the vllm service by its Compose service name.
      - LETTA_LLM_ENDPOINT=http://vllm:8000
      - LETTA_LLM_ENDPOINT_TYPE=vllm
      # Replace with your model; keep in sync with --model on the vllm service.
      - LETTA_LLM_MODEL=teknium/OpenHermes-2-Mistral-7B
      # Must not exceed vLLM's --max-model-len (8000 below); a larger value
      # would let the client build prompts the server rejects.
      # NOTE(review): assumes Letta treats this as the model's token budget;
      # confirm against the Letta settings documentation.
      - LETTA_LLM_CONTEXT_WINDOW=8000
    depends_on:
      # Short-form depends_on only orders container start-up; it does not
      # wait for the model server to finish loading.
      - vllm

  vllm:
    image: vllm/vllm-openai:latest
    # GPU access is requested both through the nvidia runtime and through a
    # device reservation for every available GPU.
    runtime: nvidia
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: all
              capabilities: [gpu]
    environment:
      # Interpolated by Compose from the invoking shell or a .env file.
      - HUGGING_FACE_HUB_TOKEN=${HUGGING_FACE_HUB_TOKEN}
    volumes:
      # Shares the host's Hugging Face cache directory with the container.
      - ~/.cache/huggingface:/root/.cache/huggingface
    ports:
      - "8000:8000"
    # Replace with your model; keep in sync with LETTA_LLM_MODEL above.
    # The note lives outside the block scalar on purpose: inside a folded
    # scalar a `#` line is literal text and would be passed to vLLM as
    # extra command-line arguments.
    command: >-
      --model teknium/OpenHermes-2-Mistral-7B
      --max-model-len 8000
    # Use the host IPC namespace (shared memory) for the container.
    ipc: host

0 comments on commit 7e6c0c5

Please sign in to comment.