version: '3.8'
services:
Loading actions...
Skill content
Main instructions and any bundled files for this skill.
version: '3.8'
services: letta: image: letta/letta:latest ports: - "8283:8283" environment: - LETTA_LLM_ENDPOINT=http://vllm:8000 - LETTA_LLM_ENDPOINT_TYPE=vllm - LETTA_LLM_MODEL=${LETTA_LLM_MODEL} # Replace with your model - LETTA_LLM_CONTEXT_WINDOW=8192 depends_on: - vllm
vllm: image: vllm/vllm-openai:latest runtime: nvidia deploy: resources: reservations: devices: - driver: nvidia count: all capabilities: [gpu] environment: - HUGGING_FACE_HUB_TOKEN=${HUGGING_FACE_HUB_TOKEN} volumes: - ~/.cache/huggingface:/root/.cache/huggingface ports: - "8000:8000" command: > --model ${LETTA_LLM_MODEL} --max_model_len=8000 # Replace with your model ipc: host
Related Skills
Frontend Typescript Linting.mdc
TypeScript and ESLint rules that MUST be followed when creating, modifying, or reviewing any file under apps/frontend/, including .ts, .tsx, .js, and .jsx files. Also apply when discussing frontend li...
2. Apply Deepthink Protocol (reason about dependencies
risks