# Agent Mai Vault — vLLM OpenAI-compatible API (GPU required)
services:
  # Single-GPU vLLM server exposing the OpenAI-compatible HTTP API.
  agent-mai-engine:
    # NOTE(review): `latest` floats between pulls; pin a tested release tag
    # for reproducible deployments.
    image: vllm/vllm-openai:latest
    # Arguments passed to the image's entrypoint (the vLLM API server).
    command:
      - --model
      - mistralai/Mistral-Small-Instruct-2409
      # Must match the number of GPUs reserved under `deploy` below.
      - --tensor-parallel-size
      - "1"
    environment:
      # Pass the host's Hugging Face token through (left unset if the host
      # has none). The model repo is gated on the Hub at the time of writing,
      # so the weight download is rejected without a token.
      - HF_TOKEN
    volumes:
      # Keep downloaded weights on the host so recreating the container does
      # not re-download the model.
      - "~/.cache/huggingface:/root/.cache/huggingface"
    # vLLM (via PyTorch) uses shared memory between processes; the vLLM Docker
    # docs recommend host IPC (or a larger `shm_size`) instead of the small
    # default /dev/shm.
    ipc: host
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: 1
              capabilities: [gpu]
    ports:
      # Published on all host interfaces. No `--api-key` is configured above,
      # so restrict access at the network level if the host is reachable by
      # untrusted clients.
      - "8000:8000"
