---
# Compose stack with two services: a RabbitMQ broker and a vLLM
# OpenAI-compatible inference server.
services:
  # RabbitMQ image variant that bundles the management plugin.
  rabbitmq:
    image: rabbitmq:3-management
    ports:
      # Quoted so YAML 1.1 parsers never read digits:digits as a number.
      - "5672:5672"    # RabbitMQ's default AMQP listener port
      - "15672:15672"  # RabbitMQ's default management UI port

  # vLLM server started with the Qwen2-VL-2B-Instruct model.
  vllm:
    image: vllm/vllm-openai:latest
    command: "--model Qwen/Qwen2-VL-2B-Instruct"
    volumes:
      # Share the host's Hugging Face cache directory with the container.
      - ~/.cache/huggingface:/root/.cache/huggingface
    ports:
      # Host port 8002 forwards to container port 8000.
      - "8002:8000"
    environment:
      # Never commit the token itself. Supply it from the shell or an
      # untracked .env file; Compose aborts with this message when unset.
      # NOTE(review): the token previously hard-coded here should be
      # revoked, since it has been exposed in the file's history.
      - HUGGING_FACE_HUB_TOKEN=${HUGGING_FACE_HUB_TOKEN:?set HUGGING_FACE_HUB_TOKEN in the environment or .env}
    deploy:
      resources:
        reservations:
          devices:
            # Reserve the NVIDIA device with ID "0" for this container.
            - driver: nvidia
              device_ids: ["0"]
              capabilities: [gpu]