# Compose service definition for the vLLM OpenAI-compatible server
# (service name: vllm-openai-8002).
vllm-openai-8002:
  # Run the container with the NVIDIA container runtime.
  runtime: nvidia
  # Use only GPU 1.
  deploy:
    resources:
      reservations:
        devices:
          # Device IDs are quoted so they stay strings rather than integers.
          - device_ids: ["1"]
            capabilities: ["gpu"]
            driver: "nvidia"
  # NOTE(review): the original text is cut off at "environment ..." — the
  # environment section (and anything after it) is not visible here and must
  # be restored from the full file; presumably it is a service-level key.
  # environment: ...