---
# Compose settings that run the `tabby` service against the Triton model
# backend with NVIDIA GPU access.
# NOTE(review): no `image`/`build` is defined for `tabby` here, so this file is
# presumably layered on top of a base Compose file (`-f base -f this`) — confirm.
version: '3.3'

services:
  tabby:
    # Size of the container's shared-memory mount (/dev/shm).
    shm_size: 1gb

    environment:
      MODEL_BACKEND: triton
      # Taken from the invoking shell / .env file; falls back to 1 when
      # MODEL_REPLICA is unset or empty.
      MODEL_REPLICA: "${MODEL_REPLICA:-1}"

    deploy:
      resources:
        reservations:
          devices:
            # Reserve every NVIDIA GPU available on the host for this service.
            - driver: nvidia
              count: all
              capabilities: [gpu]