---
# Docker Compose definition for the `tabby` service with an NVIDIA GPU
# reservation.
version: '3.5'

services:
  tabby:
    # NOTE(review): no `image:`/`build:` key is defined for this service here;
    # presumably it is supplied by a base Compose file this one is merged
    # with -- confirm.
    # Arguments handed to the container: serve the TabbyML/SantaCoder-1B model
    # on the CUDA device.
    command: serve --model TabbyML/SantaCoder-1B --device cuda
    deploy:
      resources:
        reservations:
          # Reserve one GPU-capable device through the NVIDIA driver.
          devices:
            - driver: nvidia
              count: 1
              capabilities: [gpu]