# Docker Compose definition for two cooperating containers:
#   - tabby:  the application container (publishes ports 5000, 8080 and 8501)
#   - triton: the GPU inference container (fastertransformer backend image)
#
# Variables read from the shell environment / .env file at `compose up` time:
#   MODEL_NAME     - passed through to both containers
#   MODEL_REPLICA  - passed to triton; falls back to 1 when unset or empty
#   DATA_VOLUME    - complete volume entry for tabby
#   HF_VOLUME      - complete volume entry shared by tabby and triton
# NOTE(review): DATA_VOLUME / HF_VOLUME are used as whole list items, so they
# presumably expand to a full `source:target` spec - confirm against .env.
version: '3.3'

services:
  tabby:
    image: tabbyml/tabby
    container_name: tabby
    environment:
      MODEL_NAME: ${MODEL_NAME}
      # NOTE(review): presumably selects the `triton` service below as the
      # inference backend - confirm against the tabby image documentation.
      MODEL_BACKEND: triton
      LOGS_DIR: /data/logs
      DAGU_DAGS: /app/tabby/tasks
    # host:container port publications; quoted so they are always strings.
    ports:
      - "5000:5000"
      - "8080:8080"
      - "8501:8501"
    volumes:
      - ${DATA_VOLUME}
      - ${HF_VOLUME}
    # The container is reported healthy once port 5000 answers an HTTP request
    # successfully. Probes run every 2s; failures during the first 1200s
    # (20 minutes) do not count against the container.
    healthcheck:
      test: ["CMD", "curl", "-f", "http://localhost:5000"]
      interval: 2s
      timeout: 2s
      start_period: 1200s

  triton:
    image: tabbyml/fastertransformer_backend
    container_name: tabby-triton
    # Resolved via PATH to the script bind-mounted read-only under /usr/bin.
    command: triton.sh
    shm_size: 1gb
    volumes:
      - ./scripts/triton.sh:/usr/bin/triton.sh:ro
      - ${HF_VOLUME}
    # Reserve every NVIDIA GPU on the host for this container.
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: all
              capabilities: [gpu]
    environment:
      MODEL_NAME: ${MODEL_NAME}
      MODEL_REPLICA: ${MODEL_REPLICA:-1}
    # triton is started only after tabby's healthcheck passes.
    # NOTE(review): presumably tabby prepares the model files in the shared
    # HF_VOLUME before triton can load them - confirm; the ordering is
    # intentional-looking but not explained here.
    depends_on:
      tabby:
        condition: service_healthy