---
# Docker Compose definitions that run the Tabby server against a Triton
# (FasterTransformer) inference backend.
version: '3.3'

services:
  # Tabby API server, configured to use the `triton` service as model backend.
  server:
    image: tabbyml/tabby
    environment:
      - MODEL_BACKEND=triton
      - TRITON_TOKENIZER_NAME=EleutherAI/pythia-70m-deduped
    links:
      - triton

  # Only the link to `triton` is declared here.
  # NOTE(review): no image/build is given for `admin` in this file, so the rest
  # of its definition presumably comes from another compose file — confirm.
  admin:
    links:
      - triton

  # Triton inference server that loads models from the mounted /model directory.
  triton:
    image: tabbyml/fastertransformer_backend
    container_name: tabby-triton
    command: mpirun -n 1 --allow-run-as-root /opt/tritonserver/bin/tritonserver --model-repository=/model
    shm_size: 1gb
    volumes:
      # Host path is relative to this compose file; mounted as the model repo.
      - ../testdata/tiny-70M/models:/model
    deploy:
      resources:
        reservations:
          # Request every NVIDIA GPU device for this container.
          devices:
            - driver: nvidia
              count: all
              capabilities: [gpu]