# Docker Compose stack with four services: server (uvicorn app), triton
# (Triton inference server), admin (Streamlit app), and vector (log agent).
version: '3.3'

services:
  # Runs the `app:app` ASGI application with uvicorn on port 5000.
  server:
    image: tabbyml/tabby
    container_name: tabby-server
    working_dir: /app/server
    command: uvicorn app:app --host 0.0.0.0 --port 5000
    environment:
      # Container path; matches the tokenizer volume mounted below.
      - TOKENIZER_NAME=/tokenizer
      # Hostname of the `triton` service defined in this file.
      - TRITON_HOST=triton
      # Lives under the ./logs mount that the `vector` service also mounts.
      - EVENTS_LOG_DIR=/logs/tabby-server
    ports:
      # Quoted so the mapping is always read as a string.
      - "5000:5000"
    volumes:
      - ./logs:/logs
      - ../testdata/gptneox/tokenizer:/tokenizer
    links:
      - triton
      - vector

  # Starts tritonserver under mpirun (single process) against /model.
  triton:
    image: tabbyml/fastertransformer_backend
    container_name: tabby-triton
    command: mpirun -n 1 --allow-run-as-root /opt/tritonserver/bin/tritonserver --model-repository=/model
    shm_size: 1gb
    volumes:
      # Provides the /model repository passed on the command line above.
      - ../testdata/gptneox/models:/model
    deploy:
      resources:
        reservations:
          devices:
            # Reserve every NVIDIA GPU device for this container.
            - driver: nvidia
              count: all
              capabilities: [gpu]

  # Runs the Streamlit app `Home.py` from /app/admin; same image as `server`.
  admin:
    image: tabbyml/tabby
    container_name: tabby-admin
    working_dir: /app/admin
    command: streamlit run Home.py
    ports:
      - "8501:8501"
    links:
      - server
      - triton
      - vector

  # Vector agent configured from ./config/vector.toml (mounted read-only).
  # NOTE(review): presumably ships the logs written under ./logs - confirm
  # against config/vector.toml.
  vector:
    image: timberio/vector:0.28.1-alpine
    container_name: tabby-vector
    volumes:
      - ./config/vector.toml:/etc/vector/vector.toml:ro
      - ./logs:/logs