@ -35,7 +35,8 @@ docker run \
-p 5000:5000 \
-p 8501:8501 \
-p 8080:8080 \
-e MODEL_NAME=TabbyML/J-350M tabbyml/tabby
-e MODEL_NAME=TabbyML/J-350M \
tabbyml/tabby
```
You can then query the server using `/v1/completions` endpoint: