feat(experimental): update tabby.py to use debug_options.raw_prompt

2023-10-21 17:27:43 -07:00 · 2023-10-21 17:27:43 -07:00 · 2dcb5599b3
parent 1d31b33ccc
commit 2dcb5599b3
2 changed files with 36 additions and 23 deletions
--- a/experimental/eval/output.jsonl
+++ b/experimental/eval/output.jsonl
--- a/experimental/eval/tabby.py
+++ b/experimental/eval/tabby.py
@ -1,18 +1,12 @@
 from pathlib import Path

+import modal
 from modal import Image, Mount, Secret, Stub, asgi_app, gpu, method

 GPU_CONFIG = gpu.T4()
 MODEL_ID = "TabbyML/StarCoder-1B"
-LAUNCH_FLAGS = [
-    "serve",
-    "--model",
-    MODEL_ID,
-    "--port",
-    "8000",
-    "--device",
-    "cuda"
-]
+LAUNCH_FLAGS = ["serve", "--model", MODEL_ID, "--port", "8000", "--device", "cuda"]
+

 def download_model():
    import subprocess
@ -28,10 +22,15 @@ def download_model():


 image = (
-        Image.from_registry("tabbyml/tabby:0.3.0", add_python="3.11")
-        .dockerfile_commands("ENTRYPOINT []")
-        .run_function(download_model)
-        .pip_install("git+https://github.com/TabbyML/tabby.git#egg=tabby-python-client&subdirectory=clients/tabby-python-client")
+    Image.from_registry(
+        "tabbyml/tabby@sha256:64d71ec4c7d9ae7269e6301ad4106baad70ee997408691a6af17d7186283a856",
+        add_python="3.11",
+    )
+    .dockerfile_commands("ENTRYPOINT []")
+    .run_function(download_model)
+    .pip_install(
+        "git+https://github.com/TabbyML/tabby.git#egg=tabby-python-client&subdirectory=experimental/eval/tabby-python-client"
+    )
 )

 stub = Stub("tabby-" + MODEL_ID.split("/")[-1], image=image)
@ -49,11 +48,9 @@ class Model:
        import subprocess
        import time

-        from tabby_client import Client
+        from tabby_python_client import Client

-        self.launcher = subprocess.Popen(
-            ["/opt/tabby/bin/tabby"] + LAUNCH_FLAGS
-        )
+        self.launcher = subprocess.Popen(["/opt/tabby/bin/tabby"] + LAUNCH_FLAGS)
        self.client = Client("http://127.0.0.1:8000")

        # Poll until webserver at 127.0.0.1:8000 accepts connections before running inputs.
@ -79,15 +76,29 @@ class Model:
    def __exit__(self, _exc_type, _exc_value, _traceback):
        self.launcher.terminate()

+    @method()
+    async def health(self):
+        from tabby_python_client.api.v1 import health
+
+        resp = await health.asyncio(client=self.client)
+        return resp.to_dict()
+
    @method()
    async def complete(self, language: str, prompt: str):
-        from tabby_client.api.v1 import completion
-        from tabby_client.models import CompletionRequest, DebugOptions, CompletionResponse, Segments
+        from tabby_python_client.api.v1 import completion
+        from tabby_python_client.models import (
+            CompletionRequest,
+            DebugOptions,
+            CompletionResponse,
+            Segments,
+        )

        request = CompletionRequest(
            language=language, debug_options=DebugOptions(raw_prompt=prompt)
        )
-        resp: CompletionResponse = await completion.asyncio(client=self.client, json_body=request)
+        resp: CompletionResponse = await completion.asyncio(
+            client=self.client, json_body=request
+        )
        return resp.choices[0].text


@ -96,12 +107,14 @@ def main():
    import json

    model = Model()
+    print(model.health.remote())
+
    with open("./output.jsonl", "w") as fout:
        with open("./sample.jsonl") as fin:
            for line in fin:
                x = json.loads(line)
-                prompt = x['crossfile_context']['text'] + x['prompt']
-                label = x['groundtruth']
+                prompt = x["crossfile_context"]["text"] + x["prompt"]
+                label = x["groundtruth"]
                prediction = model.complete.remote("python", prompt)

                json.dump(dict(prompt=prompt, label=label, prediction=prediction), fout)