Revert stop words implementation in python

#33
2023-03-30 14:52:04 +08:00 · 2023-03-30 14:52:04 +08:00 · 78280d44bf
parent bfcdfd5b7e
commit 78280d44bf
1 changed files with 0 additions and 41 deletions
--- a/tabby/server/backend/python.py
+++ b/tabby/server/backend/python.py
@ -40,66 +40,25 @@ class PythonModelService:
            .to(device)
            .eval()
        )
        self.stopping_criteria_mappings = {}
    def generate(self, request: CompletionRequest) -> List[Choice]:
        # FIXME(meng): read preset from request.
        preset_name = "python"
        preset = LanguagePresets[preset_name]
        stopping_criteria_list = self.stopping_criteria_for_preset(preset_name)
        input_ids = self.tokenizer.encode(request.prompt, return_tensors="pt").to(
            self.device
        )
        res = self.model.generate(
            input_ids,
            max_length=preset.max_length,
            stopping_criteria=stopping_criteria_list,
        )
        output_ids = res[0][len(input_ids[0]) :]
        text = trim_with_stopwords(self.tokenizer.decode(output_ids), preset.stop_words)
        return [Choice(index=0, text=text)]
    def stopping_criteria_for_preset(self, name: str) -> StoppingCriteriaList:
        return StoppingCriteriaList(
            [
                StopWordsIdsCriteria(
                    [self.tokenizer.encode(x) for x in LanguagePresets[name].stop_words]
                )
            ]
        )
    def __call__(self, request: CompletionRequest) -> CompletionResponse:
        choices = self.generate(request)
        return CompletionResponse(
            id=random_completion_id(), created=int(time.time()), choices=choices
        )
 class StopWordsIdsCriteria(StoppingCriteria):
    def __init__(self, stop_words_ids: List[str]):
        self.stop_words_ids = stop_words_ids
    def __call__(
        self, input_ids: torch.LongTensor, scores: torch.FloatTensor, **kwargs
    ) -> bool:
        if len(input_ids) != 1:
            raise ValueError("Only 1-length list is handled")
        # FIXME(meng): trie based lookup.
        tokens = input_ids[0]
        for stop_word in self.stop_words_ids:
            if len(tokens) < len(stop_word):
                continue
            matched = True
            for i in range(len(stop_word)):
                if tokens[i - len(stop_word)] != stop_word[i]:
                    matched = False
                    break
            if matched:
                return True
        return False