tabby/crates/ctranslate2-bindings/src/lib.rs

use async_trait::async_trait;
use dashmap::DashMap;
use derive_builder::Builder;
use regex::Regex;
use tabby_inference::{TextGeneration, TextGenerationOptions};
use tokenizers::tokenizer::Tokenizer;
use tokio_util::sync::CancellationToken;

// FFI bridge (generated by `cxx`) between this crate and the C++ inference engine.
// Every item declared here lives in the C++ namespace `tabby`.
#[cxx::bridge(namespace = "tabby")]
mod ffi {
    extern "Rust" {
        // Rust-defined type made visible to C++ as an opaque type. C++ receives it boxed
        // through `inference` and passes it back to the callback as `&mut`.
        type InferenceContext;
    }

    unsafe extern "C++" {
        include!("ctranslate2-bindings/include/ctranslate2.h");

        // Opaque C++ engine type; only ever handled through `SharedPtr` on the Rust side.
        type TextInferenceEngine;

        // Constructs an engine from the given model/device settings. All arguments are
        // forwarded as-is; their accepted values are defined by the C++ side.
        fn create_engine(
            model_path: &str,
            model_type: &str,
            device: &str,
            compute_type: &str,
            device_indices: &[i32],
            num_replicas_per_device: usize,
        ) -> SharedPtr<TextInferenceEngine>;

        // Runs generation for the prompt `tokens` and returns the generated token ids.
        //
        // `context` is handed over to C++ by value (boxed) and is passed to `callback`
        // together with the step, token id and token text.
        // NOTE(review): the Rust callback returns `true` on cancellation or a stop-word
        // match, so `true` presumably means "stop decoding" — confirm against the C++ side.
        fn inference(
            &self,
            context: Box<InferenceContext>,
            callback: fn(
                &mut InferenceContext,
                // step
                usize,
                // token_id
                u32,
                // token
                String,
            ) -> bool,
            tokens: &[String],
            max_decoding_length: usize,
            sampling_temperature: f32,
        ) -> Vec<u32>;
    }
}

// The engine handle is cloned and moved into a `spawn_blocking` task by `generate`, which
// requires the pointee to be `Send + Sync`.
// SAFETY: NOTE(review) — these impls assert that the C++ `TextInferenceEngine` may be used
// from several threads at once through a shared pointer. That property is provided by the
// C++ implementation and cannot be verified from this file; confirm before changing it.
unsafe impl Send for ffi::TextInferenceEngine {}
unsafe impl Sync for ffi::TextInferenceEngine {}

/// Settings consumed by [`CTranslate2Engine::create`].
///
/// All fields are private; values are supplied through the builder generated by the
/// `Builder` derive.
#[derive(Builder, Debug)]
pub struct CTranslate2EngineOptions {
    /// Model location, forwarded unchanged to the C++ `create_engine`.
    model_path: String,

    /// Model kind, forwarded unchanged to the C++ `create_engine`.
    model_type: String,

    /// Path of the tokenizer file loaded with `Tokenizer::from_file`.
    tokenizer_path: String,

    /// Device name, forwarded unchanged to the C++ `create_engine`.
    device: String,

    /// Device indices, forwarded unchanged to the C++ `create_engine`.
    device_indices: Vec<i32>,

    /// Replica count per device, forwarded unchanged to the C++ `create_engine`.
    num_replicas_per_device: usize,

    /// Compute type, forwarded unchanged to the C++ `create_engine`.
    compute_type: String,

    /// Number of leading tokens to drop from each stop word's encoding when the stop
    /// regex is built; `None` is treated as `0`.
    stop_words_encoding_offset: Option<usize>,
}

/// Per-request state handed to the C++ engine and passed back to the decoding callback
/// on every generated token.
pub struct InferenceContext {
    /// Pattern matched against `reversed_output_text`; `None` when the request has no
    /// stop words.
    stop_re: Option<Regex>,
    /// Token the callback polls to learn that the request was abandoned.
    cancel: CancellationToken,
    /// Text generated so far, stored back to front: the most recent token comes first.
    reversed_output_text: String,
}

impl InferenceContext {
    /// Builds a context with no generated text accumulated yet.
    fn new(stop_re: Option<Regex>, cancel: CancellationToken) -> Self {
        let reversed_output_text = String::new();
        Self {
            stop_re,
            cancel,
            reversed_output_text,
        }
    }
}

/// Text generation engine backed by the C++ `TextInferenceEngine`.
pub struct CTranslate2Engine {
    /// Shared handle to the C++ engine; cloned for each blocking inference task.
    engine: cxx::SharedPtr<ffi::TextInferenceEngine>,
    /// Tokenizer used to encode prompts and stop words and to decode generated ids.
    tokenizer: Tokenizer,
    /// Compiled stop regexes, keyed by the stop-word list they were built from.
    stop_regex_cache: DashMap<&'static Vec<&'static str>, Regex>,
    /// Number of leading tokens dropped from each stop word's encoding; `None` means `0`.
    stop_words_encoding_offset: Option<usize>,
}

impl CTranslate2Engine {
    /// Creates the C++ engine and loads the tokenizer described by `options`.
    ///
    /// The stop-regex cache starts empty and is filled lazily by `generate`.
    ///
    /// # Panics
    ///
    /// Panics if the tokenizer file at `options.tokenizer_path` cannot be loaded.
    pub fn create(options: CTranslate2EngineOptions) -> Self {
        let engine = ffi::create_engine(
            &options.model_path,
            &options.model_type,
            &options.device,
            &options.compute_type,
            &options.device_indices,
            options.num_replicas_per_device,
        );

        // Name the offending path in the panic so a misconfigured model directory is
        // diagnosable from the message alone.
        let tokenizer = Tokenizer::from_file(&options.tokenizer_path).unwrap_or_else(|err| {
            panic!(
                "failed to load tokenizer from `{}`: {}",
                options.tokenizer_path, err
            )
        });

        Self {
            engine,
            tokenizer,
            stop_regex_cache: DashMap::new(),
            stop_words_encoding_offset: options.stop_words_encoding_offset,
        }
    }
}

#[async_trait]
impl TextGeneration for CTranslate2Engine {
    /// Generates a completion for `prompt` and returns it as decoded text.
    ///
    /// The prompt is tokenized, inference runs on a blocking task so the async executor is
    /// not stalled, and the returned token ids are decoded back into a string. When
    /// `options.stop_words` is non-empty, a stop regex (compiled once per stop-word list
    /// and cached) is handed to the decoding callback.
    ///
    /// # Panics
    ///
    /// Panics if the prompt cannot be encoded, if the blocking inference task fails to
    /// complete, or if the generated ids cannot be decoded.
    async fn generate(&self, prompt: &str, options: TextGenerationOptions) -> String {
        let encoding = self.tokenizer.encode(prompt, true).unwrap();
        let engine = self.engine.clone();

        // `_guard` cancels the token when it is dropped, i.e. when this future finishes
        // or is dropped early; the decoding callback polls the cloned token.
        let cancel = CancellationToken::new();
        let cancel_for_inference = cancel.clone();
        let _guard = cancel.drop_guard();

        let stop_re: Option<Regex> = if options.stop_words.is_empty() {
            None
        } else {
            // The entry API performs the lookup and the insert-on-miss as one operation,
            // so concurrent requests never compile the same regex twice. The map guard is
            // a temporary of this statement and is released before any `.await`.
            let compiled = self
                .stop_regex_cache
                .entry(options.stop_words)
                .or_insert_with(|| {
                    create_stop_regex(
                        &self.tokenizer,
                        options.stop_words,
                        self.stop_words_encoding_offset,
                    )
                })
                .value()
                .clone();
            Some(compiled)
        };

        let context = InferenceContext::new(stop_re, cancel_for_inference);
        let output_ids = tokio::task::spawn_blocking(move || {
            let context = Box::new(context);
            engine.inference(
                context,
                inference_callback,
                encoding.get_tokens(),
                options.max_decoding_length,
                options.sampling_temperature,
            )
        })
        .await
        .expect("Inference failed");
        self.tokenizer.decode(output_ids, true).unwrap()
    }
}

/// Callback invoked by the engine for every generated token.
///
/// Returns `true` when the request has been cancelled or when the text generated so far
/// matches the stop regex, and `false` otherwise. With no stop regex configured the
/// token is not recorded at all.
fn inference_callback(
    context: &mut InferenceContext,
    _step: usize,
    _token_id: u32,
    token: String,
) -> bool {
    // Cancellation takes priority and skips all bookkeeping.
    if context.cancel.is_cancelled() {
        return true;
    }

    match &context.stop_re {
        None => false,
        Some(stop_re) => {
            // The output is kept reversed, so the newest token goes in front.
            let mut updated = reverse(&token);
            updated.push_str(&context.reversed_output_text);
            context.reversed_output_text = updated;
            stop_re.is_match(&context.reversed_output_text)
        }
    }
}

/// Returns `s` with its characters in reverse order.
///
/// Byte fallback tokens (six bytes shaped like `<0x0A>`, see
/// https://github.com/huggingface/tokenizers/blob/main/tokenizers/src/decoders/byte_fallback.rs)
/// are returned unchanged. This has no real effect on the stop-word regex logic; it only
/// keeps such tokens readable when debugging decoding steps.
///
/// The parameter stays `&String` because the function is passed point-free to an
/// iterator over `&String` items.
fn reverse(s: &String) -> String {
    let is_byte_fallback = s.len() == 6 && s.starts_with("<0x") && s.ends_with('>');
    if is_byte_fallback {
        return s.clone();
    }
    s.chars().rev().collect()
}

fn create_stop_regex(
    tokenizer: &Tokenizer,
    stop_words: &[&str],
    stop_words_encoding_offset: Option<usize>,
) -> Regex {
    let encodings = tokenizer
        .encode_batch(stop_words.to_owned(), false)
        .unwrap();
    let stop_tokens: Vec<String> = encodings
        .iter()
        .map(|x| {
            x.get_tokens()[stop_words_encoding_offset.unwrap_or(0)..]
                .iter()
                .rev()
                .map(reverse)
                .collect::<Vec<String>>()
                .join("")
        })
        .collect();

    // (?m) enables multi-line matching mode.
    // \A means absolute begins of string.
    let regex_string = r"(?m)\A".to_owned() + &stop_tokens.join("|");
    Regex::new(&regex_string).unwrap()
}
refactor: extract TextGeneration trait (#324) * add tabby-inference * extract TextGeneration trait * format * Rename TextInferenceEngine to CTranslate2Engine 2023-08-02 06:12:51 +00:00			`use async_trait::async_trait;`
feat: support stop sequences [TAB-52] (#212) * refactor: pass step and string token to callback * add token to callback * add stop regexp * implement stop words logic * pass token_ids from inference * improve effiency of regexp match with reversed regex * fmt * add typescript and javascript stop words * add cache for stop words regexp 2023-06-06 23:28:58 +00:00			`use dashmap::DashMap;`
refactor: extract TextGeneration trait (#324) * add tabby-inference * extract TextGeneration trait * format * Rename TextInferenceEngine to CTranslate2Engine 2023-08-02 06:12:51 +00:00			`use derive_builder::Builder;`
feat: support stop sequences [TAB-52] (#212) * refactor: pass step and string token to callback * add token to callback * add stop regexp * implement stop words logic * pass token_ids from inference * improve effiency of regexp match with reversed regex * fmt * add typescript and javascript stop words * add cache for stop words regexp 2023-06-06 23:28:58 +00:00			`use regex::Regex;`
refactor: extract TextGeneration trait (#324) * add tabby-inference * extract TextGeneration trait * format * Rename TextInferenceEngine to CTranslate2Engine 2023-08-02 06:12:51 +00:00			`use tabby_inference::{TextGeneration, TextGenerationOptions};`
Switch to sccache (#154) * fix fmt * fix * fix test * fix clippy * switch to sc cache * fix * update * update * update * fix * add test * remove clippy * update * disable incremental * update * simply 2023-05-27 23:20:17 +00:00			`use tokenizers::tokenizer::Tokenizer;`
refactor: extract TextInferenceEngineImpl to reduce duplications between EncoderDecoderImpl and DecoderImpl #189 2023-06-04 22:28:39 +00:00			`use tokio_util::sync::CancellationToken;`
add ctranslate2-bindings / tabby rust packages (#146) * add ctranslate2-bindings * add fixme for linux build * turn off shared lib * add tabby-cli 2023-05-25 21:05:28 +00:00
			`#[cxx::bridge(namespace = "tabby")]`
			`mod ffi {`
refactor: extract TextInferenceEngineImpl to reduce duplications between EncoderDecoderImpl and DecoderImpl #189 2023-06-04 22:28:39 +00:00			`extern "Rust" {`
			`type InferenceContext;`
			`}`

add ctranslate2-bindings / tabby rust packages (#146) * add ctranslate2-bindings * add fixme for linux build * turn off shared lib * add tabby-cli 2023-05-25 21:05:28 +00:00			`unsafe extern "C++" {`
			`include!("ctranslate2-bindings/include/ctranslate2.h");`

			`type TextInferenceEngine;`

feat: support cuda devices in rust tabby (#149) 2023-05-26 06:23:07 +00:00			`fn create_engine(`
			`model_path: &str,`
Support causal lm (decoder only model) (#151) * support * support causal lm 2023-05-27 08:26:33 +00:00			`model_type: &str,`
feat: support cuda devices in rust tabby (#149) 2023-05-26 06:23:07 +00:00			`device: &str,`
feat: support set compute_type through commandline arguments 2023-06-13 19:04:07 +00:00			`compute_type: &str,`
feat: support cuda devices in rust tabby (#149) 2023-05-26 06:23:07 +00:00			`device_indices: &[i32],`
			`num_replicas_per_device: usize,`
chore: mark thread safety [TAB-52] (#186) * mark thread safety * use shared_ptr to ensure thread safety * fmt 2023-06-04 06:23:31 +00:00			`) -> SharedPtr<TextInferenceEngine>;`
feat: support cuda devices in rust tabby (#149) 2023-05-26 06:23:07 +00:00
add ctranslate2-bindings / tabby rust packages (#146) * add ctranslate2-bindings * add fixme for linux build * turn off shared lib * add tabby-cli 2023-05-25 21:05:28 +00:00			`fn inference(`
			`&self,`
refactor: extract TextInferenceEngineImpl to reduce duplications between EncoderDecoderImpl and DecoderImpl #189 2023-06-04 22:28:39 +00:00			`context: Box<InferenceContext>,`
feat: support stop sequences [TAB-52] (#212) * refactor: pass step and string token to callback * add token to callback * add stop regexp * implement stop words logic * pass token_ids from inference * improve effiency of regexp match with reversed regex * fmt * add typescript and javascript stop words * add cache for stop words regexp 2023-06-06 23:28:58 +00:00			`callback: fn(`
			`&mut InferenceContext,`
			`// step`
			`usize,`
			`// token_id`
			`u32,`
			`// token`
			`String,`
			`) -> bool,`
add ctranslate2-bindings / tabby rust packages (#146) * add ctranslate2-bindings * add fixme for linux build * turn off shared lib * add tabby-cli 2023-05-25 21:05:28 +00:00			`tokens: &[String],`
			`max_decoding_length: usize,`
			`sampling_temperature: f32,`
feat: support stop sequences [TAB-52] (#212) * refactor: pass step and string token to callback * add token to callback * add stop regexp * implement stop words logic * pass token_ids from inference * improve effiency of regexp match with reversed regex * fmt * add typescript and javascript stop words * add cache for stop words regexp 2023-06-06 23:28:58 +00:00			`) -> Vec<u32>;`
add ctranslate2-bindings / tabby rust packages (#146) * add ctranslate2-bindings * add fixme for linux build * turn off shared lib * add tabby-cli 2023-05-25 21:05:28 +00:00			`}`
			`}`

chore: mark thread safety [TAB-52] (#186) * mark thread safety * use shared_ptr to ensure thread safety * fmt 2023-06-04 06:23:31 +00:00			`unsafe impl Send for ffi::TextInferenceEngine {}`
			`unsafe impl Sync for ffi::TextInferenceEngine {}`

chore: remove unused lock 2023-05-26 07:06:08 +00:00			`#[derive(Builder, Debug)]`
refactor: extract TextGeneration trait (#324) * add tabby-inference * extract TextGeneration trait * format * Rename TextInferenceEngine to CTranslate2Engine 2023-08-02 06:12:51 +00:00			`pub struct CTranslate2EngineOptions {`
feat: support cuda devices in rust tabby (#149) 2023-05-26 06:23:07 +00:00			`model_path: String,`

Support causal lm (decoder only model) (#151) * support * support causal lm 2023-05-27 08:26:33 +00:00			`model_type: String,`

feat: support cuda devices in rust tabby (#149) 2023-05-26 06:23:07 +00:00			`tokenizer_path: String,`

			`device: String,`

			`device_indices: Vec<i32>,`

			`num_replicas_per_device: usize,`
feat: support set compute_type through commandline arguments 2023-06-13 19:04:07 +00:00
			`compute_type: String,`
feat: add stop words encoding offset for ctranslate model config (#371) * feat: add stop words encoding offset for ctranslate model config * feat: set default suffix to \n * add special treatment for bytefallback tokens 2023-08-28 06:07:01 +00:00
			`stop_words_encoding_offset: Option<usize>,`
feat: support cuda devices in rust tabby (#149) 2023-05-26 06:23:07 +00:00			`}`

feat: support stop sequences [TAB-52] (#212) * refactor: pass step and string token to callback * add token to callback * add stop regexp * implement stop words logic * pass token_ids from inference * improve effiency of regexp match with reversed regex * fmt * add typescript and javascript stop words * add cache for stop words regexp 2023-06-06 23:28:58 +00:00			`pub struct InferenceContext {`
			`stop_re: Option<Regex>,`
			`cancel: CancellationToken,`
			`reversed_output_text: String,`
			`}`

			`impl InferenceContext {`
			`fn new(stop_re: Option<Regex>, cancel: CancellationToken) -> Self {`
			`InferenceContext {`
			`stop_re,`
			`cancel,`
			`reversed_output_text: "".to_owned(),`
			`}`
			`}`
			`}`
refactor: extract TextInferenceEngineImpl to reduce duplications between EncoderDecoderImpl and DecoderImpl #189 2023-06-04 22:28:39 +00:00
refactor: extract TextGeneration trait (#324) * add tabby-inference * extract TextGeneration trait * format * Rename TextInferenceEngine to CTranslate2Engine 2023-08-02 06:12:51 +00:00			`pub struct CTranslate2Engine {`
chore: mark thread safety [TAB-52] (#186) * mark thread safety * use shared_ptr to ensure thread safety * fmt 2023-06-04 06:23:31 +00:00			`engine: cxx::SharedPtr<ffi::TextInferenceEngine>,`
add ctranslate2-bindings / tabby rust packages (#146) * add ctranslate2-bindings * add fixme for linux build * turn off shared lib * add tabby-cli 2023-05-25 21:05:28 +00:00			`tokenizer: Tokenizer,`
feat: support stop sequences [TAB-52] (#212) * refactor: pass step and string token to callback * add token to callback * add stop regexp * implement stop words logic * pass token_ids from inference * improve effiency of regexp match with reversed regex * fmt * add typescript and javascript stop words * add cache for stop words regexp 2023-06-06 23:28:58 +00:00			`stop_regex_cache: DashMap<&'static Vec<&'static str>, Regex>,`
feat: add stop words encoding offset for ctranslate model config (#371) * feat: add stop words encoding offset for ctranslate model config * feat: set default suffix to \n * add special treatment for bytefallback tokens 2023-08-28 06:07:01 +00:00			`stop_words_encoding_offset: Option<usize>,`
add ctranslate2-bindings / tabby rust packages (#146) * add ctranslate2-bindings * add fixme for linux build * turn off shared lib * add tabby-cli 2023-05-25 21:05:28 +00:00			`}`

refactor: extract TextGeneration trait (#324) * add tabby-inference * extract TextGeneration trait * format * Rename TextInferenceEngine to CTranslate2Engine 2023-08-02 06:12:51 +00:00			`impl CTranslate2Engine {`
			`pub fn create(options: CTranslate2EngineOptions) -> Self where {`
feat: support cuda devices in rust tabby (#149) 2023-05-26 06:23:07 +00:00			`let engine = ffi::create_engine(`
			`&options.model_path,`
Support causal lm (decoder only model) (#151) * support * support causal lm 2023-05-27 08:26:33 +00:00			`&options.model_type,`
feat: support cuda devices in rust tabby (#149) 2023-05-26 06:23:07 +00:00			`&options.device,`
feat: support set compute_type through commandline arguments 2023-06-13 19:04:07 +00:00			`&options.compute_type,`
feat: support cuda devices in rust tabby (#149) 2023-05-26 06:23:07 +00:00			`&options.device_indices,`
			`options.num_replicas_per_device,`
			`);`
refactor: extract TextGeneration trait (#324) * add tabby-inference * extract TextGeneration trait * format * Rename TextInferenceEngine to CTranslate2Engine 2023-08-02 06:12:51 +00:00
			`return Self {`
Switch to sccache (#154) * fix fmt * fix * fix test * fix clippy * switch to sc cache * fix * update * update * update * fix * add test * remove clippy * update * disable incremental * update * simply 2023-05-27 23:20:17 +00:00			`engine,`
feat: support stop sequences [TAB-52] (#212) * refactor: pass step and string token to callback * add token to callback * add stop regexp * implement stop words logic * pass token_ids from inference * improve effiency of regexp match with reversed regex * fmt * add typescript and javascript stop words * add cache for stop words regexp 2023-06-06 23:28:58 +00:00			`stop_regex_cache: DashMap::new(),`
feat: support cuda devices in rust tabby (#149) 2023-05-26 06:23:07 +00:00			`tokenizer: Tokenizer::from_file(&options.tokenizer_path).unwrap(),`
feat: add stop words encoding offset for ctranslate model config (#371) * feat: add stop words encoding offset for ctranslate model config * feat: set default suffix to \n * add special treatment for bytefallback tokens 2023-08-28 06:07:01 +00:00			`stop_words_encoding_offset: options.stop_words_encoding_offset,`
add ctranslate2-bindings / tabby rust packages (#146) * add ctranslate2-bindings * add fixme for linux build * turn off shared lib * add tabby-cli 2023-05-25 21:05:28 +00:00			`};`
			`}`
refactor: extract TextGeneration trait (#324) * add tabby-inference * extract TextGeneration trait * format * Rename TextInferenceEngine to CTranslate2Engine 2023-08-02 06:12:51 +00:00			`}`
add ctranslate2-bindings / tabby rust packages (#146) * add ctranslate2-bindings * add fixme for linux build * turn off shared lib * add tabby-cli 2023-05-25 21:05:28 +00:00
refactor: extract TextGeneration trait (#324) * add tabby-inference * extract TextGeneration trait * format * Rename TextInferenceEngine to CTranslate2Engine 2023-08-02 06:12:51 +00:00			`#[async_trait]`
			`impl TextGeneration for CTranslate2Engine {`
			`async fn generate(&self, prompt: &str, options: TextGenerationOptions) -> String {`
add ctranslate2-bindings / tabby rust packages (#146) * add ctranslate2-bindings * add fixme for linux build * turn off shared lib * add tabby-cli 2023-05-25 21:05:28 +00:00			`let encoding = self.tokenizer.encode(prompt, true).unwrap();`
chore: mark thread safety [TAB-52] (#186) * mark thread safety * use shared_ptr to ensure thread safety * fmt 2023-06-04 06:23:31 +00:00			`let engine = self.engine.clone();`
refactor: extract TextInferenceEngineImpl to reduce duplications between EncoderDecoderImpl and DecoderImpl #189 2023-06-04 22:28:39 +00:00
			`let cancel = CancellationToken::new();`
			`let cancel_for_inference = cancel.clone();`
			`let _guard = cancel.drop_guard();`

feat: support stop sequences [TAB-52] (#212) * refactor: pass step and string token to callback * add token to callback * add stop regexp * implement stop words logic * pass token_ids from inference * improve effiency of regexp match with reversed regex * fmt * add typescript and javascript stop words * add cache for stop words regexp 2023-06-06 23:28:58 +00:00			`let stop_re: Option<Regex> = if options.stop_words.is_empty() {`
			`None`
			`} else {`
			`let mut re = self.stop_regex_cache.get(options.stop_words);`
			`if re.is_none() {`
			`self.stop_regex_cache.insert(`
			`options.stop_words,`
feat: add stop words encoding offset for ctranslate model config (#371) * feat: add stop words encoding offset for ctranslate model config * feat: set default suffix to \n * add special treatment for bytefallback tokens 2023-08-28 06:07:01 +00:00			`create_stop_regex(`
			`&self.tokenizer,`
			`options.stop_words,`
			`self.stop_words_encoding_offset,`
			`),`
feat: support stop sequences [TAB-52] (#212) * refactor: pass step and string token to callback * add token to callback * add stop regexp * implement stop words logic * pass token_ids from inference * improve effiency of regexp match with reversed regex * fmt * add typescript and javascript stop words * add cache for stop words regexp 2023-06-06 23:28:58 +00:00			`);`
			`re = self.stop_regex_cache.get(options.stop_words);`
			`}`
			`re.map(\|x\| x.value().clone())`
			`};`

			`let context = InferenceContext::new(stop_re, cancel_for_inference);`
			`let output_ids = tokio::task::spawn_blocking(move \|\| {`
refactor: extract TextInferenceEngineImpl to reduce duplications between EncoderDecoderImpl and DecoderImpl #189 2023-06-04 22:28:39 +00:00			`let context = Box::new(context);`
chore: mark thread safety [TAB-52] (#186) * mark thread safety * use shared_ptr to ensure thread safety * fmt 2023-06-04 06:23:31 +00:00			`engine.inference(`
refactor: extract TextInferenceEngineImpl to reduce duplications between EncoderDecoderImpl and DecoderImpl #189 2023-06-04 22:28:39 +00:00			`context,`
feat: support stop sequences [TAB-52] (#212) * refactor: pass step and string token to callback * add token to callback * add stop regexp * implement stop words logic * pass token_ids from inference * improve effiency of regexp match with reversed regex * fmt * add typescript and javascript stop words * add cache for stop words regexp 2023-06-06 23:28:58 +00:00			`inference_callback,`
chore: mark thread safety [TAB-52] (#186) * mark thread safety * use shared_ptr to ensure thread safety * fmt 2023-06-04 06:23:31 +00:00			`encoding.get_tokens(),`
			`options.max_decoding_length,`
			`options.sampling_temperature,`
			`)`
			`})`
			`.await`
			`.expect("Inference failed");`
add ctranslate2-bindings / tabby rust packages (#146) * add ctranslate2-bindings * add fixme for linux build * turn off shared lib * add tabby-cli 2023-05-25 21:05:28 +00:00			`self.tokenizer.decode(output_ids, true).unwrap()`
			`}`
			`}`
feat: support stop sequences [TAB-52] (#212) * refactor: pass step and string token to callback * add token to callback * add stop regexp * implement stop words logic * pass token_ids from inference * improve effiency of regexp match with reversed regex * fmt * add typescript and javascript stop words * add cache for stop words regexp 2023-06-06 23:28:58 +00:00
			`fn inference_callback(`
			`context: &mut InferenceContext,`
			`_step: usize,`
			`_token_id: u32,`
			`token: String,`
			`) -> bool {`
			`if context.cancel.is_cancelled() {`
			`true`
			`} else if let Some(re) = &context.stop_re {`
feat: add stop words encoding offset for ctranslate model config (#371) * feat: add stop words encoding offset for ctranslate model config * feat: set default suffix to \n * add special treatment for bytefallback tokens 2023-08-28 06:07:01 +00:00			`let mut new_token = reverse(&token);`
feat: support stop sequences [TAB-52] (#212) * refactor: pass step and string token to callback * add token to callback * add stop regexp * implement stop words logic * pass token_ids from inference * improve effiency of regexp match with reversed regex * fmt * add typescript and javascript stop words * add cache for stop words regexp 2023-06-06 23:28:58 +00:00			`new_token.push_str(&context.reversed_output_text);`
			`context.reversed_output_text = new_token;`
			`re.find(&context.reversed_output_text).is_some()`
			`} else {`
			`false`
			`}`
			`}`

feat: add stop words encoding offset for ctranslate model config (#371) * feat: add stop words encoding offset for ctranslate model config * feat: set default suffix to \n * add special treatment for bytefallback tokens 2023-08-28 06:07:01 +00:00			`fn reverse(s: &String) -> String {`
			`// Special treatment for byte fallback token.`
			`// https://github.com/huggingface/tokenizers/blob/main/tokenizers/src/decoders/byte_fallback.rs`
			`if s.len() == 6 && s.starts_with("<0x") && s.ends_with('>') {`
			`// Keep byte fallback tokens like <0x0A> as is, do not reverse it.`
			`// This won't really affect stop words regex logic, but brings more readability when`
			`// debugging decoding steps.`
			`s.to_owned()`
			`} else {`
			`s.chars().rev().collect()`
			`}`
feat: support stop sequences [TAB-52] (#212) * refactor: pass step and string token to callback * add token to callback * add stop regexp * implement stop words logic * pass token_ids from inference * improve effiency of regexp match with reversed regex * fmt * add typescript and javascript stop words * add cache for stop words regexp 2023-06-06 23:28:58 +00:00			`}`

feat: add stop words encoding offset for ctranslate model config (#371) * feat: add stop words encoding offset for ctranslate model config * feat: set default suffix to \n * add special treatment for bytefallback tokens 2023-08-28 06:07:01 +00:00			`fn create_stop_regex(`
			`tokenizer: &Tokenizer,`
			`stop_words: &[&str],`
			`stop_words_encoding_offset: Option<usize>,`
			`) -> Regex {`
feat: improve error handling and messages [TAB-58] (#213) * add fatal macro * switch expect to fatal * improve error handling of serve * improve error handling on download module * improve error handling in scheduler * improve error handling * fmt * fmt 2023-06-07 02:02:58 +00:00			`let encodings = tokenizer`
			`.encode_batch(stop_words.to_owned(), false)`
			`.unwrap();`
feat: support stop sequences [TAB-52] (#212) * refactor: pass step and string token to callback * add token to callback * add stop regexp * implement stop words logic * pass token_ids from inference * improve effiency of regexp match with reversed regex * fmt * add typescript and javascript stop words * add cache for stop words regexp 2023-06-06 23:28:58 +00:00			`let stop_tokens: Vec<String> = encodings`
			`.iter()`
feat: add stop words encoding offset for ctranslate model config (#371) * feat: add stop words encoding offset for ctranslate model config * feat: set default suffix to \n * add special treatment for bytefallback tokens 2023-08-28 06:07:01 +00:00			`.map(\|x\| {`
			`x.get_tokens()[stop_words_encoding_offset.unwrap_or(0)..]`
			`.iter()`
			`.rev()`
			`.map(reverse)`
			`.collect::<Vec<String>>()`
			`.join("")`
			`})`
feat: support stop sequences [TAB-52] (#212) * refactor: pass step and string token to callback * add token to callback * add stop regexp * implement stop words logic * pass token_ids from inference * improve effiency of regexp match with reversed regex * fmt * add typescript and javascript stop words * add cache for stop words regexp 2023-06-06 23:28:58 +00:00			`.collect();`

			`// (?m) enables multi-line matching mode.`
			`// \A means absolute begins of string.`
			`let regex_string = r"(?m)\A".to_owned() + &stop_tokens.join("\|");`
			`Regex::new(&regex_string).unwrap()`
			`}`