#pragma once #include "rust/cxx.h" #include namespace llama { class TextInferenceEngine { public: virtual ~TextInferenceEngine(); virtual void start(rust::Slice input_token_ids) = 0; virtual uint32_t step() = 0; virtual void end() = 0; virtual uint32_t eos_token() const = 0; }; std::unique_ptr create_engine(bool use_gpu, rust::Str model_path); } // namespace