#pragma once #include #include #include std::vector generate_text(std::vector prompt, llama_model* model); std::string llama_untokenize(const std::vector& tokens, const llama_model* model); std::string llama_token_to_piece(const llama_model* model, llama_token token);