|
| Llava (const struct common_params &params, const struct LlavaParams &llava_params, std::string system_prompt="") |
|
| ~Llava () |
|
void | reset () override |
|
bool | load_image (std::string base64_str) |
|
struct llava_image_embed * | base64_image_to_embed (const std::string &base64_str) |
|
| Llama (const struct common_params &params, std::string system_prompt="", bool initial_reset=true) |
|
virtual | ~Llama () |
|
std::vector< llama_token > | tokenize (const std::string &text, bool add_bos, bool special=false) |
|
std::string | detokenize (const std::vector< llama_token > &tokens) |
|
void | cancel () |
|
std::string | format_chat_prompt (std::vector< struct common_chat_msg > chat_msgs, bool add_ass) |
|
std::vector< struct LoRA > | list_loras () |
|
void | update_loras (std::vector< struct LoRA > loras) |
|
std::vector< llama_token > | truncate_tokens (const std::vector< llama_token > &tokens, int limit_size, bool add_eos=true) |
|
struct EmbeddingsOuput | generate_embeddings (const std::string &input_prompt, int normalization=2) |
|
struct EmbeddingsOuput | generate_embeddings (const std::vector< llama_token > &tokens, int normalization=2) |
|
float | rank_document (const std::string &query, const std::string &document) |
|
std::vector< float > | rank_documents (const std::string &query, const std::vector< std::string > &documents) |
|
struct ResponseOutput | generate_response (const std::string &input_prompt, struct common_params_sampling sparams, GenerateResponseCallback callbakc=nullptr, std::vector< std::string > stop={}) |
|
struct ResponseOutput | generate_response (const std::string &input_prompt, GenerateResponseCallback callbakc=nullptr, std::vector< std::string > stop={}) |
|
const struct llama_context * | get_ctx () |
|
const struct llama_model * | get_model () |
|
const struct llama_vocab * | get_vocab () |
|
int | get_n_ctx () |
|
int | get_n_ctx_train () |
|
int | get_n_embd () |
|
int | get_n_vocab () |
|
std::string | get_metadata (const std::string &key, size_t size) |
|
std::string | get_metadata (const std::string &model_name, const std::string &key, size_t size) |
|
int | get_int_metadata (const std::string &key, size_t size) |
|
int | get_int_metadata (const std::string &model_name, const std::string &key, size_t size) |
|
float | get_float_metadata (const std::string &key, size_t size) |
|
float | get_float_metadata (const std::string &model_name, const std::string &key, size_t size) |
|
struct Metadata | get_metadata () |
|
bool | is_embedding () |
|
bool | is_reranking () |
|
bool | add_bos_token () |
|
bool | is_eog () |
|
llama_token | get_token_eos () |
|
llama_token | get_token_bos () |
|
llama_token | get_token_sep () |
|