Entropic 2.3.8
Local-first agentic inference engine
Loading...
Searching...
No Matches
entropic::LlamaCppBackend Member List

This is the complete list of members for entropic::LlamaCppBackend, including all inherited members.

activate() | entropic::InferenceBackend
allocate_temp_seq_id() | entropic::LlamaCppBackend [protected]
apply_chat_template(const std::vector< Message > &messages, const GenerationParams &params) const | entropic::LlamaCppBackend [protected]
capabilities() const | entropic::InferenceBackend
clear_prompt_cache() override | entropic::LlamaCppBackend [inline, virtual]
clear_state(int seq_id=-1) | entropic::InferenceBackend
complete(const std::string &prompt, const GenerationParams &params) | entropic::InferenceBackend
compute_perplexity(const int32_t *tokens, int n_tokens) | entropic::InferenceBackend
compute_prefix_token_count(const std::vector< Message > &messages, const GenerationParams &params) | entropic::LlamaCppBackend [protected]
config() const | entropic::InferenceBackend [inline]
context_length() const | entropic::InferenceBackend [inline]
count_tokens(const std::string &text) const | entropic::InferenceBackend
create_inference_context() | entropic::LlamaCppBackend [protected]
create_sampler(const GenerationParams &params) const | entropic::LlamaCppBackend [protected]
ctx_ | entropic::LlamaCppBackend [protected]
deactivate() | entropic::InferenceBackend
decode_loop(const std::vector< llama_token > &tokens, const GenerationParams &params, std::function< void(std::string_view)> on_token, std::atomic< bool > *cancel) | entropic::LlamaCppBackend [protected]
decode_tokens_from(const std::vector< llama_token > &tokens, int start_offset) | entropic::LlamaCppBackend [protected]
detokenize(llama_token token) const | entropic::LlamaCppBackend [protected]
do_activate() override | entropic::LlamaCppBackend [protected, virtual]
do_backend_name() const override | entropic::LlamaCppBackend [protected, virtual]
do_clear_state(int seq_id) override | entropic::LlamaCppBackend [protected, virtual]
do_complete(const std::string &prompt, const GenerationParams &params) override | entropic::LlamaCppBackend [protected, virtual]
do_count_tokens(const std::string &text) const override | entropic::LlamaCppBackend [protected, virtual]
do_deactivate() override | entropic::LlamaCppBackend [protected, virtual]
do_evaluate_logprobs(const int32_t *tokens, int n_tokens) override | entropic::LlamaCppBackend [protected, virtual]
do_generate(const std::vector< Message > &messages, const GenerationParams &params) override | entropic::LlamaCppBackend [protected, virtual]
do_generate_seq(int seq_id, const std::vector< Message > &messages, const GenerationParams &params) | entropic::InferenceBackend [protected, virtual]
do_generate_speculative(const std::vector< Message > &messages, const GenerationParams &params, std::function< void(std::string_view token)> on_token, std::atomic< bool > &cancel) override | entropic::LlamaCppBackend [protected, virtual]
do_generate_streaming(const std::vector< Message > &messages, const GenerationParams &params, std::function< void(std::string_view token)> on_token, std::atomic< bool > &cancel) override | entropic::LlamaCppBackend [protected, virtual]
do_generate_streaming_seq(int seq_id, const std::vector< Message > &messages, const GenerationParams &params, std::function< void(std::string_view token)> on_token, std::atomic< bool > &cancel) | entropic::InferenceBackend [protected, virtual]
do_generate_streaming_text_only(const std::vector< Message > &messages, const GenerationParams &params, std::function< void(std::string_view token)> on_token, std::atomic< bool > &cancel) | entropic::LlamaCppBackend [protected]
do_generate_text_only(const std::vector< Message > &messages, const GenerationParams &params) | entropic::LlamaCppBackend [protected]
do_info() const override | entropic::LlamaCppBackend [protected, virtual]
do_load(const ModelConfig &config) override | entropic::LlamaCppBackend [protected, virtual]
do_restore_state(int seq_id, const std::vector< uint8_t > &buffer) | entropic::InferenceBackend [protected, virtual]
do_save_state(int seq_id, std::vector< uint8_t > &buffer) const | entropic::InferenceBackend [protected, virtual]
do_supports(BackendCapability cap) const override | entropic::LlamaCppBackend [protected, virtual]
do_unload() override | entropic::LlamaCppBackend [protected, virtual]
evaluate_logprobs(const int32_t *tokens, int n_tokens) | entropic::InferenceBackend
extract_system_prompt(const std::vector< Message > &messages) | entropic::LlamaCppBackend [protected, static]
extract_token_logprob(const float *logits, int32_t next_token, int n_vocab) | entropic::LlamaCppBackend [protected, static]
fire_model_load_hook(const ModelConfig &config) | entropic::InferenceBackend [protected]
free_seq_ids_ | entropic::LlamaCppBackend [protected]
generate(const std::vector< Message > &messages, const GenerationParams &params) | entropic::InferenceBackend
generate_multimodal(const std::vector< Message > &messages, const GenerationParams &params, std::function< void(std::string_view token)> on_token, std::atomic< bool > *cancel) | entropic::LlamaCppBackend [protected]
generate_seq(int seq_id, const std::vector< Message > &messages, const GenerationParams &params) | entropic::InferenceBackend
generate_speculative(const std::vector< Message > &messages, const GenerationParams &params, std::function< void(std::string_view token)> on_token, std::atomic< bool > &cancel) | entropic::InferenceBackend
generate_speculative_with_draft(const std::vector< Message > &messages, const GenerationParams &params, std::function< void(std::string_view token)> on_token, std::atomic< bool > &cancel, LlamaCppBackend &draft, int n_draft_max, const std::string &draft_path) | entropic::LlamaCppBackend
generate_streaming(const std::vector< Message > &messages, const GenerationParams &params, std::function< void(std::string_view token)> on_token, std::atomic< bool > &cancel) | entropic::InferenceBackend
generate_streaming_seq(int seq_id, const std::vector< Message > &messages, const GenerationParams &params, std::function< void(std::string_view token)> on_token, std::atomic< bool > &cancel) | entropic::InferenceBackend
has_vision_ | entropic::LlamaCppBackend [protected]
info() const | entropic::InferenceBackend
init_mmproj_if_configured() | entropic::LlamaCppBackend [protected]
is_active() const | entropic::InferenceBackend [inline]
is_loaded() const | entropic::InferenceBackend [inline]
is_recurrent() const | entropic::LlamaCppBackend [protected]
is_recurrent_ | entropic::LlamaCppBackend [protected]
last_error_ | entropic::InferenceBackend [protected]
llama_context_ptr() | entropic::LlamaCppBackend [inline]
llama_model_ptr() | entropic::LlamaCppBackend [inline]
load(const ModelConfig &config) | entropic::InferenceBackend
load_and_activate(const ModelConfig &config) | entropic::InferenceBackend
load_gpu_model() | entropic::LlamaCppBackend [protected]
model_ | entropic::LlamaCppBackend [protected]
mtmd_ctx_ | entropic::LlamaCppBackend [protected]
mtmd_prefill(const std::string &prompt, const std::vector<::mtmd_bitmap * > &bitmaps, std::string &err_msg) | entropic::LlamaCppBackend [protected]
prefill_and_cache_prefix(const std::vector< llama_token > &tokens, int prefix_tokens, const CacheKey &key) | entropic::LlamaCppBackend [protected]
prompt_cache_ | entropic::LlamaCppBackend [protected]
prompt_cache_config_ | entropic::LlamaCppBackend [protected]
release_temp_seq_id(llama_seq_id seq_id) | entropic::LlamaCppBackend [protected]
restore_cached_prefix(const CacheEntry *cached, const std::vector< llama_token > &tokens) | entropic::LlamaCppBackend [protected]
restore_state(int seq_id, const std::vector< uint8_t > &buffer) | entropic::InferenceBackend
run_prefill(const std::vector< llama_token > &tokens) | entropic::LlamaCppBackend [protected]
run_prefill_cached(const std::vector< llama_token > &tokens, const std::string &system_prompt, const std::vector< Message > &messages, const GenerationParams &params) | entropic::LlamaCppBackend [protected]
run_sampling_loop(const GenerationParams &params, std::function< void(std::string_view token)> on_token, std::atomic< bool > *cancel, const std::chrono::steady_clock::time_point &t0) | entropic::LlamaCppBackend [protected]
save_prefix_to_cache(const CacheKey &key, int prefix_tokens) | entropic::LlamaCppBackend [protected]
save_state(int seq_id, std::vector< uint8_t > &buffer) const | entropic::InferenceBackend
seq_id_mutex_ | entropic::LlamaCppBackend [protected]
set_hooks(const HookInterface &hooks) | entropic::InferenceBackend [inline, protected]
set_prompt_cache_config(const PromptCacheConfig &config) | entropic::LlamaCppBackend [inline]
state() const | entropic::InferenceBackend [inline]
step_token(llama_sampler *sampler, std::string &generated, std::function< void(std::string_view)> &on_token, const std::vector< std::string > &stop) | entropic::LlamaCppBackend [protected]
supports(BackendCapability cap) const | entropic::InferenceBackend
tokenize(const std::string &text, bool add_special) const | entropic::LlamaCppBackend [protected]
tokenize_text(const std::string &text) const override | entropic::LlamaCppBackend [virtual]
unload() | entropic::InferenceBackend
vocab_ | entropic::LlamaCppBackend [protected]
~InferenceBackend()=default (defined in entropic::InferenceBackend) | entropic::InferenceBackend [virtual]
~LlamaCppBackend() override | entropic::LlamaCppBackend