entropic/secondary__model__loader_8h_source.html

// SPDX-License-Identifier: Apache-2.0

#pragma once


#include <entropic/inference/backend.h>

#include <entropic/types/config.h>


#include <memory>

#include <mutex>

#include <string>

#include <unordered_map>

#include <vector>


namespace entropic {


class SecondaryModelLoader {

public:

    bool ensure_loaded(const std::string& role, const ModelConfig& config);


    InferenceBackend* get(const std::string& role) const;


    std::shared_ptr<InferenceBackend> get_shared(

        const std::string& role) const;


    bool release_role(const std::string& role);


    bool is_loaded(const std::string& role) const;


    std::vector<std::string> loaded_roles() const;


    void clear_all_prompt_caches();


    void shutdown();


private:

    mutable std::mutex slots_mutex_;


    std::unordered_map<std::string, std::shared_ptr<InferenceBackend>>

        slots_;


    std::unordered_map<std::string, std::string> slot_paths_;

};


} // namespace entropic

entropic::InferenceBackend
Concrete base class for inference backends (80% logic).
Definition backend.h:69

entropic::SecondaryModelLoader
Role-keyed lifecycle manager for non-primary models.
Definition secondary_model_loader.h:55

entropic::SecondaryModelLoader::get_shared
std::shared_ptr< InferenceBackend > get_shared(const std::string &role) const
Get the backend for a role as a shared_ptr.
Definition secondary_model_loader.cpp:80

entropic::SecondaryModelLoader::clear_all_prompt_caches
void clear_all_prompt_caches()
Fanout: clear prompt/KV cache on every loaded backend.
Definition secondary_model_loader.cpp:147

entropic::SecondaryModelLoader::is_loaded
bool is_loaded(const std::string &role) const
Check whether a role is currently loaded and active.
Definition secondary_model_loader.cpp:117

entropic::SecondaryModelLoader::loaded_roles
std::vector< std::string > loaded_roles() const
Names of all roles with a currently-loaded backend.
Definition secondary_model_loader.cpp:129

entropic::SecondaryModelLoader::release_role
bool release_role(const std::string &role)
Unload and drop a role.
Definition secondary_model_loader.cpp:95

entropic::SecondaryModelLoader::shutdown
void shutdown()
Unload every role.
Definition secondary_model_loader.cpp:159

entropic::SecondaryModelLoader::get
InferenceBackend * get(const std::string &role) const
Get the backend for a role.
Definition secondary_model_loader.cpp:67

entropic::SecondaryModelLoader::ensure_loaded
bool ensure_loaded(const std::string &role, const ModelConfig &config)
Lazily load and activate a model for a role.
Definition secondary_model_loader.cpp:34

config.h
Configuration structs with defaults.

backend.h
InferenceBackend concrete base class.

entropic
Activate model on GPU (WARM → ACTIVE).
Definition bundled_models.h:20

entropic::ModelConfig
Model configuration for a single tier.
Definition config.h:148