entropic/context__manager_8cpp_source.html

// SPDX-License-Identifier: Apache-2.0

#include <entropic/core/context_manager.h>

#include <entropic/types/logging.h>


// File-local logger handle for this translation unit, obtained from the
// entropic logging facade under the name "core.context_manager".
static auto logger = entropic::log::get("core.context_manager");


namespace entropic {


/**
 * @brief Construct a context manager.
 *
 * The compaction manager and the engine callbacks are bound to the
 * members `compaction_` and `callbacks_`; the hooks bundle is taken by
 * value and moved into `hooks_`.
 *
 * @param compaction Compaction manager used for token counting and compaction.
 * @param callbacks  Engine callback table consulted after compaction.
 * @param hooks      Engine-level hooks invoked during context management.
 */
ContextManager::ContextManager(CompactionManager& compaction,
                               EngineCallbacks& callbacks,
                               ContextManagerHooks hooks)
    : compaction_(compaction)
    , callbacks_(callbacks)
    , hooks_(std::move(hooks))
{
}


/**
 * @brief Bring the token counter's window size in line with a new length.
 *
 * Non-positive lengths are ignored. When the supplied length differs from
 * the counter's current `max_tokens`, the change is logged at debug level
 * and the counter is updated; otherwise nothing happens.
 *
 * @param ctx            Loop context (not used by this function).
 * @param context_length Context window size to apply.
 */
void ContextManager::refresh_context_limit(
    LoopContext& ctx,
    int context_length) {
    (void)ctx;

    auto& limit = compaction_.counter.max_tokens;
    const bool usable = context_length > 0;
    if (!usable || limit == context_length) {
        return;  // nothing valid to apply, or already up to date
    }

    logger->debug("Updating context limit: {} -> {}",
                  limit, context_length);
    limit = context_length;
}


/**
 * @brief Replace all but the most recent tool results with short stubs.
 *
 * A message counts as a tool result when its metadata has a "tool_name"
 * key. The newest `keep_recent` of those are left alone; every older one
 * whose content is not already a "[Previous:" stub has its content
 * replaced by a one-line stub naming the tool and the original size.
 *
 * Nothing is pruned when `keep_recent` is not positive or when there are
 * no more than `keep_recent` tool results.
 *
 * @param ctx         Loop context whose messages are rewritten in place.
 * @param keep_recent Number of most recent tool results to preserve.
 * @return {number of messages stubbed, sum of their original content
 *         sizes in chars}.
 */
std::pair<int, int> ContextManager::prune_tool_results(
    LoopContext& ctx,
    int keep_recent) {
    // Positions of every tool-result message, in conversation order.
    std::vector<size_t> tool_positions;
    for (size_t pos = 0; pos < ctx.messages.size(); ++pos) {
        const auto& meta = ctx.messages[pos].metadata;
        if (meta.find("tool_name") != meta.end()) {
            tool_positions.push_back(pos);
        }
    }

    const bool has_excess = keep_recent > 0
        && tool_positions.size() > static_cast<size_t>(keep_recent);
    if (!has_excess) {
        return {0, 0};
    }
    const size_t stub_count =
        tool_positions.size() - static_cast<size_t>(keep_recent);

    int stubbed = 0;
    int chars_freed = 0;
    for (size_t k = 0; k < stub_count; ++k) {
        auto& target = ctx.messages[tool_positions[k]];

        // Already reduced to a stub on an earlier pass — leave it.
        const bool is_stub = target.content.rfind("[Previous:", 0) == 0;
        if (is_stub) {
            continue;
        }

        std::string tool = "unknown";
        const auto found = target.metadata.find("tool_name");
        if (found != target.metadata.end()) {
            tool = found->second;
        }

        const int original_size = static_cast<int>(target.content.size());
        chars_freed += original_size;

        std::string stub = "[Previous: ";
        stub += tool;
        stub += " result — ";
        stub += std::to_string(original_size);
        stub += " chars, pruned]";
        target.content = stub;

        ++stubbed;
    }

    if (stubbed > 0) {
        // Message contents changed, so cached token counts are stale.
        compaction_.counter.clear_cache();
        logger->info("Pruned {} tool result(s), freed {} chars",
                     stubbed, chars_freed);
    }
    return {stubbed, chars_freed};
}


/**
 * @brief Auto-prune tool results that are at least TTL iterations old.
 *
 * Runs only when context usage has reached the configured warning
 * threshold. A message is stubbed when it has a "tool_name" metadata key,
 * is not already a "[Previous:" stub, carries a parseable
 * "added_at_iteration" metadata value, and that value is at least
 * `tool_result_ttl` iterations behind the current iteration count.
 * The original content is preserved under the "original_content"
 * metadata key before the message content is replaced by the stub.
 *
 * @param ctx Loop context whose messages are rewritten in place.
 */
void ContextManager::prune_old_tool_results(LoopContext& ctx) {
    // Gate on context fill — below the warning threshold, pruning has
    // no benefit and only loses evidence the validator + dedup cache
    // depend on. Same threshold ``inject_context_warning`` uses so
    // operators see the warning at exactly the fill where pruning
    // starts engaging. Set ``warning_threshold_percent`` to 0 in
    // config to restore the pre-2.1.3 always-prune behaviour.
    float threshold = compaction_.config.warning_threshold_percent;
    float usage = compaction_.counter.usage_percent(ctx.messages);
    if (usage < threshold) {
        return;
    }

    int ttl = compaction_.config.tool_result_ttl;
    int current = ctx.metrics.iterations;
    int pruned = 0;

    for (auto& msg : ctx.messages) {
        auto tn = msg.metadata.find("tool_name");
        if (tn == msg.metadata.end()) {
            continue;
        }
        if (msg.content.rfind("[Previous:", 0) == 0) {
            continue;  // already a stub
        }
        auto ai = msg.metadata.find("added_at_iteration");
        if (ai == msg.metadata.end()) {
            continue;
        }
        int added = 0;
        // Unparseable iteration stamps are treated as "do not prune".
        try { added = std::stoi(ai->second); }
        catch (...) { continue; }
        if (current - added < ttl) {
            continue;
        }

        // Take a copy of the tool name BEFORE touching the metadata map.
        // Inserting "original_content" below adds a new key; if the
        // metadata container is a std::unordered_map (its type is not
        // visible from this file), that insertion may rehash and
        // invalidate `tn`, so `tn` must not be dereferenced afterwards.
        const std::string tool_name = tn->second;
        const int chars = static_cast<int>(msg.content.size());

        // Issue #5 (v2.1.3, companion fix): preserve the original
        // content in metadata before stubbing. The model adapter still
        // sees the stub (which is the whole point of pruning — save
        // context for the agent's next inference), but the
        // constitutional validator's POST_GENERATE hook can read
        // original_content to verify citations against actual evidence
        // instead of the stub. Without this, a long delegation that
        // legitimately fills the context window has its file:line
        // citations false-flagged as hallucinations because the stub
        // is the only evidence the validator sees.
        //
        // The content is moved rather than copied: it is overwritten by
        // the stub on the next statement anyway.
        msg.metadata["original_content"] = std::move(msg.content);
        msg.content = "[Previous: " + tool_name + " result — "
                    + std::to_string(chars) + " chars, pruned]";
        ++pruned;
    }

    if (pruned > 0) {
        // Message contents changed, so cached token counts are stale.
        compaction_.counter.clear_cache();
        logger->info("[AUTO-PRUNE] Pruned {} results (TTL={})", pruned, ttl);
    }
}


/**
 * @brief Append a context-usage warning message once usage reaches the
 *        configured warning threshold.
 *
 * The warning is a "user"-role message stating the usage percentage and
 * the current/maximum token counts. At most one warning is injected per
 * loop iteration: the iteration number of the last warning is remembered
 * in `ctx.metadata["last_warning_iteration"]`.
 *
 * @param ctx Loop context; its messages and metadata may be modified.
 */
void ContextManager::inject_context_warning(LoopContext& ctx) {
    const float fill = compaction_.counter.usage_percent(ctx.messages);
    const float warn_at = compaction_.config.warning_threshold_percent;
    if (fill < warn_at) {
        return;
    }

    // Skip when a warning was already injected during this iteration.
    const std::string iteration_tag = std::to_string(ctx.metrics.iterations);
    const auto previous = ctx.metadata.find("last_warning_iteration");
    const bool already_warned =
        previous != ctx.metadata.end() && previous->second == iteration_tag;
    if (already_warned) {
        return;
    }

    const int capacity = compaction_.counter.max_tokens;
    const int used = compaction_.counter.count_messages(ctx.messages);
    // `fill` is scaled by 100 and truncated to get a whole percentage.
    const int percent = static_cast<int>(fill * 100.0f);

    Message notice;
    notice.role = "user";
    notice.content = "[CONTEXT WARNING] Context at ";
    notice.content += std::to_string(percent);
    notice.content += "% capacity (";
    notice.content += std::to_string(used);
    notice.content += "/";
    notice.content += std::to_string(capacity);
    notice.content += " tokens). Capture findings with entropic.todo if needed,";
    notice.content += " then call entropic.prune_context.";

    ctx.messages.push_back(std::move(notice));
    ctx.metadata["last_warning_iteration"] = iteration_tag;
    logger->info("[WARNING] Context at {}% — warning injected", percent);
}


/**
 * @brief Log current context usage, then compact the context if needed.
 *
 * Sequence: log token usage (only when the counter has a positive
 * maximum), fire the pre-compaction hook and stop if it cancels,
 * delegate to CompactionManager::check_and_compact, and fire the
 * post-compaction notifications when compaction actually happened.
 *
 * @param ctx   Loop context whose messages may be compacted.
 * @param force Forwarded to the pre-compaction hook and to
 *              check_and_compact.
 */
void ContextManager::check_compaction(
    LoopContext& ctx,
    bool force) {
    const int used = compaction_.counter.count_messages(ctx.messages);
    const int capacity = compaction_.counter.max_tokens;
    if (capacity > 0) {
        const int percent = (used * 100) / capacity;
        logger->info("Context: {}/{} tokens ({}%)", used, capacity, percent);
    }

    const bool cancelled = fire_pre_compact_hook(ctx, force);
    if (cancelled) {
        return;
    }

    const auto outcome = compaction_.check_and_compact(
        ctx.messages, force, ctx.conversation_id);
    if (!outcome.compacted) {
        return;
    }

    fire_post_compact_hooks(ctx, outcome.old_token_count,
                            outcome.new_token_count);
}


/**
 * @brief Fire ON_PRE_COMPACT and report whether compaction was cancelled.
 *
 * When no pre-hook dispatcher is installed the function returns false
 * without doing anything. Otherwise the hook receives a JSON payload of
 * the form {"token_count":N,"force":true|false}. Whatever the hook writes
 * to the out-pointer is released with free() and otherwise ignored
 * (presumably a malloc-allocated buffer — confirm against the hook API).
 *
 * @param ctx   Loop context whose messages are counted for the payload.
 * @param force Whether compaction was requested unconditionally.
 * @return true when the hook returned a non-zero code (compaction
 *         cancelled), false otherwise.
 */
bool ContextManager::fire_pre_compact_hook(LoopContext& ctx, bool force) {
    if (hook_iface_.fire_pre == nullptr) {
        return false;
    }

    const int token_count = compaction_.counter.count_messages(ctx.messages);

    std::string payload = "{\"token_count\":";
    payload += std::to_string(token_count);
    payload += ",\"force\":";
    payload += force ? "true" : "false";
    payload += "}";

    char* modified = nullptr;
    const int status = hook_iface_.fire_pre(
        hook_iface_.registry,
        ENTROPIC_HOOK_ON_PRE_COMPACT,
        payload.c_str(),
        &modified);
    free(modified);

    const bool cancelled = status != 0;
    if (cancelled) {
        logger->info("ON_PRE_COMPACT hook cancelled compaction");
    }
    return cancelled;
}


/**
 * @brief Announce a completed compaction to every registered listener.
 *
 * In order: logs the token change, calls the engine `on_compaction`
 * callback (payload {"old":N,"new":M}) when set, fires ON_POST_COMPACT
 * (payload {"tokens_before":N,"tokens_after":M}) when a post-hook
 * dispatcher is installed, and finally invokes the `after_compaction`
 * engine hook when one is set.
 *
 * @param ctx       Loop context passed to the `after_compaction` hook.
 * @param old_count Token count before compaction.
 * @param new_count Token count after compaction.
 */
void ContextManager::fire_post_compact_hooks(LoopContext& ctx, int old_count,
                                             int new_count) {
    logger->info("Compacted: {} -> {} tokens", old_count, new_count);

    const std::string before = std::to_string(old_count);
    const std::string after = std::to_string(new_count);

    if (callbacks_.on_compaction != nullptr) {
        std::string payload = "{\"old\":";
        payload += before;
        payload += ",\"new\":";
        payload += after;
        payload += "}";
        callbacks_.on_compaction(payload.c_str(), callbacks_.user_data);
    }

    // Hook: ON_POST_COMPACT (v1.9.1)
    if (hook_iface_.fire_post != nullptr) {
        std::string payload = "{\"tokens_before\":";
        payload += before;
        payload += ",\"tokens_after\":";
        payload += after;
        payload += "}";

        // Any buffer the hook hands back is released and not inspected.
        char* returned = nullptr;
        hook_iface_.fire_post(hook_iface_.registry,
                              ENTROPIC_HOOK_ON_POST_COMPACT,
                              payload.c_str(),
                              &returned);
        free(returned);
    }

    if (hooks_.after_compaction) {
        hooks_.after_compaction(ctx);
    }
}


} // namespace entropic

entropic::CompactionManager
Manages automatic context compaction.
Definition compaction.h:113

entropic::CompactionManager::config
CompactionConfig config
Compaction configuration.
Definition compaction.h:157

entropic::CompactionManager::counter
TokenCounter & counter
Shared token counter.
Definition compaction.h:158

entropic::CompactionManager::check_and_compact
CompactionResult check_and_compact(std::vector< Message > &messages, bool force=false, const std::string &conversation_id="")
Check if compaction is needed and perform if so.
Definition compaction.cpp:124

entropic::ContextManager::fire_post_compact_hooks
void fire_post_compact_hooks(LoopContext &ctx, int old_count, int new_count)
Fire post-compaction callbacks + ON_POST_COMPACT hook.
Definition context_manager.cpp:277

entropic::ContextManager::prune_tool_results
std::pair< int, int > prune_tool_results(LoopContext &ctx, int keep_recent)
Replace old tool results with stubs.
Definition context_manager.cpp:60

entropic::ContextManager::prune_old_tool_results
void prune_old_tool_results(LoopContext &ctx)
Auto-prune tool results older than TTL iterations.
Definition context_manager.cpp:123

entropic::ContextManager::refresh_context_limit
void refresh_context_limit(LoopContext &ctx, int context_length)
Refresh context limit based on tier config.
Definition context_manager.cpp:38

entropic::ContextManager::ContextManager
ContextManager(CompactionManager &compaction, EngineCallbacks &callbacks, ContextManagerHooks hooks={})
Construct a context manager.
Definition context_manager.cpp:23

entropic::ContextManager::fire_pre_compact_hook
bool fire_pre_compact_hook(LoopContext &ctx, bool force)
Fire ON_PRE_COMPACT; report whether compaction was cancelled.
Definition context_manager.cpp:252

entropic::ContextManager::inject_context_warning
void inject_context_warning(LoopContext &ctx)
Inject context usage warning if over threshold.
Definition context_manager.cpp:187

entropic::ContextManager::check_compaction
void check_compaction(LoopContext &ctx, bool force=false)
Check and perform compaction if needed.
Definition context_manager.cpp:223

entropic::TokenCounter::max_tokens
int max_tokens
Maximum context window size.
Definition compaction.h:71

entropic::TokenCounter::clear_cache
void clear_cache()
Clear the token count cache.
Definition compaction.cpp:98

entropic::TokenCounter::count_messages
int count_messages(const std::vector< Message > &messages) const
Count total tokens in a message list.
Definition compaction.cpp:68

entropic::TokenCounter::usage_percent
float usage_percent(const std::vector< Message > &messages) const
Get usage as fraction of context window (0.0–1.0).
Definition compaction.cpp:84

context_manager.h
Context management subsystem for the agentic loop.

ENTROPIC_HOOK_ON_POST_COMPACT
@ ENTROPIC_HOOK_ON_POST_COMPACT
12: After context compaction
Definition hooks.h:48

ENTROPIC_HOOK_ON_PRE_COMPACT
@ ENTROPIC_HOOK_ON_PRE_COMPACT
11: Before context compaction
Definition hooks.h:47

logging.h
spdlog initialization and logger access.

entropic::log::get
ENTROPIC_EXPORT std::shared_ptr< spdlog::logger > get(const std::string &name)
Get or create a named logger.
Definition logging.cpp:211

entropic
Activate model on GPU (WARM → ACTIVE).
Definition bundled_models.h:20

entropic::CompactionConfig::warning_threshold_percent
float warning_threshold_percent
Warning trigger (0.3–0.9)
Definition config.h:516

entropic::CompactionConfig::tool_result_ttl
int tool_result_ttl
Tool result TTL in turns (>= 1; v2.1.3 #6: gated on fill, no upper bound)
Definition config.h:515

entropic::ContextManagerHooks
Engine-level hooks called during context management.
Definition context_manager.h:26

entropic::ContextManagerHooks::after_compaction
std::function< void(LoopContext &)> after_compaction
Post-compaction hook.
Definition context_manager.h:27

entropic::EngineCallbacks
Callback function pointer types for engine events.
Definition engine_types.h:300

entropic::EngineCallbacks::on_compaction
void(* on_compaction)(const char *json, void *ud)
Compaction result.
Definition engine_types.h:312

entropic::EngineCallbacks::user_data
void * user_data
Opaque pointer passed to all callbacks.
Definition engine_types.h:324

entropic::LoopContext
Mutable state carried through the agentic loop.
Definition engine_types.h:223

entropic::LoopContext::metrics
LoopMetrics metrics
Timing and counts.
Definition engine_types.h:227

entropic::LoopContext::conversation_id
std::string conversation_id
Conversation ID for storage (v1.8.8)
Definition engine_types.h:234

entropic::LoopContext::metadata
std::unordered_map< std::string, std::string > metadata
Runtime metadata.
Definition engine_types.h:238

entropic::LoopContext::messages
std::vector< Message > messages
Conversation history.
Definition engine_types.h:224

entropic::LoopMetrics::iterations
int iterations
Total iterations completed.
Definition engine_types.h:129

entropic::Message
A message in a conversation.
Definition message.h:35

entropic::Message::content
std::string content
Message text content (always populated)
Definition message.h:37

entropic::Message::role
std::string role
Message role.
Definition message.h:36