entropic/tool__executor_8cpp_source.html

// SPDX-License-Identifier: Apache-2.0

#include <entropic/mcp/tool_executor.h>

#include <entropic/mcp/tool_result_classify.h>

#include <entropic/mcp/utf8_sanitize.h>

#include <entropic/types/logging.h>


#include <nlohmann/json.hpp>


#include <algorithm>

#include <chrono>

#include <memory>

#include <optional>


static auto logger = entropic::log::get("mcp.tool_executor");


namespace entropic {


/**
 * @brief Construct with shared dependencies.
 *
 * Each argument initialises the member of the same name (with a trailing
 * underscore); no other work is done here.
 *
 * @param server_manager Used by this class to look up schemas/policies and
 *                       to execute tool calls.
 * @param loop_config    Loop limits and switches read during processing.
 * @param callbacks      Embedder callbacks (state change, tool start/complete,
 *                       approval).
 * @param hooks          Engine-side hooks (after_tool, process_directives).
 */
ToolExecutor::ToolExecutor(
    ServerManager& server_manager,
    const LoopConfig& loop_config,
    EngineCallbacks& callbacks,
    ToolExecutorHooks hooks)
    : server_manager_(server_manager)
    , loop_config_(loop_config)
    , callbacks_(callbacks)
    , hooks_(hooks)
{
}


void ToolExecutor::set_permission_persist(

    const PermissionPersistInterface& persist) {

    permission_persist_ = persist;

}


/**
 * @brief Process a batch of tool calls.
 *
 * Moves the loop into WAITING_TOOL (and notifies the state callback),
 * orders the calls via sort_tool_calls(), trims the batch to the per-turn
 * limit, then runs each call through process_single_call() until the batch
 * is exhausted or should_stop_batch() asks to stop.
 *
 * @param ctx        Loop context; state and counters are updated in place.
 * @param tool_calls Calls requested for this turn.
 * @return Messages produced by the processed calls, in processing order.
 */
std::vector<Message> ToolExecutor::process_tool_calls(
    LoopContext& ctx,
    const std::vector<ToolCall>& tool_calls) {
    logger->info("Processing {} tool calls", tool_calls.size());
    ctx.state = AgentState::WAITING_TOOL;
    fire_state_callback(ctx);

    // A non-negative per-context override wins over the configured limit.
    int per_turn_cap = loop_config_.max_tool_calls_per_turn;
    if (ctx.effective_max_tool_calls_per_turn >= 0) {
        per_turn_cap = ctx.effective_max_tool_calls_per_turn;
    }

    auto batch = sort_tool_calls(tool_calls);
    truncate_to_limit(batch, per_turn_cap);

    std::vector<Message> collected;
    for (const auto& tool_call : batch) {
        auto produced = process_single_call(ctx, tool_call);
        for (auto& message : produced) {
            collected.emplace_back(std::move(message));
        }
        if (should_stop_batch(ctx, collected)) {
            break;
        }
    }

    // The error streak is cleared once the batch has been handled.
    ctx.consecutive_errors = 0;
    return collected;
}


std::vector<ToolCall> ToolExecutor::sort_tool_calls(

    const std::vector<ToolCall>& calls) {

    auto sorted = calls;

    std::stable_sort(sorted.begin(), sorted.end(),

        [](const ToolCall& a, const ToolCall& b) {

            bool a_delegate = (a.name == "entropic.delegate");

            bool b_delegate = (b.name == "entropic.delegate");

            return !a_delegate && b_delegate;

        });

    return sorted;

}


/**
 * @brief Look up a previously cached result for an identical call.
 *
 * @param ctx  Loop context holding the recent_tool_calls cache.
 * @param call Call to look up (keyed by tool_call_key()).
 * @return The cached result text, or an empty string when the tool is
 *         exempt from duplicate detection or no entry exists.
 */
std::string ToolExecutor::check_duplicate(
    const LoopContext& ctx,
    const ToolCall& call) const {
    if (server_manager_.skip_duplicate_check(call.name)) {
        return {};
    }
    const auto& cache = ctx.recent_tool_calls;
    const auto hit = cache.find(tool_call_key(call));
    if (hit == cache.end()) {
        return {};
    }
    return hit->second;
}


/**
 * @brief Build the response for a call detected as a duplicate.
 *
 * Increments the consecutive-duplicate counter and logs a warning. From
 * the third consecutive duplicate on, the circuit-breaker message is
 * returned instead of the ordinary duplicate notice.
 *
 * @param ctx             Loop context; consecutive_duplicate_attempts is bumped.
 * @param call            The duplicated call.
 * @param previous_result Cached result text of the earlier identical call.
 * @return Message to feed back to the model.
 */
Message ToolExecutor::handle_duplicate(
    LoopContext& ctx,
    const ToolCall& call,
    const std::string& previous_result) {
    ++ctx.consecutive_duplicate_attempts;
    logger->warn("Duplicate tool call #{}: {}",
                 ctx.consecutive_duplicate_attempts, call.name);

    const bool breaker_tripped = ctx.consecutive_duplicate_attempts >= 3;
    return breaker_tripped
        ? create_circuit_breaker_message()
        : create_duplicate_message(call, previous_result);
}


bool ToolExecutor::check_approval(const ToolCall& call) {

    auto args_json = serialize_args(call);

    bool auto_ok = loop_config_.auto_approve_tools

                || server_manager_.is_explicitly_allowed(

                       call.name, args_json);


    bool approved = auto_ok;

    if (!approved && callbacks_.on_tool_call != nullptr) {

        auto call_json = serialize_tool_call(call);

        callbacks_.on_tool_call(call_json.c_str(),

                                callbacks_.user_data);

        approved = true;

    }


    // Hook: ON_PERMISSION_CHECK — informational (v1.9.1)

    if (hook_iface_.fire_info != nullptr) {

        std::string perm = approved ? "allowed" : "denied";

        std::string json = "{\"tool_name\":\""

            + call.name + "\",\"permission\":\"" + perm + "\"}";

        hook_iface_.fire_info(hook_iface_.registry,

            ENTROPIC_HOOK_ON_PERMISSION_CHECK, json.c_str());

    }


    if (!approved) {

        logger->warn("No approval callback — denying: {}", call.name);

    }

    return approved;

}


/**
 * @brief Tier allowlist check (currently a pass-through).
 *
 * Tier allowlist enforcement is wired when the facade provides tier
 * config. Until then every call is accepted, whether or not a tier is
 * locked.
 *
 * @param ctx  Loop context; only locked_tier is inspected.
 * @param call Tool call (not used yet).
 * @return Always std::nullopt, i.e. "no rejection".
 */
std::optional<Message> ToolExecutor::check_tier_allowed(
    const LoopContext& ctx, [[maybe_unused]] const ToolCall& call) const {
    const bool tier_locked = !ctx.locked_tier.empty();
    if (!tier_locked) {
        // No tier locked = no filter.
        return std::nullopt;
    }
    // Actual tier allowlist lookup deferred to facade integration.
    return std::nullopt;
}


/**
 * @brief Verify that every name listed under the schema's "required" key
 *        is present in the arguments.
 *
 * Entries of "required" that are not strings are skipped instead of
 * raising a nlohmann type_error, so a malformed schema cannot abort the
 * tool loop.
 *
 * @param schema Parsed JSON Schema object of the tool.
 * @param args   Parsed call arguments.
 * @return Empty string when nothing is missing, otherwise a message
 *         naming the first missing argument.
 */
static std::string check_required_fields(
    const nlohmann::json& schema,
    const nlohmann::json& args)
{
    const auto required = schema.value("required",
                                       nlohmann::json::array());
    for (const auto& req : required) {
        if (!req.is_string()) {
            continue;  // not a usable property name
        }
        // Borrow the stored string; no per-entry copy is needed.
        const auto& name = req.get_ref<const std::string&>();
        if (!args.contains(name)) {
            return "Missing required argument: " + name;
        }
    }
    return "";
}


/**
 * @brief Check a value against a schema "enum" list.
 *
 * @param key     Argument name, used only in the error text.
 * @param allowed JSON value holding the permitted values.
 * @param val     Argument value to test.
 * @return Empty string when val equals one of the permitted values,
 *         otherwise an error message listing them.
 */
static std::string check_enum(
    const std::string& key,
    const nlohmann::json& allowed,
    const nlohmann::json& val)
{
    const bool permitted = std::any_of(
        allowed.begin(), allowed.end(),
        [&val](const nlohmann::json& candidate) {
            return candidate == val;
        });
    if (permitted) {
        return "";
    }
    return "Invalid value for '" + key + "': "
         + val.dump() + ". Must be one of: " + allowed.dump();
}


/**
 * @brief Check a single value against a type constraint.
 *
 * Recognised type names are the JSON Schema primitives: "string",
 * "integer", "number", "boolean", "array", "object" and "null". Any other
 * type name is reported as a mismatch.
 *
 * @param key  Argument name, used only in the error text.
 * @param type Type name taken from the schema.
 * @param val  Argument value to test.
 * @return Empty string on match, otherwise a mismatch message.
 */
static std::string check_type(
    const std::string& key,
    const std::string& type,
    const nlohmann::json& val)
{
    const bool ok = (type == "string" && val.is_string())
                 || (type == "integer" && val.is_number_integer())
                 || (type == "number" && val.is_number())
                 || (type == "boolean" && val.is_boolean())
                 || (type == "array" && val.is_array())
                 || (type == "object" && val.is_object())
                 // "null" is a JSON Schema primitive type as well.
                 || (type == "null" && val.is_null());
    if (ok) {
        return "";
    }
    return "Type mismatch for '" + key + "': expected " + type;
}


/**
 * @brief Apply one property's "enum" and "type" constraints to a value.
 *
 * The "type" keyword may be a single type name or an array of type names
 * (a union). A union is satisfied when any listed type matches. A "type"
 * of any other shape is not enforceable and is ignored rather than
 * raising a nlohmann type_error.
 *
 * @param key  Argument name, used only in error texts.
 * @param prop Schema fragment describing the property.
 * @param val  Argument value to test.
 * @return Empty string when all constraints hold, otherwise the first
 *         violation found (enum before type).
 */
static std::string check_property_constraints(
    const std::string& key,
    const nlohmann::json& prop,
    const nlohmann::json& val)
{
    if (prop.contains("enum")) {
        auto err = check_enum(key, prop["enum"], val);
        if (!err.empty()) { return err; }
    }
    if (!prop.contains("type")) { return ""; }

    const auto& type = prop["type"];
    if (type.is_string()) {
        return check_type(key, type.get_ref<const std::string&>(), val);
    }
    if (type.is_array()) {
        bool saw_type_name = false;
        for (const auto& alternative : type) {
            if (!alternative.is_string()) { continue; }
            saw_type_name = true;
            const auto& name =
                alternative.get_ref<const std::string&>();
            if (check_type(key, name, val).empty()) { return ""; }
        }
        if (saw_type_name) {
            return "Type mismatch for '" + key
                 + "': expected one of " + type.dump();
        }
    }
    // Malformed "type" (neither a name nor a list of names): skip.
    return "";
}


/**
 * @brief Validate call arguments against a tool's JSON Schema text.
 *
 * Checks required fields first, then the per-property constraints of
 * every declared property that is present in the arguments. A schema
 * that does not parse to a JSON object disables validation.
 *
 * @param schema_json Schema as JSON text.
 * @param args        Parsed call arguments.
 * @return Empty string when valid (or not checkable), otherwise the first
 *         violation found.
 */
static std::string validate_tool_args(
    const std::string& schema_json,
    const nlohmann::json& args)
{
    const auto schema = nlohmann::json::parse(schema_json, nullptr, false);
    if (!schema.is_object()) {
        return "";
    }

    if (auto missing = check_required_fields(schema, args);
        !missing.empty()) {
        return missing;
    }

    const auto props =
        schema.value("properties", nlohmann::json::object());
    for (auto it = props.begin(); it != props.end(); ++it) {
        if (!args.contains(it.key())) {
            continue;  // optional property not supplied
        }
        auto problem = check_property_constraints(
            it.key(), it.value(), args[it.key()]);
        if (!problem.empty()) {
            return problem;
        }
    }
    return "";
}


static std::string parse_tool_result_text(const std::string& result_json) {

    try {

        auto j = nlohmann::json::parse(result_json);

        return j.value("result", result_json);

    } catch (...) {

        return result_json;

    }

}


/**
 * @brief Dispatch one tool call and wrap its result in a message.
 *
 * Announces the call via on_tool_start (if set), executes it through the
 * server manager, sanitizes the returned bytes, records the call in the
 * history buffer and fires the completion callback.
 *
 * @param ctx  Loop context; metrics.tool_calls is incremented.
 * @param call Call to execute.
 * @return Pair of (message with role "user" carrying the result text and
 *         tool_call_id/tool_name metadata, sanitized raw result JSON).
 */
std::pair<Message, std::string> ToolExecutor::execute_tool(
    LoopContext& ctx, const ToolCall& call) {
    using clock = std::chrono::steady_clock;

    const auto args_json = serialize_args(call);

    if (callbacks_.on_tool_start != nullptr) {
        const auto announcement = serialize_tool_call(call);
        callbacks_.on_tool_start(announcement.c_str(),
                                 callbacks_.user_data);
    }

    const auto started = clock::now();
    // Inbound boundary from MCP server subprocess. v2.1.0 (#47) introduced
    // this; v2.1.1 (#3) generalized it as one of several boundary-policy
    // sanitize sites — see include/entropic/mcp/utf8_sanitize.h for the
    // full policy. The earlier "trust downstream" assumption was wrong:
    // bytes also enter via the model token stream and the audit-replay
    // path; both now sanitize at their own boundaries.
    auto result_json = mcp::sanitize_utf8(
        server_manager_.execute(call.name, args_json));
    const auto finished = clock::now();
    const auto ms = std::chrono::duration_cast<
        std::chrono::milliseconds>(finished - started).count();

    ctx.metrics.tool_calls++;

    const std::string result_text = parse_tool_result_text(result_json);

    // P1-11 (2.0.6-rc16): stash into history ring buffer so the
    // constitutional validator revision prompt (and diagnostic tools)
    // can surface prior-iteration tool calls without re-reading
    // messages[].
    record_tool_history(call, args_json, result_text, ms,
                        ctx.metrics.iterations);

    fire_tool_complete_callback(call, result_text, ms);

    Message reply;
    reply.role = "user";
    reply.content = result_text;
    reply.metadata["tool_call_id"] = call.id;
    reply.metadata["tool_name"] = call.name;

    return {std::move(reply), std::move(result_json)};
}


/**
 * @brief Append a completed tool call to the history buffer.
 *
 * The status is "error" when the result text begins with "error" or
 * "Error" (both capitalisations, matching the prefixes record_tool_call
 * refuses to cache), otherwise "success".
 *
 * @param call        The executed call.
 * @param args_json   Serialized arguments, summarized for the record.
 * @param result_text Result text; stored truncated to 200 via
 *                    truncate_result().
 * @param ms          Elapsed time in milliseconds.
 * @param iteration   Loop iteration the call belongs to.
 */
void ToolExecutor::record_tool_history(const ToolCall& call,
                                       const std::string& args_json,
                                       const std::string& result_text,
                                       long long ms, int iteration) {
    // rfind(prefix, 0) only inspects position 0, i.e. a prefix test.
    const bool failed = result_text.rfind("error", 0) == 0
                     || result_text.rfind("Error", 0) == 0;

    ToolCallRecord rec;
    rec.sequence = ++history_seq_;
    rec.tool_name = call.name;
    rec.params_summary = summarize_params(args_json);
    rec.status = failed ? "error" : "success";
    rec.result_summary = truncate_result(result_text, 200);
    rec.elapsed_ms = static_cast<double>(ms);
    rec.iteration = iteration;
    history_.record(rec);
}


std::string ToolExecutor::tool_call_key(const ToolCall& call) {

    // Sort arguments for consistent key

    nlohmann::json args;

    for (const auto& [k, v] : call.arguments) {

        args[k] = v;

    }

    return call.name + ":" + args.dump();

}


/**
 * @brief Remember a call's result for duplicate detection.
 *
 * The result text is taken from the JSON envelope via
 * parse_tool_result_text() (falling back to the raw string). Results
 * starting with "Error:" or "error:" are not cached.
 *
 * @param ctx    Loop context owning the recent_tool_calls cache.
 * @param call   The executed call (cache key source).
 * @param result Raw result, normally a JSON envelope.
 */
void ToolExecutor::record_tool_call(
    LoopContext& ctx,
    const ToolCall& call,
    const std::string& result) {
    // Extract result text from JSON envelope
    std::string text = parse_tool_result_text(result);

    // Don't cache error results. rfind(prefix, 0) tests the prefix only
    // instead of searching the whole text.
    const bool is_error = text.rfind("Error:", 0) == 0
                       || text.rfind("error:", 0) == 0;
    if (is_error) {
        return;
    }
    ctx.recent_tool_calls[tool_call_key(call)] = std::move(text);
}


/**
 * @brief Build the message telling the model a tool call was denied.
 *
 * @param call   The denied call (its name appears in the text).
 * @param reason Reason inserted after "was denied: ".
 * @return Message with role "user".
 */
Message ToolExecutor::create_denied_message(
    const ToolCall& call,
    const std::string& reason) {
    std::string body = "Tool `" + call.name + "` was denied: " + reason;
    body += "\n\n"
            "This tool is not available to you. Do NOT retry it. "
            "Use a different approach to accomplish your task.";

    Message denial;
    denial.role = "user";
    denial.content = std::move(body);
    return denial;
}


/**
 * @brief Build the message reporting a tool failure, with recovery hints.
 *
 * @param call  The failed call (its name appears in the text).
 * @param error Error description inserted after "failed with error: ".
 * @return Message with role "user".
 */
Message ToolExecutor::create_error_message(
    const ToolCall& call,
    const std::string& error) {
    std::string body =
        "Tool `" + call.name + "` failed with error: " + error;
    body += "\n\nRECOVERY:\n"
            "- Check arguments are correct\n"
            "- Try a different approach\n"
            "- Do NOT retry with the same arguments";

    Message failure;
    failure.role = "user";
    failure.content = std::move(body);
    return failure;
}


// ── Private helpers ──────────────────────────────────────


/**
 * @brief Notify the embedder of the current agent state, if a callback
 *        is installed.
 *
 * @param ctx Loop context; ctx.state is passed as an int.
 */
void ToolExecutor::fire_state_callback(const LoopContext& ctx) {
    if (callbacks_.on_state_change == nullptr) {
        return;
    }
    const int state_code = static_cast<int>(ctx.state);
    callbacks_.on_state_change(state_code, callbacks_.user_data);
}


void ToolExecutor::truncate_to_limit(

    std::vector<ToolCall>& calls,

    int limit) const {

    auto lim = static_cast<size_t>(limit);

    if (calls.size() > lim) {

        calls.resize(lim);

    }

}


std::optional<Message> ToolExecutor::check_mcp_authorization(

    const LoopContext& ctx,

    const ToolCall& call) const {

    if (auth_mgr_ == nullptr) {

        return std::nullopt;

    }

    auto identity = ctx.locked_tier.empty()

                        ? "lead" : ctx.locked_tier;

    auto required = server_manager_.get_required_access_level(

        call.name);

    if (!auth_mgr_->is_enforced(identity) ||

        auth_mgr_->check_access(identity, call.name, required)) {

        return std::nullopt;

    }

    auto level_str = mcp_access_level_name(required);

    logger->warn("MCP key denied: {} requires {} for {}",

                 call.name, level_str, identity);

    Message msg;

    msg.role = "user";

    msg.content =

        "Tool `" + call.name + "` was denied: identity `"

        + identity + "` lacks " + level_str

        + " access.\n\n"

        "Your MCP key set does not authorize this tool. "

        "Use `entropic.delegate` to hand off to an identity "

        "that has the required access.";

    return msg;

}


/**
 * @brief Combined duplicate and approval gate.
 *
 * A duplicate is answered via handle_duplicate(). Otherwise the duplicate
 * streak is reset and the call must pass check_approval().
 *
 * @param ctx  Loop context; duplicate counters are updated.
 * @param call Tool call to gate.
 * @return std::nullopt when the call may run, otherwise the rejection
 *         message.
 */
std::optional<Message> ToolExecutor::check_dup_or_approval(
    LoopContext& ctx, const ToolCall& call) {
    if (auto prior = check_duplicate(ctx, call); !prior.empty()) {
        return handle_duplicate(ctx, call, prior);
    }

    ctx.consecutive_duplicate_attempts = 0;
    if (check_approval(call)) {
        return std::nullopt;
    }
    return create_denied_message(call, "Permission denied");
}


/**
 * @brief Validate a call's arguments against the tool's schema.
 *
 * Validation is skipped when the tool has no schema or when the
 * serialized arguments do not parse as JSON.
 *
 * @param call Tool call to validate.
 * @return std::nullopt when valid or not checkable, otherwise a denial
 *         message carrying the validation error.
 */
std::optional<Message> ToolExecutor::check_schema(
    const ToolCall& call) {
    const auto schema = server_manager_.get_tool_schema(call.name);
    if (schema.empty()) {
        return std::nullopt;
    }

    const auto args = nlohmann::json::parse(
        serialize_args(call), nullptr, false);
    if (args.is_discarded()) {
        return std::nullopt;  // unparseable arguments are not validated here
    }

    const auto problem = validate_tool_args(schema, args);
    if (problem.empty()) {
        return std::nullopt;
    }

    logger->warn("Tool '{}' argument validation failed: {}",
                 call.name, problem);
    return create_denied_message(call, problem);
}


/**
 * @brief Run every precondition for a call, stopping at the first failure.
 *
 * Order: anti-spiral hard block, schema, MCP authorization, tier
 * allowlist, duplicate detection, approval.
 *
 * @param ctx  Loop context; duplicate counters may be updated.
 * @param call Tool call to check.
 * @return PreconditionCheck whose rejection is set (with the matching
 *         kind) when the call must not run.
 */
PreconditionCheck ToolExecutor::check_call_preconditions(
    LoopContext& ctx, const ToolCall& call) {
    // Issue #14 (v2.1.4): anti-spiral hard block fires FIRST. Cheaper
    // than schema/auth checks and short-circuits a tool that the
    // engine has decided to refuse, regardless of whether the call
    // would otherwise pass other preconditions.
    PreconditionCheck pc = check_anti_spiral_hard_block(ctx, call);
    if (pc.rejection.has_value()) {
        return pc;
    }

    if (auto schema_reject = check_schema(call);
        schema_reject.has_value()) {
        pc.rejection = std::move(schema_reject);
        pc.kind = ToolResultKind::rejected_schema;
        return pc;
    }

    if (auto auth_reject = check_mcp_authorization(ctx, call);
        auth_reject.has_value()) {
        pc.rejection = std::move(auth_reject);
        pc.kind = ToolResultKind::rejected_precondition;
        return pc;
    }

    if (auto tier_reject = check_tier_allowed(ctx, call);
        tier_reject.has_value()) {
        pc.rejection = std::move(tier_reject);
        pc.kind = ToolResultKind::rejected_precondition;
        return pc;
    }

    if (auto prior = check_duplicate(ctx, call); !prior.empty()) {
        pc.rejection = handle_duplicate(ctx, call, prior);
        pc.kind = ToolResultKind::rejected_duplicate;
        return pc;
    }

    return check_approval_pc(ctx, call);
}


/**
 * @brief Approval gate expressed as a PreconditionCheck.
 *
 * Resets the duplicate streak, then asks check_approval().
 *
 * @param ctx  Loop context; consecutive_duplicate_attempts is reset to 0.
 * @param call Tool call to approve.
 * @return Default PreconditionCheck when approved; otherwise one carrying
 *         a "Permission denied" message and kind rejected_precondition.
 */
PreconditionCheck ToolExecutor::check_approval_pc(
    LoopContext& ctx, const ToolCall& call) {
    PreconditionCheck verdict;
    ctx.consecutive_duplicate_attempts = 0;
    if (check_approval(call)) {
        return verdict;
    }
    verdict.rejection = create_denied_message(
        call, "Permission denied");
    verdict.kind = ToolResultKind::rejected_precondition;
    return verdict;
}


/**
 * @brief Process one tool call end to end.
 *
 * Fires the pre-tool hook, evaluates the preconditions, and only then
 * executes and finalizes the call. Rejected or cancelled calls still
 * fire the post-tool hook with an empty raw result and 0 ms.
 *
 * @param ctx  Loop context updated by the stages involved.
 * @param call Tool call to process.
 * @return A one-element vector holding the message for the model.
 */
std::vector<Message> ToolExecutor::process_single_call(
    LoopContext& ctx, const ToolCall& call) {
    // Returning `{std::move(m)}` would go through an initializer_list,
    // whose elements are const and therefore copied. Build the vector
    // explicitly so the message is really moved.
    const auto as_batch = [](Message&& only) {
        std::vector<Message> out;
        out.push_back(std::move(only));
        return out;
    };

    // Hook: PRE_TOOL_CALL first — fires for every attempt, including
    // those that a precondition will reject. (E9, 2.0.6-rc19)
    if (fire_pre_tool_hook(ctx, call)) {
        auto msg = create_denied_message(call, "Cancelled by hook");
        fire_post_tool_hook(ctx, call, "", 0.0,
            ToolResultKind::rejected_precondition, msg);
        return as_batch(std::move(msg));
    }

    auto pc = check_call_preconditions(ctx, call);
    if (pc.rejection.has_value()) {
        logger->info("Tool '{}' rejected by precondition (kind={})",
                     call.name, result_kind_to_string(pc.kind));
        fire_post_tool_hook(ctx, call, "", 0.0, pc.kind, *pc.rejection);
        return as_batch(std::move(*pc.rejection));
    }

    auto exec_start = std::chrono::steady_clock::now();
    auto [msg, raw_result] = execute_tool(ctx, call);
    auto exec_ms = std::chrono::duration<double, std::milli>(
        std::chrono::steady_clock::now() - exec_start).count();

    finalize_tool_call(ctx, call, msg, raw_result, exec_ms);

    return as_batch(std::move(msg));
}


/**
 * @brief Classify executed-tool content as error, ok_empty or ok.
 *
 * The error check runs first, so content that is both error-like and
 * effectively empty is reported as an error.
 *
 * @param content Result text shown to the model.
 * @return The matching ToolResultKind.
 */
static ToolResultKind classify_tool_result(const std::string& content) {
    const bool is_error = mcp::looks_like_tool_error(content);
    if (!is_error && !mcp::is_effectively_empty(content)) {
        return ToolResultKind::ok;
    }
    return is_error ? ToolResultKind::error : ToolResultKind::ok_empty;
}


/**
 * @brief Emit the structured "[tool_call]" log line for a finished call.
 *
 * The serialized arguments are cut to at most 512 bytes before logging.
 *
 * @param ctx        Loop context (iteration number and tier).
 * @param call       The executed call.
 * @param exec_ms    Elapsed time in milliseconds.
 * @param raw_result Raw result; only its size is logged.
 * @param kind       Classification of the result.
 */
void ToolExecutor::log_tool_call(LoopContext& ctx, const ToolCall& call,
                                 double exec_ms,
                                 const std::string& raw_result,
                                 ToolResultKind kind) {
    constexpr std::size_t kMaxLoggedArgBytes = 512;

    auto args_preview = serialize_args(call);
    if (args_preview.size() > kMaxLoggedArgBytes) {
        args_preview.resize(kMaxLoggedArgBytes);
    }

    const std::string tier_label = ctx.locked_tier.empty()
        ? std::string{"lead"} : ctx.locked_tier;

    logger->info("[tool_call] iter={} tier={} tool={} args={} "
                 "elapsed_ms={:.0f} result_chars={} status={}",
                 ctx.metrics.iterations,
                 tier_label,
                 call.name, args_preview, exec_ms,
                 raw_result.size(), result_kind_to_string(kind));
}


/**
 * @brief Post-execution bookkeeping for a tool call that actually ran.
 *
 * Caps the result size, updates counters and metadata, records the call
 * for duplicate detection, classifies the result, fires the post-tool
 * hook, updates anti-spiral tracking, logs the call and finally
 * processes directives and the after-tool hook.
 *
 * @param ctx        Loop context updated in place.
 * @param call       The executed call.
 * @param msg        Result message; content may be capped and may be
 *                   replaced by the post-tool hook.
 * @param raw_result Raw (sanitized) result JSON from the server.
 * @param exec_ms    Elapsed time in milliseconds.
 */
void ToolExecutor::finalize_tool_call(LoopContext& ctx, const ToolCall& call,
                                      Message& msg,
                                      const std::string& raw_result,
                                      double exec_ms) {
    // #46 (v2.1.0): cap result content at LoopConfig.max_tool_result_bytes
    // so a single runaway tool can't exhaust the context budget. Applied
    // BEFORE classification so kind reflects the bounded form, and BEFORE
    // record_tool_call so the duplicate cache stores what the model saw.
    apply_result_size_cap(msg.content);
    ctx.effective_tool_calls++;
    msg.metadata["added_at_iteration"] =
        std::to_string(ctx.metrics.iterations);
    record_tool_call(ctx, call, raw_result);

    // record_tool_call() derives its text from the uncapped raw_result,
    // so bound the cached entry as well. Otherwise a later duplicate
    // notice would replay the full, uncapped result to the model.
    if (auto cached = ctx.recent_tool_calls.find(tool_call_key(call));
        cached != ctx.recent_tool_calls.end()) {
        apply_result_size_cap(cached->second);
    }

    // #44 (v2.1.0): honest byte-level signal — error trumps empty.
    ToolResultKind kind = classify_tool_result(msg.content);
    fire_post_tool_hook(ctx, call, raw_result, exec_ms, kind, msg);

    // Demo ask #5 (v2.1.0): anti-spiral primitive. Track consecutive
    // same-tool calls; at threshold, populate pending_anti_spiral_warning
    // so the next turn's reminder tells the model to pivot or complete.
    update_anti_spiral_tracking(ctx, call.name);

    log_tool_call(ctx, call, exec_ms, raw_result, kind);

    extract_and_process_directives(ctx, raw_result);
    run_post_tool_hooks(ctx);
}


/**
 * @brief Fire the PRE_TOOL_CALL hook for a call.
 *
 * Any buffer the hook returns through its out-parameter is released with
 * free() and otherwise not used here.
 *
 * @param ctx  Loop context (tier and iteration go into the payload).
 * @param call Tool call about to be attempted.
 * @return true when the hook returned a non-zero code (the caller treats
 *         this as a cancellation); false when no hook is registered or it
 *         returned 0.
 */
bool ToolExecutor::fire_pre_tool_hook(
    const LoopContext& ctx, const ToolCall& call) {
    if (hook_iface_.fire_pre == nullptr) {
        return false;
    }

    const auto payload = build_pre_tool_json(call, ctx.locked_tier,
                                             ctx.metrics.iterations);
    char* modified = nullptr;
    const int status = hook_iface_.fire_pre(hook_iface_.registry,
        ENTROPIC_HOOK_PRE_TOOL_CALL, payload.c_str(), &modified);
    free(modified);
    return status != 0;
}


/**
 * @brief Bound result content to the configured max_tool_result_bytes.
 *
 * @param content Text to cap in place (delegates to mcp::truncate_to_cap).
 */
void ToolExecutor::apply_result_size_cap(std::string& content) const {
    const auto byte_cap = loop_config_.max_tool_result_bytes;
    mcp::truncate_to_cap(content, byte_cap);
}


/**
 * @brief Track consecutive calls to the same tool and arm the warning.
 *
 * The streak grows when tool_name equals the previously recorded tool and
 * restarts at 1 otherwise. Once the streak reaches
 * max_consecutive_same_tool, pending_anti_spiral_warning is filled.
 *
 * @param ctx       Loop context holding the streak state.
 * @param tool_name Name of the tool that just ran.
 */
void ToolExecutor::update_anti_spiral_tracking(
    LoopContext& ctx, const std::string& tool_name) {
    const bool same_as_last = (tool_name == ctx.last_tool_name);
    if (same_as_last) {
        ++ctx.consecutive_same_tool_calls;
    } else {
        ctx.last_tool_name = tool_name;
        ctx.consecutive_same_tool_calls = 1;
    }

    if (ctx.consecutive_same_tool_calls
            < loop_config_.max_consecutive_same_tool) {
        return;
    }

    ctx.pending_anti_spiral_warning =
        tool_name + " has been called "
        + std::to_string(ctx.consecutive_same_tool_calls)
        + " times consecutively; pivot to a different tool or "
          "complete the task next turn.";
}


/**
 * @brief Resolve the anti-spiral hard-block threshold.
 *
 * @return The configured max_consecutive_same_tool_hard_block, or
 *         max_consecutive_same_tool + 2 when the configured value is
 *         negative.
 */
int ToolExecutor::effective_hard_block_threshold() const {
    const int configured = loop_config_.max_consecutive_same_tool_hard_block;
    if (configured >= 0) {
        return configured;
    }
    const int derived = loop_config_.max_consecutive_same_tool + 2;
    return derived;
}


/**
 * @brief Refuse a call that would extend a same-tool streak past the
 *        hard-block threshold.
 *
 * The projected streak is the current streak + 1 when the call targets
 * the last tool, otherwise 1.
 *
 * @param ctx  Loop context (last tool name and current streak).
 * @param call Tool call about to be attempted.
 * @return PreconditionCheck with a denial message and kind
 *         rejected_anti_spiral when blocked; default-constructed otherwise.
 */
PreconditionCheck ToolExecutor::check_anti_spiral_hard_block(
    const LoopContext& ctx, const ToolCall& call) const {
    int projected = 1;
    if (call.name == ctx.last_tool_name) {
        projected = ctx.consecutive_same_tool_calls + 1;
    }
    const int threshold = effective_hard_block_threshold();

    PreconditionCheck verdict;
    if (projected < threshold) {
        return verdict;
    }

    const std::string text =
        "[anti-spiral] tool '" + call.name + "' blocked after "
        + std::to_string(projected)
        + " consecutive calls (threshold "
        + std::to_string(threshold)
        + "); pivot to a different tool or complete the task.";
    verdict.rejection = create_denied_message(call, text);
    verdict.kind = ToolResultKind::rejected_anti_spiral;
    return verdict;
}


/**
 * @brief Fire the POST_TOOL_CALL hook and apply its replacement content.
 *
 * When the hook hands back a non-null buffer, it replaces msg.content and
 * the buffer is released with free().
 *
 * @param ctx        Loop context (tier and iteration go into the payload).
 * @param call       The call the hook is about.
 * @param raw_result Raw result JSON (empty for rejected calls).
 * @param elapsed_ms Elapsed time in milliseconds.
 * @param kind       Outcome classification.
 * @param msg        Message whose content the hook may replace.
 */
void ToolExecutor::fire_post_tool_hook(
    const LoopContext& ctx, const ToolCall& call,
    const std::string& raw_result, double elapsed_ms,
    ToolResultKind kind, Message& msg) {
    if (hook_iface_.fire_post == nullptr) {
        return;
    }

    const auto payload = build_post_tool_json(
        call, raw_result, elapsed_ms, ctx.locked_tier,
        ctx.metrics.iterations, kind);

    char* replacement = nullptr;
    hook_iface_.fire_post(hook_iface_.registry,
        ENTROPIC_HOOK_POST_TOOL_CALL, payload.c_str(), &replacement);
    if (replacement == nullptr) {
        return;
    }
    msg.content = replacement;
    free(replacement);
}


/**
 * @brief Decide whether the remaining calls of a batch should be skipped.
 *
 * @param ctx Loop context inspected for completion, a pending delegation
 *            or pipeline, or three consecutive duplicate attempts.
 * @return true when any of those conditions holds. The results parameter
 *         is unused.
 */
bool ToolExecutor::should_stop_batch(
    const LoopContext& ctx,
    const std::vector<Message>& /*results*/) const {
    if (ctx.state == AgentState::COMPLETE) {
        return true;
    }
    if (ctx.pending_delegation.has_value()) {
        return true;
    }
    if (ctx.pending_pipeline.has_value()) {
        return true;
    }
    return ctx.consecutive_duplicate_attempts >= 3;
}


/**
 * @brief Invoke the engine's after_tool hook, if one is installed.
 *
 * @param ctx Loop context forwarded to the hook.
 */
void ToolExecutor::run_post_tool_hooks(LoopContext& ctx) {
    if (hooks_.after_tool == nullptr) {
        return;
    }
    hooks_.after_tool(ctx, hooks_.user_data);
}


/**
 * @brief Build the "you are stuck" message used after repeated duplicate
 *        calls, and log the event at error level.
 *
 * @return Message with role "user".
 */
Message ToolExecutor::create_circuit_breaker_message() {
    Message halt;
    halt.role = "user";
    halt.content =
        "STOP: You have called the same tool 3 times with "
        "identical arguments. This indicates you are stuck. "
        "Please try a completely different approach or respond "
        "to the user explaining what's blocking you.";

    logger->error("Circuit breaker triggered");
    return halt;
}


/**
 * @brief Build the notice returned for a duplicate tool call.
 *
 * If the cached result text contains "was denied" or "not available",
 * the notice says the tool is unavailable; otherwise it replays the
 * previous result.
 *
 * @param call            The duplicated call.
 * @param previous_result Cached result text of the earlier call.
 * @return Message with role "user".
 */
Message ToolExecutor::create_duplicate_message(
    const ToolCall& call,
    const std::string& previous_result) {
    const auto mentions = [&previous_result](const char* needle) {
        return previous_result.find(needle) != std::string::npos;
    };
    const bool was_denied =
        mentions("was denied") || mentions("not available");

    Message notice;
    notice.role = "user";
    if (!was_denied) {
        notice.content =
            "Tool `" + call.name + "` was already called with "
            "the same arguments.\n\nPrevious result:\n" +
            previous_result +
            "\n\nDo NOT call this tool again. "
            "Use the previous result above.";
        return notice;
    }

    notice.content =
        "Tool `" + call.name + "` is not available to you "
        "and retrying will not help. You MUST use a different "
        "approach. Do NOT call `" + call.name + "` again.";
    return notice;
}


std::string ToolExecutor::serialize_args(const ToolCall& call) {

    if (!call.arguments_json.empty()) {

        return call.arguments_json;

    }

    nlohmann::json args;

    for (const auto& [k, v] : call.arguments) {

        args[k] = v;

    }

    return args.dump();

}


std::string ToolExecutor::serialize_tool_call(const ToolCall& call) {

    nlohmann::json j;

    j["id"] = call.id;

    j["name"] = call.name;

    j["arguments"] = nlohmann::json::object();

    for (const auto& [k, v] : call.arguments) {

        j["arguments"][k] = v;

    }

    return j.dump();

}


/**
 * @brief Notify the embedder that a tool call finished, if a callback is
 *        installed.
 *
 * @param call   The executed call (passed as serialized JSON).
 * @param result Result text.
 * @param ms     Elapsed milliseconds (passed on as a double).
 */
void ToolExecutor::fire_tool_complete_callback(
    const ToolCall& call,
    const std::string& result,
    long long ms) {
    if (callbacks_.on_tool_complete != nullptr) {
        const auto payload = serialize_tool_call(call);
        const auto elapsed = static_cast<double>(ms);
        callbacks_.on_tool_complete(
            payload.c_str(), result.c_str(),
            elapsed, callbacks_.user_data);
    }
}


std::string ToolExecutor::build_post_tool_json(

    const ToolCall& call,

    const std::string& raw_result,

    double elapsed_ms,

    const std::string& tier,

    int iteration,

    ToolResultKind kind) {

    nlohmann::json ctx;

    ctx["tool_name"] = call.name;

    ctx["args"] = nlohmann::json::parse(serialize_args(call));

    ctx["elapsed_ms"] = elapsed_ms;

    ctx["tier"] = tier.empty() ? std::string{"lead"} : tier;

    ctx["iteration"] = iteration;

    ctx["result_kind"] = result_kind_to_string(kind);

    try {

        auto sr = nlohmann::json::parse(raw_result);

        ctx["result"] = sr.value("result", raw_result);

        ctx["directives"] = sr.value(

            "directives", nlohmann::json::array());

    } catch (...) {

        ctx["result"] = raw_result;

        ctx["directives"] = nlohmann::json::array();

    }

    return ctx.dump();

}


std::string ToolExecutor::build_pre_tool_json(

    const ToolCall& call,

    const std::string& tier,

    int iteration) {

    nlohmann::json j;

    j["tool_name"] = call.name;

    j["args"] = nlohmann::json::parse(serialize_args(call));

    j["tier"] = tier.empty() ? std::string{"lead"} : tier;

    j["iteration"] = iteration;

    return j.dump();

}


/**
 * @brief Collect the pipeline stage names from a tool result payload.
 *
 * Entries of "stages" that are not strings are skipped instead of raising
 * a nlohmann type_error on malformed tool output.
 *
 * @param result_json Parsed result payload.
 * @return Stage names in payload order; empty when "stages" is absent.
 */
static std::vector<std::string> extract_pipeline_stages(
    const nlohmann::json& result_json) {
    std::vector<std::string> stages;
    const auto found = result_json.find("stages");
    if (found == result_json.end()) { return stages; }
    for (const auto& stage : *found) {
        if (stage.is_string()) {
            stages.push_back(stage.get<std::string>());
        }
    }
    return stages;
}


/**
 * @brief Build a CompleteDirective from a tool result payload.
 *
 * Reads "summary", "coverage_gap", "gap_description" and, when present
 * as an array, "suggested_files". Missing keys use "", false and "".
 *
 * @param result_json Parsed result payload.
 * @return Owning pointer to the new directive.
 */
static std::unique_ptr<Directive> build_complete_directive(
    const nlohmann::json& result_json) {
    auto directive = std::make_unique<CompleteDirective>(
        result_json.value("summary", ""));
    directive->coverage_gap = result_json.value("coverage_gap", false);
    directive->gap_description = result_json.value("gap_description", "");

    const auto files = result_json.find("suggested_files");
    if (files != result_json.end() && files->is_array()) {
        directive->suggested_files =
            files->get<std::vector<std::string>>();
    }
    return directive;
}


/**
 * @brief Translate one directive descriptor into a Directive object.
 *
 * Handles the types "stop_processing", "delegate", "complete" and
 * "pipeline"; the directive's fields are read from result_json.
 *
 * @param d           Directive descriptor; its "type" selects the kind.
 * @param result_json Parsed result payload supplying the fields.
 * @return The new directive, or a null pointer for an unrecognised type.
 */
static std::unique_ptr<Directive> build_directive(
    const nlohmann::json& d, const nlohmann::json& result_json) {
    const auto type_str = d.value("type", "");

    if (type_str == "stop_processing") {
        return std::make_unique<StopProcessingDirective>();
    }
    if (type_str == "delegate") {
        // gh#32 (v2.1.6): resume_delegation emits action=resume_delegation
        // with delegation_id but no target. The directive's target is
        // resolved later by the engine after loading the original
        // delegation's tier from storage.
        return std::make_unique<DelegateDirective>(
            result_json.value("target", ""),
            result_json.value("task", ""),
            result_json.value("max_turns", -1),
            result_json.value("delegation_id", ""));
    }
    if (type_str == "complete") {
        return build_complete_directive(result_json);
    }
    if (type_str == "pipeline") {
        return std::make_unique<PipelineDirective>(
            extract_pipeline_stages(result_json),
            result_json.value("task", ""));
    }
    return nullptr;
}


/**
 * @brief Parse a raw tool result and pull out its directive list.
 *
 * @param raw_result Raw result JSON text.
 * @return Pair of (whole response object, copy of its "directives"
 *         array) when the text is a JSON object with a non-empty
 *         "directives" array; std::nullopt otherwise.
 */
static std::optional<std::pair<nlohmann::json, nlohmann::json>>
extract_directive_array(const std::string& raw_result) {
    auto envelope = nlohmann::json::parse(raw_result, nullptr, false);
    if (!envelope.is_object()) {
        return std::nullopt;
    }

    const auto found = envelope.find("directives");
    if (found == envelope.end()
        || !found->is_array() || found->empty()) {
        return std::nullopt;
    }

    // Copy the array first; the envelope is moved from afterwards.
    nlohmann::json directives = *found;
    return std::make_pair(std::move(envelope), std::move(directives));
}


/**
 * @brief Turn directives embedded in a tool result into Directive objects
 *        and hand them to the process_directives hook.
 *
 * Does nothing when no hook is installed, when the result carries no
 * non-empty "directives" array, or when none of the entries yields a
 * directive. Malformed tool output is tolerated: a "result" member that
 * is missing, not a string, or not JSON-object text is treated as an
 * empty object, and directive entries that are not objects are skipped,
 * so none of these can raise a nlohmann exception out of the tool loop.
 *
 * @param ctx        Loop context forwarded to the hook.
 * @param raw_result Raw result JSON from the server.
 */
void ToolExecutor::extract_and_process_directives(
    LoopContext& ctx, const std::string& raw_result) {
    if (hooks_.process_directives == nullptr) { return; }
    auto extracted = extract_directive_array(raw_result);
    if (!extracted) { return; }
    auto& [resp, dirs] = *extracted;

    // Directive fields live in the JSON text stored under "result".
    nlohmann::json result_json = nlohmann::json::object();
    if (const auto member = resp.find("result");
        member != resp.end() && member->is_string()) {
        auto parsed = nlohmann::json::parse(
            member->get_ref<const std::string&>(), nullptr, false);
        if (parsed.is_object()) { result_json = std::move(parsed); }
    }

    std::vector<std::unique_ptr<Directive>> owned;
    for (const auto& d : dirs) {
        if (!d.is_object()) { continue; }  // no "type" to dispatch on
        auto directive = build_directive(d, result_json);
        if (directive) { owned.push_back(std::move(directive)); }
    }
    if (owned.empty()) { return; }

    // The hook takes non-owning pointers; `owned` keeps them alive for
    // the duration of the call.
    std::vector<const Directive*> ptrs;
    ptrs.reserve(owned.size());
    for (const auto& d : owned) { ptrs.push_back(d.get()); }
    logger->info("Processing {} directives from tool result", ptrs.size());
    hooks_.process_directives(ctx, ptrs, hooks_.user_data);
}


} // namespace entropic

entropic::MCPAuthorizationManager::is_enforced
bool is_enforced(const std::string &identity_name) const
Check if an identity has authorization enforcement enabled.
Definition mcp_authorization.cpp:37

entropic::MCPAuthorizationManager::check_access
bool check_access(const std::string &identity_name, const std::string &tool_name, MCPAccessLevel required_level) const
Check if a tool call is authorized for an identity.
Definition mcp_authorization.cpp:94

entropic::ServerManager
Manages MCP server instances and routes tool calls.
Definition server_manager.h:56

entropic::ServerManager::get_required_access_level
MCPAccessLevel get_required_access_level(const std::string &tool_name) const
Get the required access level for a tool.
Definition server_manager.cpp:338

entropic::ServerManager::is_explicitly_allowed
bool is_explicitly_allowed(const std::string &tool_name, const std::string &args_json) const
Check if tool is explicitly allowed (skip prompting).
Definition server_manager.cpp:286

entropic::ServerManager::skip_duplicate_check
bool skip_duplicate_check(const std::string &tool_name) const
Check if tool should skip duplicate detection.
Definition server_manager.cpp:320

entropic::ServerManager::get_tool_schema
std::string get_tool_schema(const std::string &tool_name) const
Get the JSON Schema for a tool's input parameters.
Definition server_manager.cpp:206

entropic::ServerManager::execute
std::string execute(const std::string &tool_name, const std::string &args_json)
Execute a tool call via the appropriate server.
Definition server_manager.cpp:153

entropic::ToolCallHistory::record
void record(const ToolCallRecord &entry)
Record a completed tool call.
Definition tool_call_history.cpp:37

entropic::ToolExecutor::process_tool_calls
std::vector< Message > process_tool_calls(LoopContext &ctx, const std::vector< ToolCall > &tool_calls)
Process a batch of tool calls.
Definition tool_executor.cpp:62

entropic::ToolExecutor::ToolExecutor
ToolExecutor(ServerManager &server_manager, const LoopConfig &loop_config, EngineCallbacks &callbacks, ToolExecutorHooks hooks={})
Construct with shared dependencies.
Definition tool_executor.cpp:33

entropic::ToolExecutor::set_permission_persist
void set_permission_persist(const PermissionPersistInterface &persist)
Set permission persistence interface.
Definition tool_executor.cpp:49

ENTROPIC_HOOK_ON_PERMISSION_CHECK
@ ENTROPIC_HOOK_ON_PERMISSION_CHECK
15: Permission check evaluated
Definition hooks.h:51

ENTROPIC_HOOK_PRE_TOOL_CALL
@ ENTROPIC_HOOK_PRE_TOOL_CALL
3: Before tool execution
Definition hooks.h:39

ENTROPIC_HOOK_POST_TOOL_CALL
@ ENTROPIC_HOOK_POST_TOOL_CALL
4: After tool execution returns
Definition hooks.h:40

logging.h
spdlog initialization and logger access.

entropic::log::get
ENTROPIC_EXPORT std::shared_ptr< spdlog::logger > get(const std::string &name)
Get or create a named logger.
Definition logging.cpp:211

entropic::log::elapsed_ms
double elapsed_ms(std::chrono::steady_clock::time_point start, std::chrono::steady_clock::time_point end)
Compute elapsed milliseconds between two time points.
Definition logging.h:203

entropic
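Top-level namespace for the entropic library. (The generated brief, "Activate model on GPU (WARM → ACTIVE).", appears to have been picked up from a declaration in bundled_models.h rather than describing the namespace itself.)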
Definition bundled_models.h:20

entropic::check_type
static std::string check_type(const std::string &key, const std::string &type, const nlohmann::json &val)
Check a single value against a type constraint.
Definition tool_executor.cpp:270

entropic::ToolResultKind
ToolResultKind
Categorical outcome of a single tool invocation.
Definition tool_result.h:31

entropic::ToolResultKind::ok
@ ok
Tool dispatched, returned non-empty content.

entropic::ToolResultKind::rejected_schema
@ rejected_schema
Precondition: argument schema violation.

entropic::ToolResultKind::rejected_anti_spiral
@ rejected_anti_spiral
Anti-spiral hard threshold crossed; tool blocked. (#14, v2.1.4)

entropic::ToolResultKind::rejected_duplicate
@ rejected_duplicate
Precondition: duplicate in recent history.

entropic::ToolResultKind::ok_empty
@ ok_empty
Tool dispatched cleanly but returned no content (v2.1.0, #44)

entropic::ToolResultKind::error
@ error
Tool server returned an error payload.

entropic::ToolResultKind::rejected_precondition
@ rejected_precondition
Any other precondition rejection (auth, tier, hook-cancel).

entropic::parse_tool_result_text
static std::string parse_tool_result_text(const std::string &result_json)
Extract the "result" text from an MCP result JSON envelope.
Definition tool_executor.cpp:344

entropic::extract_pipeline_stages
static std::vector< std::string > extract_pipeline_stages(const nlohmann::json &result_json)
Extract pipeline stage names from a result JSON (presumably a tool's ServerResponse — verify against tool_executor.cpp:1185).
Definition tool_executor.cpp:1185

entropic::check_property_constraints
static std::string check_property_constraints(const std::string &key, const nlohmann::json &prop, const nlohmann::json &val)
Check one property's enum and type constraints.
Definition tool_executor.cpp:294

entropic::classify_tool_result
static ToolResultKind classify_tool_result(const std::string &content)
Classify a tool result by its content (error/empty/ok).
Definition tool_executor.cpp:747

entropic::mcp_access_level_name
const char * mcp_access_level_name(MCPAccessLevel level)
Convert MCPAccessLevel to string representation.
Definition config.cpp:21

entropic::build_directive
static std::unique_ptr< Directive > build_directive(const nlohmann::json &d, const nlohmann::json &result_json)
Build a Directive from a parsed directive + result JSON.
Definition tool_executor.cpp:1234

entropic::result_kind_to_string
const char * result_kind_to_string(ToolResultKind kind)
Serialize a ToolResultKind to its wire-stable string form.
Definition tool_result.h:49

entropic::build_complete_directive
static std::unique_ptr< Directive > build_complete_directive(const nlohmann::json &result_json)
Build a typed Directive from a directive-descriptor JSON.
Definition tool_executor.cpp:1215

entropic::extract_directive_array
static std::optional< std::pair< nlohmann::json, nlohmann::json > > extract_directive_array(const std::string &raw_result)
Pull the "directives" array out of a tool ServerResponse JSON.
Definition tool_executor.cpp:1269

entropic::truncate_result
std::string truncate_result(const std::string &text, size_t max_len)
Truncate a string to max_len characters with "..." suffix.
Definition tool_call_history.cpp:171

entropic::dup
static char * dup(const std::string &s)
Heap-allocate a C string copy.
Definition interface_factory.cpp:117

entropic::summarize_params
std::string summarize_params(const std::string &args_json)
Extract top-level JSON keys as a comma-separated summary.
Definition tool_call_history.cpp:144

entropic::validate_tool_args
static std::string validate_tool_args(const std::string &schema_json, const nlohmann::json &args)
Validate tool arguments against the tool's JSON Schema.
Definition tool_executor.cpp:319

entropic::check_enum
static std::string check_enum(const std::string &key, const nlohmann::json &allowed, const nlohmann::json &val)
Check a single value against an enum constraint (the list of allowed values).
Definition tool_executor.cpp:249

entropic::check_required_fields
static std::string check_required_fields(const nlohmann::json &schema, const nlohmann::json &args)
Check required fields are present.
Definition tool_executor.cpp:217

entropic::EngineCallbacks
Callback function pointer types for engine events.
Definition engine_types.h:300

entropic::EngineCallbacks::on_tool_call
void(* on_tool_call)(const char *json, void *ud)
Tool call request.
Definition engine_types.h:306

entropic::EngineCallbacks::on_tool_complete
void(* on_tool_complete)(const char *json, const char *result, double ms, void *ud)
Tool execution done.
Definition engine_types.h:308

entropic::EngineCallbacks::user_data
void * user_data
Opaque pointer passed to all callbacks.
Definition engine_types.h:324

entropic::EngineCallbacks::on_tool_start
void(* on_tool_start)(const char *json, void *ud)
Tool execution start.
Definition engine_types.h:307

entropic::EngineCallbacks::on_state_change
void(* on_state_change)(int state, void *ud)
AgentState as int.
Definition engine_types.h:301

entropic::LoopConfig
Configuration for the agentic loop.
Definition engine_types.h:74

entropic::LoopConfig::max_consecutive_same_tool
int max_consecutive_same_tool
Anti-spiral SOFT threshold: after N consecutive calls of the SAME tool (regardless of arg similarity,...
Definition engine_types.h:90

entropic::LoopConfig::max_consecutive_same_tool_hard_block
int max_consecutive_same_tool_hard_block
Anti-spiral HARD threshold: when consecutive same-tool calls exceed this, the engine blocks the call ...
Definition engine_types.h:98

entropic::LoopConfig::auto_approve_tools
bool auto_approve_tools
Skip tool approval (v1.8.5)
Definition engine_types.h:82

entropic::LoopConfig::max_tool_result_bytes
int max_tool_result_bytes
Maximum byte length for a single tool's result content before the engine truncates with a "[....
Definition engine_types.h:116

entropic::LoopConfig::max_tool_calls_per_turn
int max_tool_calls_per_turn
Tool calls per iteration (v1.8.5)
Definition engine_types.h:77

entropic::LoopContext
Mutable state carried through the agentic loop.
Definition engine_types.h:223

entropic::LoopContext::consecutive_errors
int consecutive_errors
Error streak counter.
Definition engine_types.h:228

entropic::LoopContext::effective_max_tool_calls_per_turn
int effective_max_tool_calls_per_turn
Per-identity override (-1 = LoopConfig, P3-18)
Definition engine_types.h:248

entropic::LoopContext::state
AgentState state
Current state.
Definition engine_types.h:226

entropic::PermissionPersistInterface
Permission persistence interface.
Definition engine_types.h:512

entropic::ToolCall
A tool call request parsed from model output.
Definition tool_call.h:31

entropic::ToolExecutorHooks
Engine-level hooks called during tool processing.
Definition engine_types.h:378

entropic::ToolExecutorHooks::after_tool
void(* after_tool)(LoopContext &ctx, void *user_data)
Called after each tool execution.
Definition engine_types.h:381

entropic::ToolExecutorHooks::process_directives
DirectiveResult(* process_directives)(LoopContext &ctx, const std::vector< const Directive * > &directives, void *user_data)
Process directives from tool results.
Definition engine_types.h:385

entropic::ToolExecutorHooks::user_data
void * user_data
Opaque pointer for hooks.
Definition engine_types.h:390

tool_executor.h
Processes tool calls from model output.

tool_result_classify.h
Byte-level classifiers for tool-result content (#44, v2.1.0).

utf8_sanitize.h
UTF-8 validation + replacement at every system boundary where bytes change ownership.