Entropic 2.3.8
Local-first agentic inference engine
Loading...
Searching...
No Matches
response_generator.h
Go to the documentation of this file.
1// SPDX-License-Identifier: Apache-2.0
12#pragma once
13
18
19#include <string>
20#include <vector>
21
22namespace entropic {
23
29 std::string content;
30 std::string tool_calls_json;
31 std::string finish_reason;
32};
33
43public:
52 ResponseGenerator(const InferenceInterface& inference,
53 const LoopConfig& loop_config,
54 EngineCallbacks& callbacks,
55 GenerationEvents events);
56
64
72 bool is_response_complete(const std::string& content,
73 const std::string& tool_calls_json);
74
75private:
81 void lock_tier_if_needed(LoopContext& ctx);
82
89 GenerateResult generate_streaming(LoopContext& ctx);
90
97 GenerateResult generate_batch(LoopContext& ctx);
98
112 std::pair<std::string, std::string> prepare_prompts(
113 LoopContext& ctx, const char* mode);
114
122 std::string handle_pause(LoopContext& ctx,
123 const std::string& partial);
124
131 static std::string serialize_messages(
132 const std::vector<Message>& messages);
133
140 static std::string build_params_json(const std::string& tier);
141
149 std::vector<Message> inject_tool_prompt(
150 const std::vector<Message>& messages,
151 const std::string& tier);
152
177 std::vector<Message> inject_engine_state_reminder(
178 const std::vector<Message>& messages,
179 const LoopContext& ctx);
180
181 InferenceInterface inference_;
182 LoopConfig loop_config_;
183 EngineCallbacks& callbacks_;
184 GenerationEvents events_;
185 HookInterface hooks_;
190 TokenCallback stream_observer_ = nullptr;
191 void* stream_observer_data_ = nullptr;
192
197 void (*state_observer_)(int, void*) = nullptr;
198 void* state_observer_data_ = nullptr;
199
200public:
207 void set_hooks(const HookInterface& hooks) { hooks_ = hooks; }
208
222 void set_stream_observer(TokenCallback observer, void* user_data) {
223 stream_observer_ = observer;
224 stream_observer_data_ = user_data;
225 }
226
233 TokenCallback stream_observer() const { return stream_observer_; }
234
248 void (*observer)(int, void*), void* user_data) {
249 state_observer_ = observer;
250 state_observer_data_ = user_data;
251 }
252
259 void* stream_observer_data() const { return stream_observer_data_; }
260};
261
262} // namespace entropic
Handles model response generation, tier routing, pause/injection.
GenerateResult generate_response(LoopContext &ctx)
Generate model response, routing tier first if needed.
void set_stream_observer(TokenCallback observer, void *user_data)
Set the global stream observer.
bool is_response_complete(const std::string &content, const std::string &tool_calls_json)
Check if the last response indicates completion.
void set_hooks(const HookInterface &hooks)
Set the hook dispatch interface.
void set_state_observer(void(*observer)(int, void *), void *user_data)
Set the persistent state-transition observer.
void * stream_observer_data() const
Get the observer's user_data pointer.
TokenCallback stream_observer() const
Get the registered stream observer callback.
Types for the agentic loop engine.
Hook dispatch interface injected into engine subsystems.
Function pointer types for core-to-inference communication.
Activate model on GPU (WARM → ACTIVE).
void(*)(const char *, size_t, void *) TokenCallback
Token callback type matching the C API signature.
Streaming filter that strips <think>...</think> blocks.
Callback function pointer types for engine events.
Result of a generate_response call.
std::string tool_calls_json
Tool calls as JSON (empty if none)
std::string finish_reason
"stop", "length", "interrupted"
std::string content
Cleaned response content.
Atomic flags for interrupt/pause signaling.
Configuration for the agentic loop.
Mutable state carried through the agentic loop.