From 05fe38e289bf00ba8a6e0b9188f20c9f513a678f Mon Sep 17 00:00:00 2001
From: Petr Mironychev <9195189+Palm1r@users.noreply.github.com>
Date: Thu, 11 Jun 2026 13:36:23 +0200
Subject: [PATCH] refactor: Remove project rules

---
 ChatView/ChatCompressor.cpp                   |   6 +-
 ChatView/ChatModel.cpp                        |  16 -
 ChatView/ChatModel.hpp                        |   1 -
 ChatView/ClientInterface.cpp                  |  12 +-
 ChatView/ClientInterface.hpp                  |   1 -
 LLMClientInterface.cpp                        |   7 +-
 QuickRefactorHandler.cpp                      |   5 +-
 README.md                                     |   3 +-
 bench/main.cpp                                | 228 ++++--
 docs/agent-roles.md                           |   1 -
 docs/chat-summarization.md                    |   1 -
 docs/core-class-diagram.svg                   |   1 +
 docs/project-rules.md                         |  35 -
 docs/quick-refactoring.md                     |   2 -
 docs/target-architecture.md                   | 652 ++++++++++++++++++
 settings/AgentDetailPane.cpp                  |  14 +-
 settings/AgentDetailPane.hpp                  |   2 +-
 sources/Session/CMakeLists.txt                |   1 +
 sources/Session/ErrorInfo.hpp                 |  61 ++
 sources/Session/ResponseEvent.hpp             |  24 +-
 sources/Session/ResponseRouter.cpp            |  22 +-
 sources/Session/ResponseRouter.hpp            |   6 +-
 sources/Session/Session.cpp                   | 111 +--
 sources/Session/Session.hpp                   |  24 +-
 sources/Session/SessionManager.cpp            |  12 -
 sources/Session/SessionManager.hpp            |   6 +-
 sources/Session/SystemPromptBuilder.cpp       |  37 +-
 sources/Session/SystemPromptBuilder.hpp       |  14 +-
 sources/agents/Agent.cpp                      |   2 +
 sources/agents/AgentConfig.hpp                |   2 +
 sources/agents/AgentFactory.cpp               |   2 +-
 sources/agents/AgentLoader.cpp                |  97 ++-
 sources/agents/AgentLoader.hpp                |   5 +-
 sources/agents/anthropic_base_chat.toml       |   1 +
 .../agents/partials/anthropic_messages.jinja  |  13 +-
 sources/agents/partials/ollama_messages.jinja |  39 +-
 .../agents/partials/openai_assistant.jinja    |   2 +-
 .../partials/openai_image_content.jinja       |   9 +-
 sources/providers/CMakeLists.txt              |   1 +
 sources/providers/ClaudeCacheControl.hpp      |  90 +++
 sources/providers/Provider.cpp                |  37 +-
 sources/providers/Provider.hpp                |   6 +-
 sources/templates/JsonPromptTemplate.cpp      |  13 +-
 sources/templates/JsonPromptTemplate.hpp      |   4 +-
 sources/templates/PromptTemplate.hpp          |   4 +-
 45 files changed, 1333 insertions(+), 299 deletions(-)
 create mode 100644 docs/core-class-diagram.svg
 delete mode 100644 docs/project-rules.md
 create mode 100644 docs/target-architecture.md
 create mode 100644 sources/Session/ErrorInfo.hpp
 create mode 100644 sources/providers/ClaudeCacheControl.hpp

diff --git a/ChatView/ChatCompressor.cpp b/ChatView/ChatCompressor.cpp
index a5b1a9d..115c5a7 100644
--- a/ChatView/ChatCompressor.cpp
+++ b/ChatView/ChatCompressor.cpp
@@ -125,10 +125,10 @@ void ChatCompressor::startCompression(const QString &chatFilePath, ChatModel *ch
     std::vector<std::unique_ptr<LLMQore::ContentBlock>> blocks;
     blocks.push_back(std::make_unique<LLMQore::TextContent>(buildCompressionPrompt()));
 
-    m_currentRequestId = session->send(
-        std::move(blocks), /*toolsOverride=*/false, /*thinkingOverride=*/false);
+    m_currentRequestId = session->send(std::move(blocks), /*toolsOverride=*/false);
     if (m_currentRequestId.isEmpty()) {
-        handleCompressionError(tr("Failed to start compression request"));
+        handleCompressionError(tr("Failed to start compression request: %1")
+                                   .arg(session->lastError().message));
         return;
     }
     LOG_MESSAGE(QString("Starting compression request: %1").arg(m_currentRequestId));
diff --git a/ChatView/ChatModel.cpp b/ChatView/ChatModel.cpp
index d5973fa..125e536 100644
--- a/ChatView/ChatModel.cpp
+++ b/ChatView/ChatModel.cpp
@@ -390,22 +390,6 @@ void ChatModel::addToolExecutionStatus(
     }
 }
 
-void ChatModel::dropTrailingAssistantMessage(const QString &requestId)
-{
-    if (m_messages.isEmpty())
-        return;
-
-    const Message &last = m_messages.last();
-    if (last.role != ChatRole::Assistant || last.id != requestId)
-        return;
-
-    const int idx = m_messages.size() - 1;
-    beginRemoveRows(QModelIndex(), idx, idx);
-    m_messages.removeLast();
-    endRemoveRows();
-    LOG_MESSAGE(QString("Dropped leaked pre-tool assistant message at index %1").arg(idx));
-}
-
 void ChatModel::setToolMessageData(
     const QString &toolId,
     const QString &toolName,
diff --git a/ChatView/ChatModel.hpp b/ChatView/ChatModel.hpp
index 0da2fac..c06c198 100644
--- a/ChatView/ChatModel.hpp
+++ b/ChatView/ChatModel.hpp
@@ -102,7 +102,6 @@ public:
         const QString &toolId,
         const QString &toolName,
         const QJsonObject &toolArguments);
-    void dropTrailingAssistantMessage(const QString &requestId);
     void setToolMessageData(
         const QString &toolId,
         const QString &toolName,
diff --git a/ChatView/ClientInterface.cpp b/ChatView/ClientInterface.cpp
index 7376a50..47550ca 100644
--- a/ChatView/ClientInterface.cpp
+++ b/ChatView/ClientInterface.cpp
@@ -268,8 +268,8 @@ void ClientInterface::sendMessage(
 
     const LLMQore::RequestID requestId = session->send(std::move(blocks));
     if (requestId.isEmpty()) {
-        const QString error = QStringLiteral("Failed to start chat request for agent: %1")
-                                  .arg(m_activeAgent);
+        const QString error = QStringLiteral("Failed to start chat request for agent '%1': %2")
+                                  .arg(m_activeAgent, session->lastError().message);
         LOG_MESSAGE(error);
         m_sessionManager->removeSession(session);
         emit errorOccurred(error);
@@ -277,7 +277,7 @@ void ClientInterface::sendMessage(
     }
 
     QJsonObject request{{"id", requestId}};
-    m_activeRequests[requestId] = {request, session, /*dropPreToolText=*/false};
+    m_activeRequests[requestId] = {request, session};
 
     emit requestStarted(requestId);
 }
@@ -613,15 +613,11 @@ void ClientInterface::handleToolExecutionStarted(
     const QString &toolName,
     const QJsonObject &arguments)
 {
-    const auto requestIt = m_activeRequests.constFind(requestId);
-    if (requestIt == m_activeRequests.constEnd()) {
+    if (!m_activeRequests.contains(requestId)) {
         LOG_MESSAGE(QString("Ignoring tool execution start for non-chat request: %1").arg(requestId));
         return;
     }
 
-    if (requestIt->dropPreToolText) {
-        m_chatModel->dropTrailingAssistantMessage(requestId);
-    }
     m_chatModel->addToolExecutionStatus(requestId, toolId, toolName, arguments);
     m_awaitingContinuation.insert(requestId);
 }
diff --git a/ChatView/ClientInterface.hpp b/ChatView/ClientInterface.hpp
index 549b09b..06ee6bb 100644
--- a/ChatView/ClientInterface.hpp
+++ b/ChatView/ClientInterface.hpp
@@ -91,7 +91,6 @@ private:
     {
         QJsonObject originalRequest;
         QPointer<Session> session;
-        bool dropPreToolText = false;
     };
 
     ChatModel *m_chatModel;
diff --git a/LLMClientInterface.cpp b/LLMClientInterface.cpp
index a6a1bf4..a1ac8af 100644
--- a/LLMClientInterface.cpp
+++ b/LLMClientInterface.cpp
@@ -276,8 +276,8 @@ void LLMClientInterface::handleCompletion(const QJsonObject &request)
     connect(session, &Session::finished, this, [this, session](const LLMQore::RequestID &, const QString &) {
         onCompletionFinished(requestIdForSession(session));
     });
-    connect(session, &Session::failed, this, [this, session](const LLMQore::RequestID &, const QString &error) {
-        onCompletionFailed(requestIdForSession(session), error);
+    connect(session, &Session::failed, this, [this, session](const LLMQore::RequestID &, const QodeAssist::ErrorInfo &error) {
+        onCompletionFailed(requestIdForSession(session), error.message);
     });
 
     if (auto *client = session->client())
@@ -286,8 +286,9 @@ void LLMClientInterface::handleCompletion(const QJsonObject &request)
 
     const LLMQore::RequestID requestId = session->sendCompletion(std::move(context));
     if (requestId.isEmpty()) {
+        QString error = QString("Failed to start completion request for agent '%1': %2")
+                            .arg(agentName, session->lastError().message);
         session->deleteLater();
-        QString error = QString("Failed to start completion request for agent: %1").arg(agentName);
         LOG_MESSAGE(error);
         sendErrorResponse(request, error);
         return;
diff --git a/QuickRefactorHandler.cpp b/QuickRefactorHandler.cpp
index 7f9af1a..3e8cd5f 100644
--- a/QuickRefactorHandler.cpp
+++ b/QuickRefactorHandler.cpp
@@ -202,9 +202,10 @@ void QuickRefactorHandler::prepareAndSendRequest(
     const LLMQore::RequestID requestId = session->send(std::move(blocks), enableTools);
     if (requestId.isEmpty()) {
         m_isRefactoringInProgress = false;
+        const QString reason = session->lastError().message;
         m_sessionManager->removeSession(session);
-        emitError(QStringLiteral("Failed to start quick refactor request for agent: %1")
-                      .arg(agentName));
+        emitError(QStringLiteral("Failed to start quick refactor request for agent '%1': %2")
+                      .arg(agentName, reason));
         return;
     }
 
diff --git a/README.md b/README.md
index dca71bf..40fb928 100644
--- a/README.md
+++ b/README.md
@@ -218,7 +218,6 @@ For optimal coding assistance, we recommend using these top-tier models:
 
 - **[Agent Roles](docs/agent-roles.md)** - Create AI personas with specialized system prompts
 - **[Chat Summarization](docs/chat-summarization.md)** - Compress conversations to save context tokens
-- **[Project Rules](docs/project-rules.md)** - Customize AI behavior for your project
 - **[Ignoring Files](docs/ignoring-files.md)** - Exclude files from context using `.qodeassistignore`
 
 ## Features
@@ -473,7 +472,7 @@ QodeAssist uses a flexible prompt composition system that adapts to different co
 - **Custom Instructions** provide reusable templates that can be augmented with specific details
 - **Tool Calling** is available for Chat and Quick Refactor when enabled
 
-See [Project Rules Documentation](docs/project-rules.md), [Agent Roles Guide](docs/agent-roles.md), and [Quick Refactoring Guide](docs/quick-refactoring.md) for more details.
+See [Agent Roles Guide](docs/agent-roles.md) and [Quick Refactoring Guide](docs/quick-refactoring.md) for more details.
 
 ## QtCreator Version Compatibility
 
diff --git a/bench/main.cpp b/bench/main.cpp
index 62d9f58..da962a1 100644
--- a/bench/main.cpp
+++ b/bench/main.cpp
@@ -7,18 +7,23 @@
 #include <QFile>
 #include <QFileInfo>
 #include <QHash>
+#include <QJsonArray>
 #include <QJsonDocument>
 #include <QJsonObject>
 #include <QRegularExpression>
 #include <QTextStream>
 #include <QTimer>
 
+#include <functional>
 #include <memory>
+#include <optional>
 #include <vector>
 
 #include <LLMQore/BaseClient.hpp>
+#include <LLMQore/BaseTool.hpp>
 #include <LLMQore/ContentBlocks.hpp>
 #include <LLMQore/ToolRegistry.hpp>
+#include <LLMQore/ToolResult.hpp>
 #include <LLMQore/ToolsManager.hpp>
 
 #include <Agent.hpp>
@@ -145,6 +150,69 @@ QString imageMediaType(const QString &path)
     return {};
 }
 
+class BenchEchoTool : public LLMQore::BaseTool // test-only tool, registered by --builtin-tools
+{
+public:
+    using BaseTool::BaseTool; // inherit the base-class constructors unchanged
+    QString id() const override { return QStringLiteral("bench_echo"); }
+    QString displayName() const override { return QStringLiteral("Bench echo"); }
+    QString description() const override
+    {
+        return QStringLiteral("Echoes the given text back verbatim. "
+                              "Use whenever the user asks to echo something.");
+    }
+    QJsonObject parametersSchema() const override // object schema: one required string, "text"
+    {
+        return QJsonObject{
+            {QStringLiteral("type"), QStringLiteral("object")},
+            {QStringLiteral("properties"),
+             QJsonObject{
+                 {QStringLiteral("text"),
+                  QJsonObject{
+                      {QStringLiteral("type"), QStringLiteral("string")},
+                      {QStringLiteral("description"), QStringLiteral("Text to echo back")}}}}},
+            {QStringLiteral("required"), QJsonArray{QStringLiteral("text")}}};
+    }
+    QFuture<LLMQore::ToolResult> executeAsync(const QJsonObject &input) override
+    { // ready future holding "echo: <text>"; a missing or non-string "text" echoes as ""
+        return QtFuture::makeReadyValueFuture(LLMQore::ToolResult::text(
+            QStringLiteral("echo: %1").arg(input.value(QStringLiteral("text")).toString())));
+    }
+};
+
+// Test-only tool (--builtin-tools): adds numeric arguments "a" and "b", returns the sum as text.
+class BenchAddTool : public LLMQore::BaseTool
+{
+public:
+    using BaseTool::BaseTool;
+    QString id() const override { return QStringLiteral("bench_add"); }
+    QString displayName() const override { return QStringLiteral("Bench add"); }
+    QString description() const override
+    {
+        return QStringLiteral("Adds two numbers and returns the sum. "
+                              "Use whenever the user asks to add numbers.");
+    }
+    QJsonObject parametersSchema() const override
+    {
+        const QJsonObject number{{QStringLiteral("type"), QStringLiteral("number")}};
+        return QJsonObject{
+            {QStringLiteral("type"), QStringLiteral("object")},
+            {QStringLiteral("properties"),
+             QJsonObject{{QStringLiteral("a"), number}, {QStringLiteral("b"), number}}},
+            {QStringLiteral("required"), QJsonArray{QStringLiteral("a"), QStringLiteral("b")}}};
+    }
+    QFuture<LLMQore::ToolResult> executeAsync(const QJsonObject &input) override
+    {
+        // Missing or non-numeric operands read as 0.0 (QJsonValue::toDouble default).
+        const double sum = input.value(QStringLiteral("a")).toDouble()
+                           + input.value(QStringLiteral("b")).toDouble();
+        // QString::number(double) defaults to 6 significant digits (1234568 -> "1.23457e+06");
+        // 15 prints integers below 1e15 exactly and still hides noise such as 0.1 + 0.2.
+        return QtFuture::makeReadyValueFuture(
+            LLMQore::ToolResult::text(QString::number(sum, 'g', 15)));
+    }
+};
+
 void printEvent(const ResponseEvent &ev, bool showThinking)
 {
     switch (ev.kind()) {
@@ -178,8 +246,10 @@ void printEvent(const ResponseEvent &ev, bool showThinking)
             err() << "[tool-result" << (d->isError ? " ERROR" : "") << "] " << d->text << "\n";
         break;
     case ResponseEvent::Kind::Usage:
-        if (const auto *d = ev.as<ResponseEvents::Usage>())
-            err() << "\n[usage] in=" << d->inputTokens << " out=" << d->outputTokens << "\n";
+        if (const auto *d = ev.as<ResponseEvents::Usage>()) {
+            err() << "\n[usage] in=" << d->inputTokens << " out=" << d->outputTokens
+                  << " cached=" << d->cachedTokens << " reasoning=" << d->reasoningTokens << "\n";
+        }
         break;
     case ResponseEvent::Kind::Error:
         if (const auto *d = ev.as<ResponseEvents::Error>())
@@ -212,7 +282,9 @@ int main(int argc, char *argv[])
         QStringList{"f", "file"}, "Load an agent from a TOML file instead of by name.", "path");
     QCommandLineOption promptOpt(
         QStringList{"p", "prompt"},
-        "Prompt text. If omitted, positional args or stdin are used.",
+        "Prompt text. Repeatable: each occurrence is one chat turn, sent after the "
+        "previous turn finishes (history is replayed through the agent template). "
+        "If omitted, positional args or stdin are used as a single turn.",
         "text");
     QCommandLineOption noThinkingOpt("no-thinking", "Hide thinking deltas from output.");
     QCommandLineOption envOpt(
@@ -221,6 +293,11 @@ int main(int argc, char *argv[])
         "path");
     QCommandLineOption apiKeyOpt(
         "api-key", "API key to use for the agent's provider (overrides env/settings).", "value");
+    QCommandLineOption timeoutOpt(
+        "timeout",
+        "Network transfer timeout in seconds (a stalled stream fails instead of hanging). "
+        "Default 60, 0 disables.",
+        "seconds");
     QCommandLineOption projectDirOpt(
         QStringList{"C", "project-dir"},
         "Project root for the agent's context (${PROJECT_DIR}). Defaults to the current directory.",
@@ -233,6 +310,11 @@ int main(int argc, char *argv[])
         "mcp",
         "Load MCP servers from a JSON config (mcpServers map) to give the agent executable tools.",
         "path");
+    QCommandLineOption builtinToolsOpt(
+        "builtin-tools",
+        "Register local test tools (bench_echo, bench_add) and force tools on. "
+        "Lets the model exercise tool calls without an MCP server, e.g. "
+        "-p \"echo hello via the tool\" -p \"now add 2 and 3\".");
     QCommandLineOption fimOpt(
         "fim",
         "Fill-in-the-middle completion mode: send prompt as the prefix and --suffix as the suffix.");
@@ -245,9 +327,11 @@ int main(int argc, char *argv[])
     parser.addOption(noThinkingOpt);
     parser.addOption(envOpt);
     parser.addOption(apiKeyOpt);
+    parser.addOption(timeoutOpt);
     parser.addOption(projectDirOpt);
     parser.addOption(imageOpt);
     parser.addOption(mcpOpt);
+    parser.addOption(builtinToolsOpt);
     parser.addOption(fimOpt);
     parser.addOption(suffixOpt);
     parser.addPositionalArgument("prompt", "Prompt text (alternative to --prompt).", "[prompt...]");
@@ -292,6 +376,20 @@ int main(int argc, char *argv[])
         return 1;
     }
 
+    {
+        bool ok = false;
+        const int timeoutSecs = parser.isSet(timeoutOpt)
+                                    ? parser.value(timeoutOpt).toInt(&ok)
+                                    : 60;
+        if (parser.isSet(timeoutOpt) && !ok) {
+            err() << "Invalid --timeout value.\n";
+            return 2;
+        }
+        if (timeoutSecs > 0)
+            if (auto *client = session->client())
+                client->setTransferTimeout(timeoutSecs * 1000);
+    }
+
     {
         QHash<QString, QString> envFile;
         QString envPath = parser.value(envOpt);
@@ -327,21 +425,41 @@ int main(int argc, char *argv[])
 
     const QStringList imagePaths = parser.values(imageOpt);
 
-    QString prompt = parser.value(promptOpt);
-    if (prompt.isEmpty())
-        prompt = parser.positionalArguments().join(QLatin1Char(' '));
-    if (prompt.isEmpty() && imagePaths.isEmpty())
-        prompt = readStdin().trimmed();
-    if (prompt.isEmpty() && imagePaths.isEmpty()) {
+    QStringList turns = parser.values(promptOpt);
+    if (turns.isEmpty()) {
+        QString prompt = parser.positionalArguments().join(QLatin1Char(' '));
+        if (prompt.isEmpty() && imagePaths.isEmpty())
+            prompt = readStdin().trimmed();
+        if (!prompt.isEmpty())
+            turns << prompt;
+    }
+    if (turns.isEmpty() && imagePaths.isEmpty()) {
         err() << "Empty prompt.\n";
         return 2;
     }
+    if (fimMode && turns.size() > 1) {
+        err() << "FIM mode takes a single prompt; extra turns ignored.\n";
+        turns = {turns.first()};
+    }
 
     if (!imagePaths.isEmpty() && !session->supportsImages())
         err() << "[warning] agent's provider does not advertise image support.\n";
 
+    std::optional<bool> toolsOverride;
+    if (parser.isSet(builtinToolsOpt) || parser.isSet(mcpOpt))
+        toolsOverride = true;
+
+    if (parser.isSet(builtinToolsOpt)) {
+        auto *tools = session->client()->tools();
+        tools->addTool(new BenchEchoTool(tools));
+        tools->addTool(new BenchAddTool(tools));
+        err() << "[tools] registered bench_echo, bench_add\n";
+    }
+
     const bool showThinking = !parser.isSet(noThinkingOpt);
     int exitCode = 0;
+    int nextTurn = 0;
+    std::function<void()> sendNextTurn;
 
     QObject::connect(
         session, &Session::event, &app, [showThinking](const ResponseEvent &ev) {
@@ -351,65 +469,83 @@ int main(int argc, char *argv[])
         session, &Session::finished, &app,
         [&](const LLMQore::RequestID &, const QString &reason) {
             err() << "\n[done] stopReason=" << (reason.isEmpty() ? "<none>" : reason) << "\n";
+            if (!fimMode && nextTurn < turns.size()) {
+                sendNextTurn();
+                return;
+            }
             QCoreApplication::quit();
         });
     QObject::connect(
         session, &Session::failed, &app,
-        [&](const LLMQore::RequestID &, const QString &msg) {
-            err() << "\n[failed] " << msg << "\n";
+        [&](const LLMQore::RequestID &, const QodeAssist::ErrorInfo &info) {
+            err() << "\n[failed] " << info.message << "\n";
             exitCode = 1;
             QCoreApplication::quit();
         });
+    QObject::connect(
+        session, &Session::cancelled, &app, [&](const LLMQore::RequestID &) {
+            err() << "\n[cancelled]\n";
+            QCoreApplication::quit();
+        });
 
-    auto dispatch = [&] {
-        if (fimMode) {
-            Templates::ContextData ctx;
-            ctx.prefix = prompt;
-            if (parser.isSet(suffixOpt))
-                ctx.suffix = parser.value(suffixOpt);
-            if (session->sendCompletion(std::move(ctx)).isEmpty()) {
-                err() << "Failed to dispatch FIM request (check provider URL / model).\n";
-                exitCode = 1;
-                QCoreApplication::quit();
-            }
-            return;
-        }
-
+    sendNextTurn = [&] {
         std::vector<std::unique_ptr<LLMQore::ContentBlock>> blocks;
-        for (const QString &imgPath : imagePaths) {
-            QFile img(imgPath);
-            if (!img.open(QIODevice::ReadOnly)) {
-                err() << "[image] cannot open: " << imgPath << "\n";
-                exitCode = 1;
-                QCoreApplication::quit();
-                return;
+        if (nextTurn == 0) {
+            for (const QString &imgPath : imagePaths) {
+                QFile img(imgPath);
+                if (!img.open(QIODevice::ReadOnly)) {
+                    err() << "[image] cannot open: " << imgPath << "\n";
+                    exitCode = 1;
+                    QCoreApplication::quit();
+                    return;
+                }
+                const QString media = imageMediaType(imgPath);
+                if (media.isEmpty()) {
+                    err() << "[image] unsupported type: " << imgPath << "\n";
+                    exitCode = 1;
+                    QCoreApplication::quit();
+                    return;
+                }
+                const QString b64 = QString::fromLatin1(img.readAll().toBase64());
+                blocks.push_back(std::make_unique<LLMQore::ImageContent>(
+                    b64, media, LLMQore::ImageContent::ImageSourceType::Base64));
             }
-            const QString media = imageMediaType(imgPath);
-            if (media.isEmpty()) {
-                err() << "[image] unsupported type: " << imgPath << "\n";
-                exitCode = 1;
-                QCoreApplication::quit();
-                return;
-            }
-            const QString b64 = QString::fromLatin1(img.readAll().toBase64());
-            blocks.push_back(std::make_unique<LLMQore::ImageContent>(
-                b64, media, LLMQore::ImageContent::ImageSourceType::Base64));
         }
-        if (!prompt.isEmpty())
-            blocks.push_back(std::make_unique<LLMQore::TextContent>(prompt));
+        const QString text = turns.value(nextTurn);
+        if (!text.isEmpty())
+            blocks.push_back(std::make_unique<LLMQore::TextContent>(text));
         if (blocks.empty()) {
             err() << "Nothing to send.\n";
             exitCode = 1;
             QCoreApplication::quit();
             return;
         }
-        if (session->send(std::move(blocks)).isEmpty()) {
-            err() << "Failed to dispatch request (check provider URL / model).\n";
+        if (turns.size() > 1)
+            err() << "\n[turn " << (nextTurn + 1) << "/" << turns.size() << "] " << text << "\n";
+        ++nextTurn;
+        if (session->send(std::move(blocks), toolsOverride).isEmpty()) {
+            err() << "Failed to dispatch request: " << session->lastError().message << "\n";
             exitCode = 1;
             QCoreApplication::quit();
         }
     };
 
+    auto dispatch = [&] {
+        if (fimMode) {
+            Templates::ContextData ctx;
+            ctx.prefix = turns.value(0);
+            if (parser.isSet(suffixOpt))
+                ctx.suffix = parser.value(suffixOpt);
+            if (session->sendCompletion(std::move(ctx)).isEmpty()) {
+                err() << "Failed to dispatch FIM request: " << session->lastError().message << "\n";
+                exitCode = 1;
+                QCoreApplication::quit();
+            }
+            return;
+        }
+        sendNextTurn();
+    };
+
     if (parser.isSet(mcpOpt)) {
         const QString mcpPath = parser.value(mcpOpt);
         QFile mcpFile(mcpPath);
diff --git a/docs/agent-roles.md b/docs/agent-roles.md
index c8195a5..494a423 100644
--- a/docs/agent-roles.md
+++ b/docs/agent-roles.md
@@ -168,7 +168,6 @@ This allows roles to augment rather than replace your base configuration.
 
 ## Related Documentation
 
-- [Project Rules](project-rules.md) - Project-specific AI behavior customization
 - [Chat Assistant Features](../README.md#chat-assistant) - Overview of chat functionality
 - [File Context](file-context.md) - Attaching files to chat context
 
diff --git a/docs/chat-summarization.md b/docs/chat-summarization.md
index a98d030..233eda2 100644
--- a/docs/chat-summarization.md
+++ b/docs/chat-summarization.md
@@ -112,4 +112,3 @@ No additional configuration is required.
 
 - [Agent Roles](agent-roles.md) - Switch between AI personas
 - [File Context](file-context.md) - Attach files to chat
-- [Project Rules](project-rules.md) - Customize AI behavior
diff --git a/docs/core-class-diagram.svg b/docs/core-class-diagram.svg
new file mode 100644
index 0000000..d5f1cfa
--- /dev/null
+++ b/docs/core-class-diagram.svg
@@ -0,0 +1 @@
+<svg id="mermaid-1781134331628" width="100%" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" class="classDiagram" style="max-width: 2319.703125px;" viewBox="0 0 2319.703125 1078" role="graphics-document document" aria-roledescription="class"><style>#mermaid-1781134331628{font-family:"trebuchet ms",verdana,arial,sans-serif;font-size:16px;fill:#333;}@keyframes edge-animation-frame{from{stroke-dashoffset:0;}}@keyframes dash{to{stroke-dashoffset:0;}}#mermaid-1781134331628 .edge-animation-slow{stroke-dasharray:9,5!important;stroke-dashoffset:900;animation:dash 50s linear infinite;stroke-linecap:round;}#mermaid-1781134331628 .edge-animation-fast{stroke-dasharray:9,5!important;stroke-dashoffset:900;animation:dash 20s linear infinite;stroke-linecap:round;}#mermaid-1781134331628 .error-icon{fill:#552222;}#mermaid-1781134331628 .error-text{fill:#552222;stroke:#552222;}#mermaid-1781134331628 .edge-thickness-normal{stroke-width:1px;}#mermaid-1781134331628 .edge-thickness-thick{stroke-width:3.5px;}#mermaid-1781134331628 .edge-pattern-solid{stroke-dasharray:0;}#mermaid-1781134331628 .edge-thickness-invisible{stroke-width:0;fill:none;}#mermaid-1781134331628 .edge-pattern-dashed{stroke-dasharray:3;}#mermaid-1781134331628 .edge-pattern-dotted{stroke-dasharray:2;}#mermaid-1781134331628 .marker{fill:#333333;stroke:#333333;}#mermaid-1781134331628 .marker.cross{stroke:#333333;}#mermaid-1781134331628 svg{font-family:"trebuchet ms",verdana,arial,sans-serif;font-size:16px;}#mermaid-1781134331628 p{margin:0;}#mermaid-1781134331628 g.classGroup text{fill:#9370DB;stroke:none;font-family:"trebuchet ms",verdana,arial,sans-serif;font-size:10px;}#mermaid-1781134331628 g.classGroup text .title{font-weight:bolder;}#mermaid-1781134331628 .cluster-label text{fill:#333;}#mermaid-1781134331628 .cluster-label span{color:#333;}#mermaid-1781134331628 .cluster-label span p{background-color:transparent;}#mermaid-1781134331628 .cluster 
rect{fill:#ffffde;stroke:#aaaa33;stroke-width:1px;}#mermaid-1781134331628 .cluster text{fill:#333;}#mermaid-1781134331628 .cluster span{color:#333;}#mermaid-1781134331628 .nodeLabel,#mermaid-1781134331628 .edgeLabel{color:#131300;}#mermaid-1781134331628 .edgeLabel .label rect{fill:#ECECFF;}#mermaid-1781134331628 .label text{fill:#131300;}#mermaid-1781134331628 .labelBkg{background:#ECECFF;}#mermaid-1781134331628 .edgeLabel .label span{background:#ECECFF;}#mermaid-1781134331628 .classTitle{font-weight:bolder;}#mermaid-1781134331628 .node rect,#mermaid-1781134331628 .node circle,#mermaid-1781134331628 .node ellipse,#mermaid-1781134331628 .node polygon,#mermaid-1781134331628 .node path{fill:#ECECFF;stroke:#9370DB;stroke-width:1px;}#mermaid-1781134331628 .divider{stroke:#9370DB;stroke-width:1;}#mermaid-1781134331628 g.clickable{cursor:pointer;}#mermaid-1781134331628 g.classGroup rect{fill:#ECECFF;stroke:#9370DB;}#mermaid-1781134331628 g.classGroup line{stroke:#9370DB;stroke-width:1;}#mermaid-1781134331628 .classLabel .box{stroke:none;stroke-width:0;fill:#ECECFF;opacity:0.5;}#mermaid-1781134331628 .classLabel .label{fill:#9370DB;font-size:10px;}#mermaid-1781134331628 .relation{stroke:#333333;stroke-width:1;fill:none;}#mermaid-1781134331628 .dashed-line{stroke-dasharray:3;}#mermaid-1781134331628 .dotted-line{stroke-dasharray:1 2;}#mermaid-1781134331628 #compositionStart,#mermaid-1781134331628 .composition{fill:#333333!important;stroke:#333333!important;stroke-width:1;}#mermaid-1781134331628 #compositionEnd,#mermaid-1781134331628 .composition{fill:#333333!important;stroke:#333333!important;stroke-width:1;}#mermaid-1781134331628 #dependencyStart,#mermaid-1781134331628 .dependency{fill:#333333!important;stroke:#333333!important;stroke-width:1;}#mermaid-1781134331628 #dependencyStart,#mermaid-1781134331628 .dependency{fill:#333333!important;stroke:#333333!important;stroke-width:1;}#mermaid-1781134331628 #extensionStart,#mermaid-1781134331628 
.extension{fill:transparent!important;stroke:#333333!important;stroke-width:1;}#mermaid-1781134331628 #extensionEnd,#mermaid-1781134331628 .extension{fill:transparent!important;stroke:#333333!important;stroke-width:1;}#mermaid-1781134331628 #aggregationStart,#mermaid-1781134331628 .aggregation{fill:transparent!important;stroke:#333333!important;stroke-width:1;}#mermaid-1781134331628 #aggregationEnd,#mermaid-1781134331628 .aggregation{fill:transparent!important;stroke:#333333!important;stroke-width:1;}#mermaid-1781134331628 #lollipopStart,#mermaid-1781134331628 .lollipop{fill:#ECECFF!important;stroke:#333333!important;stroke-width:1;}#mermaid-1781134331628 #lollipopEnd,#mermaid-1781134331628 .lollipop{fill:#ECECFF!important;stroke:#333333!important;stroke-width:1;}#mermaid-1781134331628 .edgeTerminals{font-size:11px;line-height:initial;}#mermaid-1781134331628 .classTitleText{text-anchor:middle;font-size:18px;fill:#333;}#mermaid-1781134331628 .label-icon{display:inline-block;height:1em;overflow:visible;vertical-align:-0.125em;}#mermaid-1781134331628 .node .label-icon path{fill:currentColor;stroke:revert;stroke-width:revert;}#mermaid-1781134331628 :root{--mermaid-font-family:"trebuchet ms",verdana,arial,sans-serif;}</style><g><defs><marker id="mermaid-1781134331628_class-aggregationStart" class="marker aggregation class" refX="18" refY="7" markerWidth="190" markerHeight="240" orient="auto"><path d="M 18,7 L9,13 L1,7 L9,1 Z"></path></marker></defs><defs><marker id="mermaid-1781134331628_class-aggregationEnd" class="marker aggregation class" refX="1" refY="7" markerWidth="20" markerHeight="28" orient="auto"><path d="M 18,7 L9,13 L1,7 L9,1 Z"></path></marker></defs><defs><marker id="mermaid-1781134331628_class-extensionStart" class="marker extension class" refX="18" refY="7" markerWidth="190" markerHeight="240" orient="auto"><path d="M 1,7 L18,13 V 1 Z"></path></marker></defs><defs><marker id="mermaid-1781134331628_class-extensionEnd" class="marker extension class" 
refX="1" refY="7" markerWidth="20" markerHeight="28" orient="auto"><path d="M 1,1 V 13 L18,7 Z"></path></marker></defs><defs><marker id="mermaid-1781134331628_class-compositionStart" class="marker composition class" refX="18" refY="7" markerWidth="190" markerHeight="240" orient="auto"><path d="M 18,7 L9,13 L1,7 L9,1 Z"></path></marker></defs><defs><marker id="mermaid-1781134331628_class-compositionEnd" class="marker composition class" refX="1" refY="7" markerWidth="20" markerHeight="28" orient="auto"><path d="M 18,7 L9,13 L1,7 L9,1 Z"></path></marker></defs><defs><marker id="mermaid-1781134331628_class-dependencyStart" class="marker dependency class" refX="6" refY="7" markerWidth="190" markerHeight="240" orient="auto"><path d="M 5,7 L9,13 L1,7 L9,1 Z"></path></marker></defs><defs><marker id="mermaid-1781134331628_class-dependencyEnd" class="marker dependency class" refX="13" refY="7" markerWidth="20" markerHeight="28" orient="auto"><path d="M 18,7 L9,13 L14,7 L9,1 Z"></path></marker></defs><defs><marker id="mermaid-1781134331628_class-lollipopStart" class="marker lollipop class" refX="13" refY="7" markerWidth="190" markerHeight="240" orient="auto"><circle fill="transparent" cx="7" cy="7" r="6"></circle></marker></defs><defs><marker id="mermaid-1781134331628_class-lollipopEnd" class="marker lollipop class" refX="1" refY="7" markerWidth="190" markerHeight="240" orient="auto"><circle fill="transparent" cx="7" cy="7" r="6"></circle></marker></defs><g class="root"><g class="clusters"></g><g class="edgePaths"><path d="M1161.956,133.388L1081.165,147.657C1000.373,161.926,838.79,190.463,757.999,210.898C677.207,231.333,677.207,243.667,677.207,249.833L677.207,256" id="id_SessionManager_Session_1" class=" edge-thickness-normal edge-pattern-solid relation" style=";;;" data-edge="true" data-et="edge" data-id="id_SessionManager_Session_1" 
data-points="W3sieCI6MTE3OC45NDMzNTkzNzUsInkiOjEzMC4zODgyNjI1MjI5MTQ5N30seyJ4Ijo2NzcuMjA3MDMxMjUsInkiOjIxOX0seyJ4Ijo2NzcuMjA3MDMxMjUsInkiOjI1Nn1d" marker-start="url(#mermaid-1781134331628_class-aggregationStart)"></path><path d="M1379.318,182L1379.318,188.167C1379.318,194.333,1379.318,206.667,1379.318,228C1379.318,249.333,1379.318,279.667,1379.318,294.833L1379.318,310" id="id_SessionManager_AgentFactory_2" class=" edge-thickness-normal edge-pattern-solid relation" style=";;;" data-edge="true" data-et="edge" data-id="id_SessionManager_AgentFactory_2" data-points="W3sieCI6MTM3OS4zMTgzNTkzNzUsInkiOjE4Mn0seyJ4IjoxMzc5LjMxODM1OTM3NSwieSI6MjE5fSx7IngiOjEzNzkuMzE4MzU5Mzc1LCJ5IjozMTZ9XQ==" marker-end="url(#mermaid-1781134331628_class-dependencyEnd)"></path><path d="M1579.693,162.877L1607.306,172.231C1634.919,181.585,1690.144,200.292,1717.757,226.813C1745.369,253.333,1745.369,287.667,1745.369,304.833L1745.369,322" id="id_SessionManager_ToolContributorRegistry_3" class=" edge-thickness-normal edge-pattern-solid relation" style=";;;" data-edge="true" data-et="edge" data-id="id_SessionManager_ToolContributorRegistry_3" data-points="W3sieCI6MTU3OS42OTMzNTkzNzUsInkiOjE2Mi44NzcxOTQyOTI5NzA3OH0seyJ4IjoxNzQ1LjM2OTE0MDYyNSwieSI6MjE5fSx7IngiOjE3NDUuMzY5MTQwNjI1LCJ5IjozMjh9XQ==" marker-end="url(#mermaid-1781134331628_class-dependencyEnd)"></path><path d="M488.526,472.276L436.449,491.397C384.371,510.517,280.217,548.759,228.14,574.046C176.063,599.333,176.063,611.667,176.063,617.833L176.063,624" id="id_Session_ConversationHistory_4" class=" edge-thickness-normal edge-pattern-solid relation" style=";;;" data-edge="true" data-et="edge" data-id="id_Session_ConversationHistory_4" data-points="W3sieCI6NTA0LjcxODc1LCJ5Ijo0NjYuMzMwNzE5NTI0ODM3NjZ9LHsieCI6MTc2LjA2MjUsInkiOjU4N30seyJ4IjoxNzYuMDYyNSwieSI6NjI0fV0=" marker-start="url(#mermaid-1781134331628_class-compositionStart)"></path><path 
d="M557.99,563.859L555.132,567.716C552.274,571.573,546.557,579.286,543.698,591.31C540.84,603.333,540.84,619.667,540.84,627.833L540.84,636" id="id_Session_SystemPromptBuilder_5" class=" edge-thickness-normal edge-pattern-solid relation" style=";;;" data-edge="true" data-et="edge" data-id="id_Session_SystemPromptBuilder_5" data-points="W3sieCI6NTY4LjI2MTUwNjQ1MzgwNDQsInkiOjU1MH0seyJ4Ijo1NDAuODM5ODQzNzUsInkiOjU4N30seyJ4Ijo1NDAuODM5ODQzNzUsInkiOjYzNn1d" marker-start="url(#mermaid-1781134331628_class-compositionStart)"></path><path d="M841.733,561.987L846.047,566.156C850.361,570.325,858.989,578.662,863.303,592.998C867.617,607.333,867.617,627.667,867.617,637.833L867.617,648" id="id_Session_ResponseRouter_6" class=" edge-thickness-normal edge-pattern-solid relation" style=";;;" data-edge="true" data-et="edge" data-id="id_Session_ResponseRouter_6" data-points="W3sieCI6ODI5LjMyODE4ODY4ODg1ODcsInkiOjU1MH0seyJ4Ijo4NjcuNjE3MTg3NSwieSI6NTg3fSx7IngiOjg2Ny42MTcxODc1LCJ5Ijo2NDh9XQ==" marker-start="url(#mermaid-1781134331628_class-compositionStart)"></path><path d="M849.695,489.187L882.321,505.489C914.947,521.791,980.199,554.396,1021.545,578.212C1062.892,602.028,1080.332,617.056,1089.052,624.57L1097.772,632.083" id="id_Session_Agent_7" class=" edge-thickness-normal edge-pattern-solid relation" style=";;;" data-edge="true" data-et="edge" data-id="id_Session_Agent_7" data-points="W3sieCI6ODQ5LjY5NTMxMjUsInkiOjQ4OS4xODY5NjE5ODcwNDc5fSx7IngiOjEwNDUuNDUxMTcxODc1LCJ5Ijo1ODd9LHsieCI6MTEwMi4zMTc4MjgwMTAxMTA0LCJ5Ijo2MzZ9XQ==" marker-end="url(#mermaid-1781134331628_class-dependencyEnd)"></path><path d="M176.063,839.25L176.063,840.542C176.063,841.833,176.063,844.417,176.063,854.375C176.063,864.333,176.063,881.667,176.063,890.333L176.063,899" id="id_ConversationHistory_Message_8" class=" edge-thickness-normal edge-pattern-solid relation" style=";;;" data-edge="true" data-et="edge" data-id="id_ConversationHistory_Message_8" 
data-points="W3sieCI6MTc2LjA2MjUsInkiOjgyMn0seyJ4IjoxNzYuMDYyNSwieSI6ODQ3fSx7IngiOjE3Ni4wNjI1LCJ5Ijo4OTl9XQ==" marker-start="url(#mermaid-1781134331628_class-aggregationStart)"></path><path d="M1180.654,826.854L1179.922,830.212C1179.19,833.57,1177.727,840.285,1177.903,847.809C1178.08,855.333,1179.896,863.667,1180.804,867.833L1181.712,872" id="id_Agent_Provider_9" class=" edge-thickness-normal edge-pattern-solid relation" style=";;;" data-edge="true" data-et="edge" data-id="id_Agent_Provider_9" data-points="W3sieCI6MTE4NC4zMjY1MzQxNDgxODU0LCJ5Ijo4MTB9LHsieCI6MTE3Ni4yNjM2NzE4NzUsInkiOjg0N30seyJ4IjoxMTgxLjcxMTU1MTc4OTMxNDYsInkiOjg3Mn1d" marker-start="url(#mermaid-1781134331628_class-compositionStart)"></path><path d="M1375.932,750.104L1478.798,766.254C1581.664,782.403,1787.395,814.701,1903.737,841.017C2020.079,867.333,2047.032,887.667,2060.508,897.833L2073.984,908" id="id_Agent_PromptTemplate_10" class=" edge-thickness-normal edge-pattern-solid relation" style=";;;" data-edge="true" data-et="edge" data-id="id_Agent_PromptTemplate_10" data-points="W3sieCI6MTM1OC44OTA2MjUsInkiOjc0Ny40MjkwNDE2MTQ4NDA4fSx7IngiOjE5OTMuMTI2OTUzMTI1LCJ5Ijo4NDd9LHsieCI6MjA3My45ODQwNDQyMjg4MzA1LCJ5Ijo5MDh9XQ==" marker-start="url(#mermaid-1781134331628_class-compositionStart)"></path><path d="M1307.016,490L1293.58,506.167C1280.145,522.333,1253.273,554.667,1238.617,578.014C1223.961,601.362,1221.52,615.723,1220.299,622.904L1219.079,630.085" id="id_AgentFactory_Agent_11" class=" edge-thickness-normal edge-pattern-dashed relation" style=";;;" data-edge="true" data-et="edge" data-id="id_AgentFactory_Agent_11" data-points="W3sieCI6MTMwNy4wMTU2NzgwNzQwNDksInkiOjQ5MH0seyJ4IjoxMjI2LjQwMjM0Mzc1LCJ5Ijo1ODd9LHsieCI6MTIxOC4wNzMzNTcwNzcyMDU5LCJ5Ijo2MzZ9XQ==" marker-end="url(#mermaid-1781134331628_class-dependencyEnd)"></path><path d="M1466.244,490L1482.396,506.167C1498.549,522.333,1530.855,554.667,1547.007,582C1563.16,609.333,1563.16,631.667,1563.16,642.833L1563.16,654" id="id_AgentFactory_AgentRouter_12" 
class=" edge-thickness-normal edge-pattern-solid relation" style=";;;" data-edge="true" data-et="edge" data-id="id_AgentFactory_AgentRouter_12" data-points="W3sieCI6MTQ2Ni4yNDM1NTY4MTA0NjIsInkiOjQ5MH0seyJ4IjoxNTYzLjE2MDE1NjI1LCJ5Ijo1ODd9LHsieCI6MTU2My4xNjAxNTYyNSwieSI6NjYwfV0=" marker-end="url(#mermaid-1781134331628_class-dependencyEnd)"></path><path d="M1859.73,783L1857.405,793.667C1855.081,804.333,1850.432,825.667,1767.934,851.807C1685.436,877.946,1525.089,908.893,1444.916,924.366L1364.742,939.839" id="id_GenericProvider_Provider_13" class=" edge-thickness-normal edge-pattern-solid relation" style=";;;" data-edge="true" data-et="edge" data-id="id_GenericProvider_Provider_13" data-points="W3sieCI6MTg1OS43Mjk3NzU3MDU2NDUxLCJ5Ijo3ODN9LHsieCI6MTg0NS43ODMyMDMxMjUsInkiOjg0N30seyJ4IjoxMzQ3LjgwNDY4NzUsInkiOjk0My4xMDgyMDgwMTM3NjQ2fV0=" marker-end="url(#mermaid-1781134331628_class-extensionEnd)"></path><path d="M2167.492,795L2167.492,803.667C2167.492,812.333,2167.492,829.667,2166.903,845.634C2166.315,861.602,2165.137,876.204,2164.548,883.505L2163.959,890.806" id="id_JsonPromptTemplate_PromptTemplate_14" class=" edge-thickness-normal edge-pattern-solid relation" style=";;;" data-edge="true" data-et="edge" data-id="id_JsonPromptTemplate_PromptTemplate_14" data-points="W3sieCI6MjE2Ny40OTIxODc1LCJ5Ijo3OTV9LHsieCI6MjE2Ny40OTIxODc1LCJ5Ijo4NDd9LHsieCI6MjE2Mi41NzI4MzI2NjEyOTAyLCJ5Ijo5MDh9XQ==" marker-end="url(#mermaid-1781134331628_class-extensionEnd)"></path></g><g class="edgeLabels"><g class="edgeLabel" transform="translate(677.20703125, 219)"><g class="label" data-id="id_SessionManager_Session_1" transform="translate(-19.125, -12)"><foreignObject width="38.25" height="24"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="edgeLabel "><p>pools</p></span></div></foreignObject></g></g><g class="edgeLabel" transform="translate(1379.318359375, 219)"><g 
class="label" data-id="id_SessionManager_AgentFactory_2" transform="translate(-33.3515625, -12)"><foreignObject width="66.703125" height="24"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="edgeLabel "><p>builds via</p></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" data-id="id_SessionManager_ToolContributorRegistry_3" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="edgeLabel "></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" data-id="id_Session_ConversationHistory_4" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="edgeLabel "></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" data-id="id_Session_SystemPromptBuilder_5" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="edgeLabel "></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" data-id="id_Session_ResponseRouter_6" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="edgeLabel "></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" data-id="id_Session_Agent_7" transform="translate(0, 0)"><foreignObject width="0" 
height="0"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="edgeLabel "></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" data-id="id_ConversationHistory_Message_8" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="edgeLabel "></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" data-id="id_Agent_Provider_9" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="edgeLabel "></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" data-id="id_Agent_PromptTemplate_10" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="edgeLabel "></span></div></foreignObject></g></g><g class="edgeLabel" transform="translate(1250.82512, 557.61269)"><g class="label" data-id="id_AgentFactory_Agent_11" transform="translate(-26.234375, -12)"><foreignObject width="52.46875" height="24"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="edgeLabel "><p>creates</p></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" data-id="id_AgentFactory_AgentRouter_12" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: 
table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="edgeLabel "></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" data-id="id_GenericProvider_Provider_13" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="edgeLabel "></span></div></foreignObject></g></g><g class="edgeLabel"><g class="label" data-id="id_JsonPromptTemplate_PromptTemplate_14" transform="translate(0, 0)"><foreignObject width="0" height="0"><div xmlns="http://www.w3.org/1999/xhtml" class="labelBkg" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="edgeLabel "></span></div></foreignObject></g></g></g><g class="nodes"><g class="node default " id="classId-SessionManager-0" transform="translate(1379.318359375, 95)"><g class="basic label-container"><path d="M-200.375 -87 L200.375 -87 L200.375 87 L-200.375 87" stroke="none" stroke-width="0" fill="#ECECFF" style=""></path><path d="M-200.375 -87 C-45.43682052789407 -87, 109.50135894421186 -87, 200.375 -87 M-200.375 -87 C-102.32061635802002 -87, -4.266232716040037 -87, 200.375 -87 M200.375 -87 C200.375 -48.974650315201124, 200.375 -10.949300630402249, 200.375 87 M200.375 -87 C200.375 -37.83271791585853, 200.375 11.334564168282938, 200.375 87 M200.375 87 C60.269589041485204 87, -79.83582191702959 87, -200.375 87 M200.375 87 C70.14190120672387 87, -60.091197586552255 87, -200.375 87 M-200.375 87 C-200.375 32.44356045516282, -200.375 -22.112879089674365, -200.375 -87 M-200.375 87 C-200.375 38.03012122821733, -200.375 -10.939757543565335, -200.375 -87" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="annotation-group text" transform="translate(0, -63)"></g><g class="label-group text" 
transform="translate(-63.578125, -63)"><g class="label" style="font-weight: bolder" transform="translate(0,-12)"><foreignObject width="127.15625" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 171px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>SessionManager</p></span></div></foreignObject></g></g><g class="members-group text" transform="translate(-188.375, -15)"></g><g class="methods-group text" transform="translate(-188.375, 15)"><g class="label" style="" transform="translate(0,-12)"><foreignObject width="225.453125" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 280px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+acquire(agentName) : Session</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,12)"><foreignObject width="126.734375" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 181px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+release(session)</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,36)"><foreignObject width="313.171875" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 368px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+toolContributors() : ToolContributorRegistry</p></span></div></foreignObject></g></g><g class="divider" style=""><path d="M-200.375 -39 C-87.39363639955589 -39, 25.587727200888224 -39, 200.375 -39 M-200.375 -39 C-88.30043568680222 -39, 23.774128626395566 -39, 200.375 -39" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="divider" style=""><path d="M-200.375 
-15 C-116.66407394532533 -15, -32.953147890650655 -15, 200.375 -15 M-200.375 -15 C-83.89657932738426 -15, 32.58184134523148 -15, 200.375 -15" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g></g><g class="node default " id="classId-Session-1" transform="translate(677.20703125, 403)"><g class="basic label-container"><path d="M-172.48828125 -147 L172.48828125 -147 L172.48828125 147 L-172.48828125 147" stroke="none" stroke-width="0" fill="#ECECFF" style=""></path><path d="M-172.48828125 -147 C-53.89519375075892 -147, 64.69789374848216 -147, 172.48828125 -147 M-172.48828125 -147 C-50.678610109216265 -147, 71.13106103156747 -147, 172.48828125 -147 M172.48828125 -147 C172.48828125 -78.40710099656272, 172.48828125 -9.814201993125437, 172.48828125 147 M172.48828125 -147 C172.48828125 -81.5175822321675, 172.48828125 -16.035164464334997, 172.48828125 147 M172.48828125 147 C80.62904212326238 147, -11.23019700347524 147, -172.48828125 147 M172.48828125 147 C71.14756257845875 147, -30.193156093082507 147, -172.48828125 147 M-172.48828125 147 C-172.48828125 66.19012353674322, -172.48828125 -14.61975292651357, -172.48828125 -147 M-172.48828125 147 C-172.48828125 50.837028035222176, -172.48828125 -45.32594392955565, -172.48828125 -147" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="annotation-group text" transform="translate(0, -123)"></g><g class="label-group text" transform="translate(-30.6796875, -123)"><g class="label" style="font-weight: bolder" transform="translate(0,-12)"><foreignObject width="61.359375" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 107px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>Session</p></span></div></foreignObject></g></g><g class="members-group text" transform="translate(-160.48828125, -75)"></g><g class="methods-group text" 
transform="translate(-160.48828125, -45)"><g class="label" style="" transform="translate(0,-12)"><foreignObject width="266.34375" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 321px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+send(blocks, toolPolicy) : RequestID</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,12)"><foreignObject width="66.25" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 121px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+cancel()</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,36)"><foreignObject width="224.515625" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 279px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+history() : ConversationHistory</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,60)"><foreignObject width="290.296875" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 345px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+systemPrompt() : SystemPromptBuilder</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,84)"><foreignObject width="172.109375" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 227px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+event(ResponseEvent)</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,108)"><foreignObject width="181.890625" height="24"><div 
xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 236px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+finished(id, stopReason)</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,132)"><foreignObject width="141.84375" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 196px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+failed(id, ErrorInfo)</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,156)"><foreignObject width="100.0625" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 155px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+cancelled(id)</p></span></div></foreignObject></g></g><g class="divider" style=""><path d="M-172.48828125 -99 C-71.38979706511005 -99, 29.70868711977991 -99, 172.48828125 -99 M-172.48828125 -99 C-39.06761034375879 -99, 94.35306056248243 -99, 172.48828125 -99" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="divider" style=""><path d="M-172.48828125 -75 C-35.55667419232137 -75, 101.37493286535727 -75, 172.48828125 -75 M-172.48828125 -75 C-98.09637814445809 -75, -23.704475038916172 -75, 172.48828125 -75" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g></g><g class="node default " id="classId-ConversationHistory-2" transform="translate(176.0625, 723)"><g class="basic label-container"><path d="M-168.0625 -99 L168.0625 -99 L168.0625 99 L-168.0625 99" stroke="none" stroke-width="0" fill="#ECECFF" style=""></path><path d="M-168.0625 -99 C-61.04890093622379 -99, 45.964698127552424 -99, 168.0625 -99 M-168.0625 -99 C-38.74915537895427 -99, 90.56418924209146 -99, 168.0625 
-99 M168.0625 -99 C168.0625 -20.10441156351625, 168.0625 58.7911768729675, 168.0625 99 M168.0625 -99 C168.0625 -58.23518818352074, 168.0625 -17.47037636704148, 168.0625 99 M168.0625 99 C56.42114954604111 99, -55.220200907917786 99, -168.0625 99 M168.0625 99 C77.67261095747779 99, -12.717278085044427 99, -168.0625 99 M-168.0625 99 C-168.0625 21.20010100336934, -168.0625 -56.59979799326132, -168.0625 -99 M-168.0625 99 C-168.0625 50.4900645276494, -168.0625 1.9801290552988036, -168.0625 -99" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="annotation-group text" transform="translate(0, -75)"></g><g class="label-group text" transform="translate(-78.6875, -75)"><g class="label" style="font-weight: bolder" transform="translate(0,-12)"><foreignObject width="157.375" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 194px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>ConversationHistory</p></span></div></foreignObject></g></g><g class="members-group text" transform="translate(-156.0625, -27)"></g><g class="methods-group text" transform="translate(-156.0625, 3)"><g class="label" style="" transform="translate(0,-12)"><foreignObject width="233.4375" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 321px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+messages() : vector&lt;Message&gt;</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,12)"><foreignObject width="191.625" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 246px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+lastAssistantText() : string</p></span></div></foreignObject></g><g class="label" 
style="" transform="translate(0,36)"><foreignObject width="138.3125" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 193px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+append(Message)</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,60)"><foreignObject width="182.75" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 270px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+reset(vector&lt;Message&gt;)</p></span></div></foreignObject></g></g><g class="divider" style=""><path d="M-168.0625 -51 C-49.16914634573331 -51, 69.72420730853338 -51, 168.0625 -51 M-168.0625 -51 C-82.23263507483125 -51, 3.5972298503374986 -51, 168.0625 -51" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="divider" style=""><path d="M-168.0625 -27 C-96.82994789783095 -27, -25.597395795661896 -27, 168.0625 -27 M-168.0625 -27 C-100.3671695770236 -27, -32.671839154047206 -27, 168.0625 -27" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g></g><g class="node default " id="classId-Message-3" transform="translate(176.0625, 971)"><g class="basic label-container"><path d="M-137.1796875 -72 L137.1796875 -72 L137.1796875 72 L-137.1796875 72" stroke="none" stroke-width="0" fill="#ECECFF" style=""></path><path d="M-137.1796875 -72 C-71.12499417749102 -72, -5.070300854982037 -72, 137.1796875 -72 M-137.1796875 -72 C-34.382130703081 -72, 68.415426093838 -72, 137.1796875 -72 M137.1796875 -72 C137.1796875 -21.780552403695523, 137.1796875 28.438895192608953, 137.1796875 72 M137.1796875 -72 C137.1796875 -39.5933974274533, 137.1796875 -7.186794854906594, 137.1796875 72 M137.1796875 72 C31.800564057821276 72, -73.57855938435745 72, -137.1796875 72 M137.1796875 72 
C39.39494387591962 72, -58.389799748160755 72, -137.1796875 72 M-137.1796875 72 C-137.1796875 24.078738606917412, -137.1796875 -23.842522786165176, -137.1796875 -72 M-137.1796875 72 C-137.1796875 17.457402984361153, -137.1796875 -37.085194031277695, -137.1796875 -72" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="annotation-group text" transform="translate(0, -48)"></g><g class="label-group text" transform="translate(-33.796875, -48)"><g class="label" style="font-weight: bolder" transform="translate(0,-12)"><foreignObject width="67.59375" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 115px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>Message</p></span></div></foreignObject></g></g><g class="members-group text" transform="translate(-125.1796875, 0)"><g class="label" style="" transform="translate(0,-12)"><foreignObject width="73.375" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 128px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+role Role</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,12)"><foreignObject width="216.5625" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 304px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+blocks vector&lt;ContentBlock&gt;</p></span></div></foreignObject></g></g><g class="methods-group text" transform="translate(-125.1796875, 72)"></g><g class="divider" style=""><path d="M-137.1796875 -24 C-46.589372277429405 -24, 44.00094294514119 -24, 137.1796875 -24 M-137.1796875 -24 C-80.56442659748046 -24, -23.94916569496091 -24, 137.1796875 -24" stroke="#9370DB" stroke-width="1.3" fill="none" 
stroke-dasharray="0 0" style=""></path></g><g class="divider" style=""><path d="M-137.1796875 48 C-35.68210292869746 48, 65.81548164260508 48, 137.1796875 48 M-137.1796875 48 C-79.60617489711535 48, -22.03266229423069 48, 137.1796875 48" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g></g><g class="node default " id="classId-SystemPromptBuilder-4" transform="translate(540.83984375, 723)"><g class="basic label-container"><path d="M-146.71484375 -87 L146.71484375 -87 L146.71484375 87 L-146.71484375 87" stroke="none" stroke-width="0" fill="#ECECFF" style=""></path><path d="M-146.71484375 -87 C-65.2608306829802 -87, 16.193182384039602 -87, 146.71484375 -87 M-146.71484375 -87 C-38.837183732205176 -87, 69.04047628558965 -87, 146.71484375 -87 M146.71484375 -87 C146.71484375 -26.658260245628504, 146.71484375 33.68347950874299, 146.71484375 87 M146.71484375 -87 C146.71484375 -42.61436408609196, 146.71484375 1.7712718278160793, 146.71484375 87 M146.71484375 87 C77.06345407232736 87, 7.4120643946547204 87, -146.71484375 87 M146.71484375 87 C85.96099970773915 87, 25.207155665478297 87, -146.71484375 87 M-146.71484375 87 C-146.71484375 35.62240501449928, -146.71484375 -15.755189971001442, -146.71484375 -87 M-146.71484375 87 C-146.71484375 20.00805647470571, -146.71484375 -46.98388705058858, -146.71484375 -87" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="annotation-group text" transform="translate(0, -63)"></g><g class="label-group text" transform="translate(-84.0234375, -63)"><g class="label" style="font-weight: bolder" transform="translate(0,-12)"><foreignObject width="168.046875" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 205px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>SystemPromptBuilder</p></span></div></foreignObject></g></g><g class="members-group 
text" transform="translate(-134.71484375, -15)"></g><g class="methods-group text" transform="translate(-134.71484375, 15)"><g class="label" style="" transform="translate(0,-12)"><foreignObject width="185.40625" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 240px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+setLayer(id, text, priority)</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,12)"><foreignObject width="125.828125" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 180px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+removeLayer(id)</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,36)"><foreignObject width="137.390625" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 192px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+compose() : string</p></span></div></foreignObject></g></g><g class="divider" style=""><path d="M-146.71484375 -39 C-37.44072893780452 -39, 71.83338587439096 -39, 146.71484375 -39 M-146.71484375 -39 C-36.77894767173629 -39, 73.15694840652742 -39, 146.71484375 -39" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="divider" style=""><path d="M-146.71484375 -15 C-71.15010625150619 -15, 4.414631246987625 -15, 146.71484375 -15 M-146.71484375 -15 C-53.33081304284559 -15, 40.05321766430882 -15, 146.71484375 -15" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g></g><g class="node default " id="classId-ResponseRouter-5" transform="translate(867.6171875, 723)"><g class="basic label-container"><path d="M-130.0625 -75 L130.0625 -75 L130.0625 75 
L-130.0625 75" stroke="none" stroke-width="0" fill="#ECECFF" style=""></path><path d="M-130.0625 -75 C-55.53204067613056 -75, 18.998418647738873 -75, 130.0625 -75 M-130.0625 -75 C-40.56485585368665 -75, 48.9327882926267 -75, 130.0625 -75 M130.0625 -75 C130.0625 -38.808892825398026, 130.0625 -2.6177856507960513, 130.0625 75 M130.0625 -75 C130.0625 -40.01255226134134, 130.0625 -5.025104522682682, 130.0625 75 M130.0625 75 C70.81852991710024 75, 11.574559834200471 75, -130.0625 75 M130.0625 75 C59.358266647594036 75, -11.345966704811929 75, -130.0625 75 M-130.0625 75 C-130.0625 35.89122454739592, -130.0625 -3.2175509052081566, -130.0625 -75 M-130.0625 75 C-130.0625 15.729652890204143, -130.0625 -43.540694219591714, -130.0625 -75" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="annotation-group text" transform="translate(0, -51)"></g><g class="label-group text" transform="translate(-64.015625, -51)"><g class="label" style="font-weight: bolder" transform="translate(0,-12)"><foreignObject width="128.03125" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 171px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>ResponseRouter</p></span></div></foreignObject></g></g><g class="members-group text" transform="translate(-118.0625, -3)"></g><g class="methods-group text" transform="translate(-118.0625, 27)"><g class="label" style="" transform="translate(0,-12)"><foreignObject width="140.96875" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 195px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+attach(BaseClient)</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,12)"><foreignObject width="172.109375" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: 
table-cell; white-space: nowrap; line-height: 1.5; max-width: 227px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+event(ResponseEvent)</p></span></div></foreignObject></g></g><g class="divider" style=""><path d="M-130.0625 -27 C-61.92847568456561 -27, 6.205548630868776 -27, 130.0625 -27 M-130.0625 -27 C-39.300674260273695 -27, 51.46115147945261 -27, 130.0625 -27" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="divider" style=""><path d="M-130.0625 -3 C-32.29696129998479 -3, 65.46857740003043 -3, 130.0625 -3 M-130.0625 -3 C-62.00172337202471 -3, 6.059053255950573 -3, 130.0625 -3" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g></g><g class="node default " id="classId-Agent-6" transform="translate(1203.28515625, 723)"><g class="basic label-container"><path d="M-155.60546875 -87 L155.60546875 -87 L155.60546875 87 L-155.60546875 87" stroke="none" stroke-width="0" fill="#ECECFF" style=""></path><path d="M-155.60546875 -87 C-77.1561884697115 -87, 1.2930918105770104 -87, 155.60546875 -87 M-155.60546875 -87 C-41.92815197154444 -87, 71.74916480691112 -87, 155.60546875 -87 M155.60546875 -87 C155.60546875 -35.28278307152351, 155.60546875 16.434433856952978, 155.60546875 87 M155.60546875 -87 C155.60546875 -41.667126232577715, 155.60546875 3.66574753484457, 155.60546875 87 M155.60546875 87 C90.36547037644308 87, 25.12547200288617 87, -155.60546875 87 M155.60546875 87 C35.24698533884694 87, -85.11149807230612 87, -155.60546875 87 M-155.60546875 87 C-155.60546875 31.742955913537955, -155.60546875 -23.51408817292409, -155.60546875 -87 M-155.60546875 87 C-155.60546875 19.895385162812417, -155.60546875 -47.209229674375166, -155.60546875 -87" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="annotation-group text" transform="translate(0, -63)"></g><g class="label-group text" 
transform="translate(-22.6640625, -63)"><g class="label" style="font-weight: bolder" transform="translate(0,-12)"><foreignObject width="45.328125" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 92px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>Agent</p></span></div></foreignObject></g></g><g class="members-group text" transform="translate(-143.60546875, -15)"></g><g class="methods-group text" transform="translate(-143.60546875, 15)"><g class="label" style="" transform="translate(0,-12)"><foreignObject width="163.21875" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 218px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+config() : AgentConfig</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,12)"><foreignObject width="150.71875" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 206px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+provider() : Provider</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,36)"><foreignObject width="264.546875" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 319px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+promptTemplate() : PromptTemplate</p></span></div></foreignObject></g></g><g class="divider" style=""><path d="M-155.60546875 -39 C-54.18493700168244 -39, 47.235594746635115 -39, 155.60546875 -39 M-155.60546875 -39 C-86.51912548512628 -39, -17.432782220252562 -39, 155.60546875 -39" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="divider" style=""><path 
d="M-155.60546875 -15 C-67.20827283448891 -15, 21.188923081022182 -15, 155.60546875 -15 M-155.60546875 -15 C-54.814789086675646 -15, 45.97589057664871 -15, 155.60546875 -15" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g></g><g class="node default " id="classId-AgentFactory-7" transform="translate(1379.318359375, 403)"><g class="basic label-container"><path d="M-170.078125 -87 L170.078125 -87 L170.078125 87 L-170.078125 87" stroke="none" stroke-width="0" fill="#ECECFF" style=""></path><path d="M-170.078125 -87 C-68.92427463139202 -87, 32.22957573721595 -87, 170.078125 -87 M-170.078125 -87 C-63.44504924071539 -87, 43.18802651856922 -87, 170.078125 -87 M170.078125 -87 C170.078125 -26.99947121660739, 170.078125 33.00105756678522, 170.078125 87 M170.078125 -87 C170.078125 -41.287153618775264, 170.078125 4.425692762449472, 170.078125 87 M170.078125 87 C38.48071400374633 87, -93.11669699250734 87, -170.078125 87 M170.078125 87 C98.68911588529032 87, 27.30010677058064 87, -170.078125 87 M-170.078125 87 C-170.078125 23.054309563154824, -170.078125 -40.89138087369035, -170.078125 -87 M-170.078125 87 C-170.078125 49.14786088201417, -170.078125 11.295721764028343, -170.078125 -87" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="annotation-group text" transform="translate(0, -63)"></g><g class="label-group text" transform="translate(-51.5625, -63)"><g class="label" style="font-weight: bolder" transform="translate(0,-12)"><foreignObject width="103.125" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 145px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>AgentFactory</p></span></div></foreignObject></g></g><g class="members-group text" transform="translate(-158.078125, -15)"></g><g class="methods-group text" transform="translate(-158.078125, 15)"><g class="label" style="" 
transform="translate(0,-12)"><foreignObject width="158.765625" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 214px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+create(name) : Agent</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,12)"><foreignObject width="264.59375" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 319px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+configByName(name) : AgentConfig</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,36)"><foreignObject width="215.359375" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 270px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+effectiveModel(name) : string</p></span></div></foreignObject></g></g><g class="divider" style=""><path d="M-170.078125 -39 C-39.493026311879674 -39, 91.09207237624065 -39, 170.078125 -39 M-170.078125 -39 C-69.16933807230225 -39, 31.739448855395494 -39, 170.078125 -39" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="divider" style=""><path d="M-170.078125 -15 C-52.83453465928794 -15, 64.40905568142412 -15, 170.078125 -15 M-170.078125 -15 C-70.4932505555859 -15, 29.091623888828195 -15, 170.078125 -15" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g></g><g class="node default " id="classId-AgentRouter-8" transform="translate(1563.16015625, 723)"><g class="basic label-container"><path d="M-154.26953125 -63 L154.26953125 -63 L154.26953125 63 L-154.26953125 63" stroke="none" stroke-width="0" fill="#ECECFF" style=""></path><path d="M-154.26953125 -63 C-37.75135585296725 -63, 
78.7668195440655 -63, 154.26953125 -63 M-154.26953125 -63 C-53.31706523468729 -63, 47.63540078062542 -63, 154.26953125 -63 M154.26953125 -63 C154.26953125 -32.125561668737376, 154.26953125 -1.251123337474759, 154.26953125 63 M154.26953125 -63 C154.26953125 -35.52697345613881, 154.26953125 -8.053946912277624, 154.26953125 63 M154.26953125 63 C31.181090113281286 63, -91.90735102343743 63, -154.26953125 63 M154.26953125 63 C91.51189843167987 63, 28.75426561335972 63, -154.26953125 63 M-154.26953125 63 C-154.26953125 33.81585709933033, -154.26953125 4.63171419866066, -154.26953125 -63 M-154.26953125 63 C-154.26953125 26.08876089857187, -154.26953125 -10.82247820285626, -154.26953125 -63" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="annotation-group text" transform="translate(0, -39)"></g><g class="label-group text" transform="translate(-48.4453125, -39)"><g class="label" style="font-weight: bolder" transform="translate(0,-12)"><foreignObject width="96.890625" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 141px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>AgentRouter</p></span></div></foreignObject></g></g><g class="members-group text" transform="translate(-142.26953125, 9)"></g><g class="methods-group text" transform="translate(-142.26953125, 39)"><g class="label" style="" transform="translate(0,-12)"><foreignObject width="236.09375" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 291px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+pickAgent(roster, fileCtx) : string</p></span></div></foreignObject></g></g><g class="divider" style=""><path d="M-154.26953125 -15 C-35.834557672896054 -15, 82.60041590420789 -15, 154.26953125 -15 M-154.26953125 -15 C-80.60657693979137 -15, 
-6.943622629582734 -15, 154.26953125 -15" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="divider" style=""><path d="M-154.26953125 9 C-91.0962922430119 9, -27.92305323602382 9, 154.26953125 9 M-154.26953125 9 C-86.93234598082343 9, -19.595160711646855 9, 154.26953125 9" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g></g><g class="node default " id="classId-Provider-9" transform="translate(1203.28515625, 971)"><g class="basic label-container"><path d="M-144.51953125 -99 L144.51953125 -99 L144.51953125 99 L-144.51953125 99" stroke="none" stroke-width="0" fill="#ECECFF" style=""></path><path d="M-144.51953125 -99 C-52.582264982504086 -99, 39.35500128499183 -99, 144.51953125 -99 M-144.51953125 -99 C-48.0296181933205 -99, 48.460294863358996 -99, 144.51953125 -99 M144.51953125 -99 C144.51953125 -42.463610636805825, 144.51953125 14.07277872638835, 144.51953125 99 M144.51953125 -99 C144.51953125 -31.557052377573555, 144.51953125 35.88589524485289, 144.51953125 99 M144.51953125 99 C67.05724216229882 99, -10.40504692540236 99, -144.51953125 99 M144.51953125 99 C70.2273881956757 99, -4.064754858648598 99, -144.51953125 99 M-144.51953125 99 C-144.51953125 34.85638170572575, -144.51953125 -29.287236588548495, -144.51953125 -99 M-144.51953125 99 C-144.51953125 22.714372625373812, -144.51953125 -53.571254749252375, -144.51953125 -99" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="annotation-group text" transform="translate(0, -75)"></g><g class="label-group text" transform="translate(-32.4609375, -75)"><g class="label" style="font-weight: bolder" transform="translate(0,-12)"><foreignObject width="64.921875" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 110px; text-align: center;"><span class="nodeLabel markdown-node-label" 
style=""><p>Provider</p></span></div></foreignObject></g></g><g class="members-group text" transform="translate(-132.51953125, -27)"></g><g class="methods-group text" transform="translate(-132.51953125, 3)"><g class="label" style="" transform="translate(0,-12)"><foreignObject width="195.203125" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 250px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+capabilities() : Capabilities</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,12)"><foreignObject width="217.453125" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 272px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+prepareRequest(request, ctx)</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,36)"><foreignObject width="232.578125" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 287px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+sendRequest(json) : RequestID</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,60)"><foreignObject width="201.4375" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 256px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+cancelRequest(RequestID)</p></span></div></foreignObject></g></g><g class="divider" style=""><path d="M-144.51953125 -51 C-65.94055997741698 -51, 12.638411295166037 -51, 144.51953125 -51 M-144.51953125 -51 C-66.37883123493651 -51, 11.761868780126974 -51, 144.51953125 -51" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g 
class="divider" style=""><path d="M-144.51953125 -27 C-73.75763948717531 -27, -2.995747724350622 -27, 144.51953125 -27 M-144.51953125 -27 C-48.40434157542103 -27, 47.71084809915794 -27, 144.51953125 -27" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g></g><g class="node default " id="classId-GenericProvider-10" transform="translate(1872.8046875, 723)"><g class="basic label-container"><path d="M-105.375 -60 L105.375 -60 L105.375 60 L-105.375 60" stroke="none" stroke-width="0" fill="#ECECFF" style=""></path><path d="M-105.375 -60 C-34.83671741086488 -60, 35.70156517827024 -60, 105.375 -60 M-105.375 -60 C-33.50195734666191 -60, 38.37108530667618 -60, 105.375 -60 M105.375 -60 C105.375 -27.94933260957815, 105.375 4.1013347808437, 105.375 60 M105.375 -60 C105.375 -16.615881616363012, 105.375 26.768236767273976, 105.375 60 M105.375 60 C60.035536882267685 60, 14.69607376453537 60, -105.375 60 M105.375 60 C46.96507275423945 60, -11.444854491521099 60, -105.375 60 M-105.375 60 C-105.375 29.398531382066523, -105.375 -1.2029372358669548, -105.375 -60 M-105.375 60 C-105.375 12.203470038415382, -105.375 -35.593059923169236, -105.375 -60" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="annotation-group text" transform="translate(0, -36)"></g><g class="label-group text" transform="translate(-62.25, -36)"><g class="label" style="font-weight: bolder" transform="translate(0,-12)"><foreignObject width="124.5" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 166px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>GenericProvider</p></span></div></foreignObject></g></g><g class="members-group text" transform="translate(-93.375, 12)"><g class="label" style="" transform="translate(0,-12)"><foreignObject width="124.5" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: 
table-cell; white-space: nowrap; line-height: 1.5; max-width: 180px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>-client BaseClient</p></span></div></foreignObject></g></g><g class="methods-group text" transform="translate(-93.375, 60)"></g><g class="divider" style=""><path d="M-105.375 -12 C-58.321638029355356 -12, -11.268276058710711 -12, 105.375 -12 M-105.375 -12 C-53.44521153051921 -12, -1.515423061038419 -12, 105.375 -12" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="divider" style=""><path d="M-105.375 36 C-52.09718040573348 36, 1.1806391885330356 36, 105.375 36 M-105.375 36 C-61.15208445363972 36, -16.929168907279447 36, 105.375 36" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g></g><g class="node default " id="classId-PromptTemplate-11" transform="translate(2157.4921875, 971)"><g class="basic label-container"><path d="M-154.2109375 -63 L154.2109375 -63 L154.2109375 63 L-154.2109375 63" stroke="none" stroke-width="0" fill="#ECECFF" style=""></path><path d="M-154.2109375 -63 C-54.435288516771465 -63, 45.34036046645707 -63, 154.2109375 -63 M-154.2109375 -63 C-83.07091999731395 -63, -11.930902494627901 -63, 154.2109375 -63 M154.2109375 -63 C154.2109375 -27.725321393809878, 154.2109375 7.549357212380244, 154.2109375 63 M154.2109375 -63 C154.2109375 -34.67206569347018, 154.2109375 -6.3441313869403615, 154.2109375 63 M154.2109375 63 C80.26057280689574 63, 6.310208113791475 63, -154.2109375 63 M154.2109375 63 C41.326010185887114 63, -71.55891712822577 63, -154.2109375 63 M-154.2109375 63 C-154.2109375 37.5597520775966, -154.2109375 12.119504155193198, -154.2109375 -63 M-154.2109375 63 C-154.2109375 31.996477011471377, -154.2109375 0.9929540229427545, -154.2109375 -63" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="annotation-group text" transform="translate(0, -39)"></g><g 
class="label-group text" transform="translate(-62.53125, -39)"><g class="label" style="font-weight: bolder" transform="translate(0,-12)"><foreignObject width="125.0625" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 167px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>PromptTemplate</p></span></div></foreignObject></g></g><g class="members-group text" transform="translate(-142.2109375, 9)"></g><g class="methods-group text" transform="translate(-142.2109375, 39)"><g class="label" style="" transform="translate(0,-12)"><foreignObject width="221.890625" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 276px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+buildFullRequest(request, ctx)</p></span></div></foreignObject></g></g><g class="divider" style=""><path d="M-154.2109375 -15 C-61.66593150925074 -15, 30.87907448149852 -15, 154.2109375 -15 M-154.2109375 -15 C-41.104341498759894 -15, 72.00225450248021 -15, 154.2109375 -15" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="divider" style=""><path d="M-154.2109375 9 C-70.28863190238967 9, 13.633673695220665 9, 154.2109375 9 M-154.2109375 9 C-60.961695348710606 9, 32.28754680257879 9, 154.2109375 9" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g></g><g class="node default " id="classId-JsonPromptTemplate-12" transform="translate(2167.4921875, 723)"><g class="basic label-container"><path d="M-139.3125 -72 L139.3125 -72 L139.3125 72 L-139.3125 72" stroke="none" stroke-width="0" fill="#ECECFF" style=""></path><path d="M-139.3125 -72 C-79.63642379855236 -72, -19.960347597104715 -72, 139.3125 -72 M-139.3125 -72 C-62.25825533795599 -72, 14.795989324088026 -72, 139.3125 -72 M139.3125 -72 C139.3125 
-23.416519207077783, 139.3125 25.166961585844433, 139.3125 72 M139.3125 -72 C139.3125 -32.279844102288685, 139.3125 7.44031179542263, 139.3125 72 M139.3125 72 C58.63380817944547 72, -22.044883641109067 72, -139.3125 72 M139.3125 72 C58.58237624303936 72, -22.147747513921274 72, -139.3125 72 M-139.3125 72 C-139.3125 26.097346500360928, -139.3125 -19.805306999278145, -139.3125 -72 M-139.3125 72 C-139.3125 21.2675547449628, -139.3125 -29.464890510074397, -139.3125 -72" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="annotation-group text" transform="translate(0, -48)"></g><g class="label-group text" transform="translate(-81.203125, -48)"><g class="label" style="font-weight: bolder" transform="translate(0,-12)"><foreignObject width="162.40625" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 200px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>JsonPromptTemplate</p></span></div></foreignObject></g></g><g class="members-group text" transform="translate(-127.3125, 0)"><g class="label" style="" transform="translate(0,-12)"><foreignObject width="173.421875" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 228px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>-bodySpec QJsonObject</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,12)"><foreignObject width="151.1875" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 206px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>-env InjaEnvironment</p></span></div></foreignObject></g></g><g class="methods-group text" transform="translate(-127.3125, 72)"></g><g class="divider" style=""><path d="M-139.3125 -24 
C-76.61662125663923 -24, -13.92074251327847 -24, 139.3125 -24 M-139.3125 -24 C-28.15729904933309 -24, 82.99790190133382 -24, 139.3125 -24" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="divider" style=""><path d="M-139.3125 48 C-64.6607668047461 48, 9.990966390507793 48, 139.3125 48 M-139.3125 48 C-51.878551293566034 48, 35.55539741286793 48, 139.3125 48" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g></g><g class="node default " id="classId-ToolContributorRegistry-13" transform="translate(1745.369140625, 403)"><g class="basic label-container"><path d="M-145.97265625 -75 L145.97265625 -75 L145.97265625 75 L-145.97265625 75" stroke="none" stroke-width="0" fill="#ECECFF" style=""></path><path d="M-145.97265625 -75 C-50.59752269154521 -75, 44.77761086690958 -75, 145.97265625 -75 M-145.97265625 -75 C-61.75440737688152 -75, 22.463841496236967 -75, 145.97265625 -75 M145.97265625 -75 C145.97265625 -16.041587080341003, 145.97265625 42.916825839317994, 145.97265625 75 M145.97265625 -75 C145.97265625 -28.279809726288228, 145.97265625 18.440380547423544, 145.97265625 75 M145.97265625 75 C32.23111472200644 75, -81.51042680598712 75, -145.97265625 75 M145.97265625 75 C74.82146292941066 75, 3.6702696088213145 75, -145.97265625 75 M-145.97265625 75 C-145.97265625 40.3267867624927, -145.97265625 5.653573524985404, -145.97265625 -75 M-145.97265625 75 C-145.97265625 25.880935569916367, -145.97265625 -23.238128860167265, -145.97265625 -75" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="annotation-group text" transform="translate(0, -51)"></g><g class="label-group text" transform="translate(-92.2890625, -51)"><g class="label" style="font-weight: bolder" transform="translate(0,-12)"><foreignObject width="184.578125" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; 
max-width: 217px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>ToolContributorRegistry</p></span></div></foreignObject></g></g><g class="members-group text" transform="translate(-133.97265625, -3)"></g><g class="methods-group text" transform="translate(-133.97265625, 27)"><g class="label" style="" transform="translate(0,-12)"><foreignObject width="165.84375" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 220px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+registerContributor(fn)</p></span></div></foreignObject></g><g class="label" style="" transform="translate(0,12)"><foreignObject width="175.65625" height="24"><div xmlns="http://www.w3.org/1999/xhtml" style="display: table-cell; white-space: nowrap; line-height: 1.5; max-width: 230px; text-align: center;"><span class="nodeLabel markdown-node-label" style=""><p>+applyTo(ToolsManager)</p></span></div></foreignObject></g></g><g class="divider" style=""><path d="M-145.97265625 -27 C-41.612184177423714 -27, 62.74828789515257 -27, 145.97265625 -27 M-145.97265625 -27 C-58.90269318861709 -27, 28.167269872765814 -27, 145.97265625 -27" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g><g class="divider" style=""><path d="M-145.97265625 -3 C-38.335521041776104 -3, 69.30161416644779 -3, 145.97265625 -3 M-145.97265625 -3 C-87.13119829911906 -3, -28.28974034823814 -3, 145.97265625 -3" stroke="#9370DB" stroke-width="1.3" fill="none" stroke-dasharray="0 0" style=""></path></g></g></g></g></g></svg>
\ No newline at end of file
diff --git a/docs/project-rules.md b/docs/project-rules.md
deleted file mode 100644
index b8bf9d3..0000000
--- a/docs/project-rules.md
+++ /dev/null
@@ -1,35 +0,0 @@
-# Project Rules Configuration
-
-QodeAssist supports project-specific rules to customize AI behavior for your codebase. Create a `.qodeassist/rules/` directory in your project root.
-
-## Quick Start
-
-```bash
-mkdir -p .qodeassist/rules/{common,completion,chat,quickrefactor}
-```
-
-## Directory Structure
-
-```
-.qodeassist/
-└── rules/
-    ├── common/           # Applied to all contexts
-    ├── completion/       # Code completion only
-    ├── chat/            # Chat assistant only
-    └── quickrefactor/   # Quick refactor only
-```
-
-All `.md` files in each directory are automatically loaded and added to the system prompt.
-
-## Example
-
-Create `.qodeassist/rules/common/general.md`:
-
-```markdown
-# Project Guidelines
-- Use snake_case for private members
-- Prefix interfaces with 'I'
-- Always document public APIs
-- Prefer Qt containers over STL
-```
-
diff --git a/docs/quick-refactoring.md b/docs/quick-refactoring.md
index 1357936..91e9cc4 100644
--- a/docs/quick-refactoring.md
+++ b/docs/quick-refactoring.md
@@ -206,7 +206,6 @@ The LLM receives:
 - **Cursor Position**: Marked with `<cursor>` tag
 - **Selection Markers**: `<selection_start>` and `<selection_end>` tags
 - **Your Instructions**: Built-in, custom, or typed
-- **Project Rules**: If configured (see [Project Rules](project-rules.md))
 
 ### Context Configuration
 
@@ -270,7 +269,6 @@ Fully local setup for offline or secure environments.
 
 ## Related Documentation
 
-- [Project Rules](project-rules.md) - Project-specific AI behavior customization
 - [File Context](file-context.md) - Attaching files to chat context
 - [Ignoring Files](ignoring-files.md) - Exclude files from AI context
 - [Provider Configuration](../README.md#configuration) - Setting up LLM providers
diff --git a/docs/target-architecture.md b/docs/target-architecture.md
new file mode 100644
index 0000000..9a142a0
--- /dev/null
+++ b/docs/target-architecture.md
@@ -0,0 +1,652 @@
+# QodeAssist — Target Architecture (v1.0)
+
+Status: design baseline, derived from the fixed use-case inventory below.
+Scope: the complete plugin, designed "from scratch" — what the architecture
+should be if nothing legacy constrained it. The current code (see
+`architecture.md`) already converges on this; §10 lists the remaining deltas.
+
+---
+
+## 1. Use-case inventory (requirements baseline)
+
+Every architectural decision below is justified by one of these. Features not
+on this list (Rules system, legacy provider/model/template pickers, Stack A)
+are intentionally out of scope.
+
+| # | Use case | What the user gets |
+|---|----------|--------------------|
+| U1 | **Code completion** | Inline FIM/instruct suggestions via LSP; auto + manual trigger, multiline, smart-context suppression, accept full / word-by-word |
+| U2 | **Chat assistant** | 4 placements (sidebar, bottom pane, editor tab, floating window); streaming text + thinking blocks + tool blocks + file-edit blocks (apply/undo); attachments, linked files, @-mentions, open-files sync; token counter; persisted history; one-click summarization; runtime agent + role pickers |
+| U3 | **Quick refactor** | Selection + instruction by hotkey; custom-instructions library; separate agent; optional tools; streamed result inserted into the editor |
+| U4 | **Tools** | read/create/edit file, search, find, list, build, diagnostics, terminal, todo, load_skill; per-tool enable |
+| U5 | **Skills** | discovery from `.qodeassist/skills`, `.claude/skills`, `~/.claude/skills`; auto-injection, explicit `/` picker, always-on |
+| U6 | **MCP** | server mode (expose plugin tools, HTTP/SSE + stdio bridge) and client hub (consume external tools in chat/refactor) |
+| U7 | **Providers** | 13 `client_api` types over one GenericProvider; secrets store; local-server autostart; model listing |
+| U8 | **Agents** | TOML profiles: `extends`, `[body]` table 1:1 with the wire request, Jinja partials, `match` rules, per-agent model override, per-pipeline rosters |
+| U9 | **Roles** | JSON roles composed into `system_prompt` via `{{ agent_role(id) }}` |
+| U10 | **Bench CLI** | headless agent testing on the same core stack, `.env` secrets |
+| U11 | **Configuration UI** | settings pages for everything above; per-project settings; updater + status widget |
+
+---
+
+## 2. Design principles
+
+1. **One stack.** Every LLM byte — completion, chat, compression, refactor,
+   bench — flows through the same `Session` pipeline. No parallel legacy path.
+2. **Hexagonal core.** The runtime (agents, sessions, providers, templates,
+   prompt rendering) has zero Qt Creator dependencies. The IDE and the bench
+   CLI are two hosts composing the same core; IDE-specific facts enter only
+   through ports (document reading, project scanning, secrets, tool hosting).
+3. **Configuration is declarative, code is mechanism.** What is sent (request
+   `[body]`, system prompt, endpoint, model) lives in TOML/JSON/Jinja and is
+   user-overridable; *how* it is sent (streaming, retries, tool loop, event
+   routing) lives in C++ and is identical for all providers.
+4. **Capability-driven behavior.** Providers and agents declare capabilities
+   (tools, thinking, images, model listing); features and UI adapt to the
+   declared set instead of switching on provider names.
+5. **Single source of truth for conversation state.** `ConversationHistory`
+   owns the messages; `ChatModel` and persistence are projections of it, never
+   independent copies.
+6. **Per-feature composition roots, no singletons.** Each feature constructs
+   and owns its dependencies (`new` + parent); shared services are passed
+   explicitly (constructor/setter, QML context properties for the chat).
+7. **Streaming-first event model.** One typed `ResponseEvent` stream is the
+   only contract between the core and every consumer. Deltas exist for live
+   UI (chat); one-shot pipelines (completion, refactor, bench) ignore them,
+   wait for `finished`, and read the final assistant message from history.
+8. **Fail at load, not mid-conversation.** Agent profiles are validated when
+   loaded (partials resolve, assembled body parses as JSON against a synthetic
+   context), so a config error never surfaces as a silent runtime drop.
+
+---
+
+## 3. Layered model
+
+```mermaid
+flowchart TB
+    subgraph HOSTS["Hosts — composition roots"]
+        PLUGIN["Qt Creator plugin<br/>qodeassist.cpp"]
+        BENCH["bench CLI"]
+    end
+
+    subgraph L5["L5 · Presentation"]
+        LSP["LSP bridge<br/>inline suggestions"]
+        QMLUI["ChatView QML<br/>4 placements"]
+        RW["Refactor widgets"]
+        SUI["Settings pages"]
+    end
+
+    subgraph L4["L4 · Features"]
+        FCOMP["CompletionFeature"]
+        FCHAT["ChatFeature"]
+        FREF["RefactorFeature"]
+    end
+
+    subgraph L3["L3 · Capabilities"]
+        CTX["ContextEngine<br/>ports + QtC adapters"]
+        TOOLS["ToolKit"]
+        SKILLS["SkillsEngine"]
+        MCPH["McpHub<br/>client + server"]
+    end
+
+    subgraph L2["L2 · Core runtime — IDE-independent"]
+        SM["SessionManager"]
+        SESS["Session"]
+        AGF["AgentFactory + AgentRouter"]
+        AG["Agent"]
+        PROV["GenericProvider"]
+        TPL["JsonPromptTemplate"]
+    end
+
+    subgraph L1["L1 · Declarative config"]
+        PCONF["providers/*.toml"]
+        ACONF["agents/*.toml + partials/*.jinja"]
+        ROST["rosters / pipelines"]
+        ROLES["agent_roles/*.json"]
+        SKCONF["skills/*.md"]
+        SEC["SecretsStore"]
+    end
+
+    subgraph L0["L0 · Wire — LLMQore"]
+        CLIENTS["*Client — SSE streaming"]
+        TOOLFW["Tool framework"]
+        MCPT["MCP transports"]
+    end
+
+    PLUGIN --> L4
+    PLUGIN --> SUI
+    BENCH --> SM
+    LSP --> FCOMP
+    QMLUI --> FCHAT
+    RW --> FREF
+    FCOMP --> SM
+    FCHAT --> SM
+    FREF --> SM
+    FCOMP --> CTX
+    FCHAT --> CTX
+    FREF --> CTX
+    FCHAT --> SKILLS
+    FCHAT --> TOOLS
+    FREF --> TOOLS
+    TOOLS --> TOOLFW
+    MCPH --> MCPT
+    SM --> SESS
+    SESS --> AG
+    AGF --> AG
+    AG --> PROV
+    AG --> TPL
+    AGF --> ACONF
+    AGF --> PCONF
+    AGF --> SEC
+    AGF --> ROST
+    TPL --> ROLES
+    PROV --> CLIENTS
+    SKILLS --> SKCONF
+```
+
+### Layer contracts
+
+| Layer | Contains | May depend on | Must NOT depend on |
+|-------|----------|---------------|--------------------|
+| **L0 Wire** | LLMQore clients (one per wire protocol: Claude, OpenAI Chat, OpenAI Responses, Google, Ollama, Mistral, llama.cpp), tool framework, MCP transports | Qt Network | anything above |
+| **L1 Config** | `ProviderInstance`, `AgentProfile` (+ loader/validator), rosters, roles, skills, secrets port | toml++, inja | Qt Creator, L2+ |
+| **L2 Core** | `Agent`, `AgentFactory`, `AgentRouter`, `Provider`/`GenericProvider`, `JsonPromptTemplate`, `Session`, `SessionManager`, `ConversationHistory`, `SystemPromptBuilder`, `ResponseRouter`, `ToolContributorRegistry` | L0, L1 | Qt Creator, QML, features |
+| **L3 Capabilities** | `ContextEngine` (ports + QtC adapters), `ToolKit` (built-in tools), `SkillsEngine`, `McpHub` | L0–L2, QtC APIs *only in adapters* | features, UI |
+| **L4 Features** | `CompletionFeature`, `ChatFeature` (send/stream, compression, token counting, file edits), `RefactorFeature` | L2, L3 | each other |
+| **L5 Presentation** | LSP bridge, ChatView QML, refactor widgets, settings pages | its feature | core internals |
+| **Hosts** | plugin shell, bench CLI | everything (composition only) | — |
+
+The hard rule that makes U10 (bench) and testability free: **L0–L2 build into
+targets with no Qt Creator linkage.** Bench links L0–L2 plus a thin CLI host;
+the plugin adds L3 adapters, L4, L5.
+
+---
+
+## 4. Core domain model
+
+Rendered copy: [core-class-diagram.svg](core-class-diagram.svg) (regenerate
+when the diagram below changes).
+
+```mermaid
+classDiagram
+    direction TB
+    class SessionManager {
+        +acquire(agentName) Session
+        +release(session)
+        +toolContributors() ToolContributorRegistry
+    }
+    class Session {
+        +send(blocks, toolPolicy)
+        +cancel()
+        +history() ConversationHistory
+        +systemPrompt() SystemPromptBuilder
+        +event(ResponseEvent)
+        +finished(id, stopReason)
+        +failed(id, ErrorInfo)
+        +cancelled(id)
+    }
+    class ConversationHistory {
+        +messages() vector~Message~
+        +lastAssistantText() string
+        +append(Message)
+        +reset(vector~Message~)
+    }
+    class Message {
+        +role Role
+        +blocks vector~ContentBlock~
+    }
+    class SystemPromptBuilder {
+        +setLayer(id, text, priority)
+        +removeLayer(id)
+        +compose() string
+    }
+    class ResponseRouter {
+        +attach(BaseClient)
+        +event(ResponseEvent)
+    }
+    class Agent {
+        +config() AgentConfig
+        +provider() Provider
+        +promptTemplate() PromptTemplate
+    }
+    class AgentFactory {
+        +create(name) Agent
+        +configByName(name) AgentConfig
+        +effectiveModel(name) string
+    }
+    class AgentRouter {
+        +pickAgent(roster, fileCtx) string
+    }
+    class Provider {
+        <<interface>>
+        +capabilities() Capabilities
+        +prepareRequest(request, ctx)
+        +sendRequest(json) RequestID
+        +cancelRequest(RequestID)
+    }
+    class GenericProvider {
+        -client BaseClient
+    }
+    class PromptTemplate {
+        <<interface>>
+        +buildFullRequest(request, ctx)
+    }
+    class JsonPromptTemplate {
+        -bodySpec QJsonObject
+        -env InjaEnvironment
+    }
+    class ToolContributorRegistry {
+        +registerContributor(fn)
+        +applyTo(ToolsManager)
+    }
+
+    SessionManager o-- Session : pools
+    SessionManager --> AgentFactory : builds via
+    SessionManager --> ToolContributorRegistry
+    Session *-- ConversationHistory
+    Session *-- SystemPromptBuilder
+    Session *-- ResponseRouter
+    Session --> Agent
+    ConversationHistory o-- Message
+    Agent *-- Provider
+    Agent *-- PromptTemplate
+    AgentFactory ..> Agent : creates
+    AgentFactory --> AgentRouter
+    GenericProvider --|> Provider
+    JsonPromptTemplate --|> PromptTemplate
+```
+
+Responsibilities, one line each:
+
+- **Agent** — immutable bundle of *what to call*: resolved config + provider +
+  compiled prompt template. No request state.
+- **Session** — one conversation's runtime: owns history, system-prompt
+  layers, response routing, the in-flight request, and the tool-execution
+  loop (tool_use → execute → tool_result → continue). `send(blocks)` is the
+  *only* entry point: every pipeline appends a user message and dispatches;
+  there are no per-pipeline send variants. What differs between completion,
+  chat, and refactor is the agent's template and the consumption mode (deltas
+  vs final message), never the Session API.
+- **SessionManager** — creates/pools sessions per agent; the single place
+  features go to get one. Pooling (not per-message construction) avoids the
+  "fresh agent + provider + secrets read per request" latency cost. It reuses
+  only the expensive parts (agent, provider, compiled template, secrets read):
+  `acquire` hands out a session with cleared history and system-prompt
+  layers, so one-shot pipelines never see a previous exchange.
+- **AgentRouter** — the *only* agent picker. Every pipeline (completion, chat,
+  compression, refactor) resolves its agent through
+  `pickAgent(roster, {file, project})`; no feature-local picker logic.
+- **GenericProvider** — one class for all 13 client APIs; varies only by
+  LLMQore client factory + metadata. Request *shape* belongs to the template,
+  never to the provider.
+- **JsonPromptTemplate** — compiles the agent's `[body]` table; renders
+  Jinja-bearing string values, splices raw JSON, drops empty keys; validated
+  at load time.
+- **SystemPromptBuilder** — ordered named layers (`agent.system`,
+  `chat.context`, `refactor`, `compression`); features mutate only their own
+  layer.
+- **ResponseRouter / ResponseEvent** — adapts LLMQore client signals into one
+  typed stream: `TextDelta`, `ThinkingDelta`, `ToolCallStart/End`,
+  `ToolResult`, `Usage`, `Error`, `MessageStop`.
+- **ToolContributorRegistry** — contributors (built-in ToolKit, SkillTool,
+  McpHub) register once; `SessionManager` applies them to every new session's
+  `ToolsManager`. This is how MCP tools reach chat *and* refactor (U6) without
+  feature code knowing about MCP.
+
+---
+
+## 5. Runtime flows
+
+### 5.1 Chat (U2) — the richest path
+
+```mermaid
+sequenceDiagram
+    autonumber
+    actor U as User
+    participant V as ChatView QML
+    participant F as ChatFeature
+    participant SM as SessionManager
+    participant S as Session
+    participant T as JsonPromptTemplate
+    participant P as GenericProvider
+    participant C as LLMQore Client
+    participant R as ResponseRouter
+
+    U->>V: message + attachments
+    V->>F: sendMessage(text, files, images)
+    F->>SM: acquire(activeAgent)
+    SM-->>F: Session (pooled)
+    F->>S: systemPrompt().setLayer("chat.context", project + skills + linked files)
+    F->>S: send(userBlocks, toolPolicy)
+    S->>T: buildFullRequest(history, system, ctx)
+    T-->>S: request JSON (body is 1:1 with the API)
+    S->>P: sendRequest(json)
+    P->>C: HTTP POST, SSE stream
+    loop streaming
+        C-->>R: chunk / thinking / tool_use / usage
+        R-->>S: ResponseEvent
+        S-->>F: event(ResponseEvent)
+        F-->>V: ChatModel projection update
+    end
+    opt tool call requested
+        S->>S: execute tool via ToolsManager
+        S->>P: continue with tool_result
+    end
+    C-->>R: finalized
+    R-->>S: MessageStop + Usage
+    S-->>F: finished()
+    F->>SM: release(session)
+```
+
+State ownership in chat: `Session.history()` is the truth. `ChatModel` is a
+QML projection built from history events (`messageAdded`, `messageUpdated`);
+`ChatSerializer`/`ChatHistoryStore` persist *history*, and restoring a chat
+seeds a new session's history — never the other way around. File-edit blocks,
+apply/undo, and the token counter are ChatFeature concerns layered on the
+event stream.
+
+### 5.2 Completion (U1)
+
+```
+LSP getCompletionsCycling
+  → CompletionFeature
+      agent   = AgentRouter.pickAgent(roster.codeCompletion, {file, project})
+      session = SessionManager.acquire(agent)
+      ctx     = ContextEngine: prefix/suffix + open-files context (policy from
+                CodeCompletionSettings — editor policy, not agent config)
+      session.send(blocks{completion context}, tools=off)
+  on finished → history().lastAssistantText()
+      → CodeHandler (output-mode post-processing) → LSP items
+```
+
+No special Session method: the completion context travels as the content of
+an ordinary user message (a structured block carrying prefix/suffix + file
+context), and the template context exposes it as `ctx.prefix` / `ctx.suffix`.
+FIM vs instruct is *agent config* (template + body), not feature code: a FIM
+agent's body renders `prefix`/`suffix` into FIM fields; an instruct agent's
+body renders the same exchange as a chat-shaped request. The feature is
+identical for both — and since completion has no incremental UI, it never
+touches the delta stream: it waits for `finished` and reads the last message.
+
+### 5.3 Quick refactor (U3)
+
+```
+Hotkey → RefactorFeature
+  agent   = AgentRouter.pickAgent(roster.quickRefactor, {file, project})
+  session = SessionManager.acquire(agent)
+  session.systemPrompt().setLayer("refactor", tagged selection + output rules)
+  session.send(blocks{instruction}, toolPolicy)
+  on finished → history().lastAssistantText()
+      → ResponseCleaner → RefactorResult → editor insert (accept/reject)
+```
+
+Same consumption mode as completion: the feature listens to
+`Session::finished`/`failed` only (events at most drive a progress spinner
+and cancel) and reads the result from history — it never connects to raw
+client signals. Tool calls during refactor run inside the session's tool
+loop; history's last assistant message is whatever the model produced after
+the final tool round.
+
+### 5.4 Compression (U2) and bench (U10)
+
+Compression is ChatFeature reusing the same path with
+`roster.chatCompression` and a `"compression"` system layer; the summary
+starts a new history. Bench is a host: CLI args + `.env` secrets → L1 + L2
+composition → `Session.send` → events printed to stdout. Anything bench can't
+do without the IDE is, by construction, an L3+ concern.
+
+---
+
+## 6. Configuration model
+
+```mermaid
+erDiagram
+    AGENT_PROFILE ||--o| AGENT_PROFILE : extends
+    AGENT_PROFILE }o--|| PROVIDER_INSTANCE : provider_instance
+    AGENT_PROFILE }o--o{ PARTIAL : includes
+    AGENT_PROFILE }o--o{ ROLE : agent_role
+    ROSTER }o--o{ AGENT_PROFILE : ranks
+    MODEL_OVERRIDE |o--|| AGENT_PROFILE : overrides_model
+    PROVIDER_INSTANCE }o--|| CLIENT_API : client_api
+    PROVIDER_INSTANCE }o--o| SECRET : api_key_ref
+    PROVIDER_INSTANCE ||--o| LAUNCH_CONFIG : autostarts
+
+    AGENT_PROFILE {
+        string name
+        bool abstract
+        string system_prompt "jinja, composes agent_role()"
+        json body "request body, 1:1 with API"
+        string endpoint "may contain MODEL placeholder"
+        string model "default; override wins"
+        bool enable_tools "capability hint"
+        bool enable_thinking "capability hint"
+        json match "file, path, project patterns"
+    }
+    PROVIDER_INSTANCE {
+        string name
+        string client_api
+        string url
+        string api_key_ref
+    }
+    ROLE {
+        string id
+        string systemPrompt
+    }
+    ROSTER {
+        string pipeline "completion, chat, compression, refactor"
+        list agents "ordered candidates"
+    }
+```
+
+Rules of the config layer (full spec: `agent-templates-design.md`):
+
+- `[body]` **is** the request body — field-by-field, deep-mergeable through
+  `extends`; Jinja-bearing strings render and splice as raw JSON, literals
+  pass through. No separate sampling/thinking merge machinery.
+- `include` resolves only against sandboxed partial roots (bundled `:/agents/partials/`,
+  then user `partials/`); a missing partial is a load-time error.
+- Two-level hierarchy: one abstract base per provider family, thin children.
+- Per-agent model override lives in `agent_models.json` and is applied by
+  `AgentFactory`; `${MODEL}` in `endpoint` covers URL-model providers.
+- Roles are JSON managed by the Roles settings UI; profiles pull them in with
+  `{{ agent_role("<id>") }}` — the only system-prompt edit point is the
+  profile.
+- Secrets never appear in TOML; `api_key_ref` resolves through the
+  `SecretsStore` port (QtC keychain in the plugin, `.env` in bench).
+
+---
+
+## 7. Capabilities layer
+
+**ContextEngine** replaces the monolithic ContextManager with three focused
+services behind IDE-agnostic ports:
+
+| Service | Port (L2-visible) | QtC adapter |
+|---------|-------------------|-------------|
+| `EditorContext` — current doc, selection, prefix/suffix | `IDocumentReader` | TextEditor API |
+| `ProjectContext` — root, file listing, ignore filtering (`.qodeassistignore`), open files, changes | `IProjectScanner` | ProjectExplorer API |
+| `TokenEstimator` — input estimates, calibrated by server usage | — (pure) | — |
+
+**ToolKit** registers the built-in tools (U4) with the
+`ToolContributorRegistry`; each tool declares a permission class (read /
+write / execute) so per-tool enablement (settings) and confirmation policy
+(terminal commands) live in one place.
+
+**SkillsEngine** (U5): discovery + watching of the three skill roots; exposes
+`catalogText()` (names + descriptions for the system prompt),
+`alwaysOnBodies()`, and the `load_skill` tool; the `/` picker injects a
+skill's body into a single message.
+
+**McpHub** (U6): client side connects configured servers and contributes
+their tools through the same registry (tools reach every session uniformly);
+server side exposes ToolKit over HTTP/SSE + stdio bridge.
+
+---
+
+## 8. Cross-cutting policies
+
+Architecture is as much the rules as the boxes. These policies bind every
+layer and are part of the contract:
+
+### 8.1 Threading
+
+The core runs on the GUI thread; concurrency is the Qt event loop plus async
+network I/O — no shared-state threading anywhere in L1–L4. Work that can
+block (project scans, token estimation over large trees) hides behind L3
+ports; an adapter may use worker threads internally but delivers results as
+queued signals. Core types are therefore deliberately not thread-safe.
+
+### 8.2 Request lifecycle
+
+A session has at most one in-flight request; `send()` while in flight cancels
+the previous request first. Every request terminates in exactly one of three
+states — `finished(stopReason)`, `failed(error)`, `cancelled()` — and
+cancellation is *not* an error: no consumer should have to string-match a
+message to tell a cancellation from a failure.
+
+### 8.3 Errors
+
+Runtime errors are typed, not strings: `ErrorInfo { category, message,
+providerDetail }` with categories `Config | Auth | Network | Provider |
+Validation | Tool`. The category drives UI affordances (Auth → open provider
+settings, Network → offer retry); free text is for logs only. Load-time
+errors (principle 8) surface in the agents settings page, never as a failed
+send.
+
+### 8.4 Timeouts and retries
+
+Transfer timeouts are per-pipeline policy (completion short, chat/refactor
+from settings), applied by the feature — never baked into agent profiles. A
+streaming request is never silently retried after the first byte; automatic
+retry with capped backoff is allowed only for connection-phase failures.
+Anything beyond that is an explicit user action.
+
+### 8.5 Observability
+
+One `RequestID` correlates feature → session → provider → client → events →
+logs. Each layer logs under its own category (`qodeassist.session`,
+`qodeassist.provider`, `qodeassist.tools`, …); request bodies are logged only
+at debug level, and secrets are redacted unconditionally. `Usage` events are
+the single source feeding the token counter, `TokenEstimator` calibration,
+and the performance log.
+
+### 8.6 Config compatibility
+
+Agent profiles carry a `schema_version`; the loader migrates old user
+configs forward or rejects them with an actionable message — silent
+reinterpretation is forbidden. Bundled profiles are read-only resources that
+user profiles shadow by name. Persisted chat history is versioned the same
+way.
+
+### 8.7 Security
+
+Secrets exist only behind the `SecretsStore` port; they never reach TOML,
+logs, or persisted chats. Tool permission classes (read / write / execute)
+centralize the confirmation policy. The MCP server is opt-in and binds
+loopback by default; skill and partial roots are sandboxed — nothing resolves
+outside its declared directory.
+
+### 8.8 Testing
+
+The test pyramid follows the layers:
+
+| Layer | Strategy |
+|-------|----------|
+| L1 | loader/validator unit tests; golden-file snapshots of every bundled profile's rendered body against a synthetic context — the same check as load-time validation, run in CI |
+| L2 | `Session` / `ResponseRouter` replay tests over recorded SSE fixtures per provider; fake `BaseClient`, no network |
+| L3 | contract tests against the ports; QtC adapters covered only by plugin integration |
+| E2E | bench (U10) against live providers — the same composition the plugin uses |
+
+Layering is enforced mechanically, not by review: each layer is its own
+CMake target, and the core targets do not link Qt Creator — a violating
+include fails the build.
+
+---
+
+## 9. Module / target layout
+
+```
+core/                       # no Qt Creator linkage — bench + tests link this
+  config/                   # L1: ProviderInstance, AgentProfile, loaders,
+                            #     validators, rosters, roles, secrets port
+  providers/                # L2: Provider, GenericProvider, ProviderFactory,
+                            #     ClaudeCacheControl
+  prompt/                   # L2: JsonPromptTemplate, ContextRenderer, partials
+  agents/                   # L2: Agent, AgentFactory, AgentRouter
+  session/                  # L2: Session, SessionManager, ConversationHistory,
+                            #     SystemPromptBuilder, ResponseRouter, events
+  skills/                   # L3 (IDE-free part): SkillsEngine, loaders
+ide/                        # Qt Creator adapters only
+  context/                  # EditorContext, ProjectContext adapters, ignore
+  tools/                    # built-in ToolKit (build, issues, editor edits…)
+  mcp/                      # McpHub managers
+features/
+  completion/               # LSP bridge + CompletionFeature + CodeHandler
+  chat/                     # ChatFeature: ClientInterface, ChatModel(projection),
+                            #   Compressor, TokenCounter, FileEditController,
+                            #   serializer/store
+  refactor/                 # RefactorFeature + custom instructions
+ui/
+  ChatView qml/, widgets/, settings pages
+hosts/
+  plugin/                   # qodeassist.cpp — composition root, actions, panes
+  bench/                    # CLI composition root
+tests/
+  config/                   # loader cases + golden rendered-body snapshots
+  session/                  # SSE replay fixtures per provider, fake client
+external/
+  llmqore/ inja/ tomlplusplus/
+```
+
+Dependency direction is strictly downward in the layer diagram of §3; `features/*`
+never include each other; `ui/*` talks only to its feature; `hosts/*` are the
+only places allowed to know about everything.
+
+---
+
+## 10. Deltas from the current working tree
+
+What "from scratch" changes relative to today's code — the migration
+checklist to call the architecture done:
+
+1. **Stack A physical teardown** — delete root `providers/*`,
+   `pluginllmcore/*`, `ConfigurationManager`, legacy provider/model/template
+   settings pages, and the Stack A registration + MCP loop in
+   `qodeassist.cpp`. Runtime already has no consumers.
+2. **Single history owner** — make `ChatModel` a projection of
+   `Session::history()` (subscribe to history signals) instead of a parallel
+   message store with seed-on-send; `ChatCompressor` reads history, not the
+   model.
+3. **Single send path** — delete `Session::sendCompletion(ContextData)`;
+   the completion context becomes user-message content sent through the one
+   `send()` (the completion handler already reads its result from history's
+   last message). Move `QuickRefactorHandler` off raw `BaseClient` signals
+   (`requestCompleted`/`requestFinalized`/`requestFailed`) onto
+   `Session::finished`/`failed` + `history().lastAssistantText()`.
+4. **Three-state request lifecycle** — add `cancelled` to `Session`; today
+   `cancel()` emits `failed(id, "Cancelled by user")` and consumers must
+   string-match to tell cancellation from failure (§8.2).
+5. **Typed errors** — replace `lastError` strings and the `failed(QString)`
+   payload with `ErrorInfo` categories (§8.3).
+6. **One agent picker** — fold `pickCompletionAgent` / `pickRefactorAgent`
+   remnants into `AgentRouter.pickAgent(roster, …)` exclusively; chat picker
+   filters to the `chatAssistant` roster.
+7. **MCP tools on session clients** — register MCP-contributed tools through
+   `ToolContributorRegistry` so chat/refactor sessions get them (today they
+   are registered only on dead Stack A providers).
+8. **Session pooling** — `SessionManager.acquire/release` with a small pool
+   per agent, replacing per-message agent + provider + secrets construction.
+9. **ContextManager split** — extract `EditorContext` / `ProjectContext` /
+   `TokenEstimator` behind ports; move QtC API use into `ide/context`.
+10. **`[body]` model completion** — finish `agent-templates-design.md`
+    (body-table rendering, sandboxed `include`, load-time validation, model
+    override + `${MODEL}`, `schema_version` gate), delete sampling/thinking
+    merge machinery.
+11. **Message type unification** — one `Message`/`ContentBlock` shape from
+    history to QML (roles, text, thinking, tool use/result, images); delete
+    the parallel `ChatModel::Message` struct.
+12. **Test scaffolding** — golden rendered-body snapshots + SSE replay
+    fixtures (§8.8); CI builds the core targets without Qt Creator so a
+    layering violation fails the build.
+13. **Stale docs cleanup** — `project-rules.md` described the removed Rules
+    system and has been deleted; remove any remaining references to it.
diff --git a/settings/AgentDetailPane.cpp b/settings/AgentDetailPane.cpp
index e3b5f1d..150c067 100644
--- a/settings/AgentDetailPane.cpp
+++ b/settings/AgentDetailPane.cpp
@@ -227,15 +227,15 @@ AgentDetailPane::AgentDetailPane(QWidget *parent)
         tr("Jinja2 template (via inja) rendered to the request body. "
            "Built-in context: ctx.prefix, ctx.suffix, ctx.history, "
            "ctx.system_prompt, agent.model."));
-    m_messageFormat = new QPlainTextEdit(this);
-    m_messageFormat->setReadOnly(true);
-    m_messageFormat->setFont(monospaceFont(11));
-    m_messageFormat->setMinimumHeight(140);
+    m_bodyView = new QPlainTextEdit(this);
+    m_bodyView->setReadOnly(true);
+    m_bodyView->setFont(monospaceFont(11));
+    m_bodyView->setMinimumHeight(140);
 
     templ->bodyLayout()->addWidget(templHint);
     auto *mfLabel = new QLabel(tr("body:"), this);
     templ->bodyLayout()->addWidget(mfLabel);
-    templ->bodyLayout()->addWidget(m_messageFormat);
+    templ->bodyLayout()->addWidget(m_bodyView);
 
     m_diagnostics = new SectionBox(tr("Load errors"), this);
     m_diagnosticsView = new QPlainTextEdit(this);
@@ -378,7 +378,7 @@ void AgentDetailPane::setAgent(const AgentConfig &cfg)
     m_filePatternsValue->setText(cfg.match.filePatterns.join(QStringLiteral(", ")));
     m_filePatternsValue->setPlaceholderText(tr("(matches every file)"));
 
-    m_messageFormat->setPlainText(
+    m_bodyView->setPlainText(
         cfg.body.isEmpty()
             ? tr("(inherited from parent / none)")
             : QString::fromUtf8(QJsonDocument(cfg.body).toJson(QJsonDocument::Indented)));
@@ -434,7 +434,7 @@ void AgentDetailPane::clear()
     m_effectiveUrl->clear();
     m_roleText->clear();
     m_filePatternsValue->clear();
-    m_messageFormat->clear();
+    m_bodyView->clear();
     m_rawToml->clear();
     m_openBtn->setEnabled(false);
     m_dupBtn->setEnabled(false);
diff --git a/settings/AgentDetailPane.hpp b/settings/AgentDetailPane.hpp
index dd2ece9..e4758b3 100644
--- a/settings/AgentDetailPane.hpp
+++ b/settings/AgentDetailPane.hpp
@@ -85,7 +85,7 @@ private:
     QLineEdit *m_filePatternsValue = nullptr;
 
     QPlainTextEdit *m_roleText = nullptr;
-    QPlainTextEdit *m_messageFormat = nullptr;
+    QPlainTextEdit *m_bodyView = nullptr;
 
     SectionBox *m_diagnostics = nullptr;
     QPlainTextEdit *m_diagnosticsView = nullptr;
diff --git a/sources/Session/CMakeLists.txt b/sources/Session/CMakeLists.txt
index e3751aa..5163e24 100644
--- a/sources/Session/CMakeLists.txt
+++ b/sources/Session/CMakeLists.txt
@@ -3,6 +3,7 @@ add_library(Session STATIC
     MessageSerializer.hpp MessageSerializer.cpp
     PluginBlocks.hpp
     LLMRequest.hpp
+    ErrorInfo.hpp
     ResponseEvent.hpp
     ConversationHistory.hpp ConversationHistory.cpp
     ResponseRouter.hpp ResponseRouter.cpp
diff --git a/sources/Session/ErrorInfo.hpp b/sources/Session/ErrorInfo.hpp
new file mode 100644
index 0000000..e55386d
--- /dev/null
+++ b/sources/Session/ErrorInfo.hpp
@@ -0,0 +1,61 @@
+// Copyright (C) 2024-2026 Petr Mironychev
+// SPDX-License-Identifier: GPL-3.0-or-later
+// Additional attribution terms under GPLv3 §7(b) apply — see LICENSE
+
+#pragma once
+
+#include <QMetaType>
+#include <QString>
+
+#include <utility>
+
+namespace QodeAssist {
+
+enum class ErrorCategory { // Coarse classification carried by ErrorInfo and error events.
+    Config,     // used by Session when the session itself is not valid
+    Auth,       // picked by categorizeProviderError for 401/403/API-key style messages
+    Network,    // picked by categorizeProviderError for timeout/connection/SSL style messages
+    Provider,   // default category and the fallback of categorizeProviderError
+    Validation, // used by Session for empty input, prompt render and request preparation failures
+    Tool,       // presumably tool-execution failures; not used in the code visible here (confirm)
+};
+
+struct ErrorInfo // Value type describing one failure: a category plus human-readable text.
+{
+    ErrorCategory category = ErrorCategory::Provider; // Provider unless stated otherwise
+    QString message;        // primary error text; an empty message means "no error" (see isEmpty)
+    QString providerDetail; // optional secondary text; left empty by makeError when not supplied
+
+    bool isEmpty() const noexcept { return message.isEmpty(); } // only `message` is inspected
+};
+
+[[nodiscard]] inline ErrorInfo makeError( // Convenience factory: builds an ErrorInfo in one call.
+    ErrorCategory category, QString message, QString providerDetail = QString())
+{
+    return ErrorInfo{category, std::move(message), std::move(providerDetail)}; // by-value args are moved in
+}
+
+[[nodiscard]] inline ErrorCategory categorizeProviderError(const QString &raw)
+{ // Heuristically maps a raw provider error string to a category using substring checks.
+    const QString text = raw.toLower(); // lower-cased once so every check is case-insensitive
+
+    const auto contains = [&text](const char *needle) {
+        return text.contains(QLatin1String(needle)); // needles must be lower-case Latin-1 literals
+    };
+
+    if (contains("401") || contains("403") || contains("unauthorized") // NOTE(review): bare digits match anywhere
+        || contains("forbidden") || contains("api key") || contains("apikey")
+        || contains("authentication") || contains("invalid token"))
+        return ErrorCategory::Auth; // auth markers are tested first, so they win over network ones
+
+    if (contains("timeout") || contains("timed out") || contains("connection")
+        || contains("could not resolve") || contains("unreachable")
+        || contains("network") || contains("ssl") || contains("refused"))
+        return ErrorCategory::Network;
+
+    return ErrorCategory::Provider; // nothing matched: treat as a generic provider error
+}
+
+} // namespace QodeAssist
+
+Q_DECLARE_METATYPE(QodeAssist::ErrorInfo)
diff --git a/sources/Session/ResponseEvent.hpp b/sources/Session/ResponseEvent.hpp
index cca9951..11c5cf3 100644
--- a/sources/Session/ResponseEvent.hpp
+++ b/sources/Session/ResponseEvent.hpp
@@ -9,6 +9,8 @@
 
 #include <variant>
 
+#include "ErrorInfo.hpp"
+
 namespace QodeAssist {
 
 namespace ResponseEvents {
@@ -45,6 +47,7 @@ struct ToolCallEnd
 struct ToolResult
 {
     QString toolUseId;
+    QString name;
     QString text;
     bool isError = false;
 };
@@ -53,11 +56,14 @@ struct Usage
 {
     int inputTokens = 0;
     int outputTokens = 0;
+    int cachedTokens = 0;
+    int reasoningTokens = 0;
 };
 
 struct Error
 {
     QString message;
+    ErrorCategory category = ErrorCategory::Provider;
 };
 
 struct MessageStop
@@ -128,21 +134,27 @@ public:
             Kind::ToolCallEnd, ResponseEvents::ToolCallEnd{std::move(id), std::move(finalArgs)}};
     }
 
-    static ResponseEvent toolResult(QString toolUseId, QString text, bool isError = false)
+    static ResponseEvent toolResult( // Builds a Kind::ToolResult event carrying the tool name too.
+        QString toolUseId, QString name, QString text, bool isError = false)
     {
         return {
             Kind::ToolResult,
-            ResponseEvents::ToolResult{std::move(toolUseId), std::move(text), isError}};
+            ResponseEvents::ToolResult{ // aggregate order follows the struct: id, name, text, isError
+                std::move(toolUseId), std::move(name), std::move(text), isError}};
     }
 
-    static ResponseEvent usage(int inputTokens, int outputTokens)
+    static ResponseEvent usage( // Builds a Kind::Usage event; the two extra counters default to 0.
+        int inputTokens, int outputTokens, int cachedTokens = 0, int reasoningTokens = 0)
     {
-        return {Kind::Usage, ResponseEvents::Usage{inputTokens, outputTokens}};
+        return {
+            Kind::Usage,
+            ResponseEvents::Usage{inputTokens, outputTokens, cachedTokens, reasoningTokens}};
     }
 
-    static ResponseEvent error(QString message)
+    static ResponseEvent error( // Builds a Kind::Error event; category defaults to Provider.
+        QString message, ErrorCategory category = ErrorCategory::Provider)
     {
-        return {Kind::Error, ResponseEvents::Error{std::move(message)}};
+        return {Kind::Error, ResponseEvents::Error{std::move(message), category}};
     }
 
 private:
diff --git a/sources/Session/ResponseRouter.cpp b/sources/Session/ResponseRouter.cpp
index a7639a1..0e8b703 100644
--- a/sources/Session/ResponseRouter.cpp
+++ b/sources/Session/ResponseRouter.cpp
@@ -79,7 +79,7 @@ void ResponseRouter::ensureAssistantOpen()
     if (m_assistantOpen && !m_inToolResults)
         return;
     if (m_history)
-        m_history->append(Message(Message::Role::Assistant));
+        m_history->append(Message(Message::Role::Assistant, m_activeId));
     emit event(ResponseEvent::messageStart());
     m_assistantOpen = true;
     m_inToolResults = false;
@@ -107,15 +107,19 @@ void ResponseRouter::onThinking(
 }
 
 void ResponseRouter::onToolStarted(
-    const LLMQore::RequestID &id, const QString &toolId, const QString &toolName)
+    const LLMQore::RequestID &id,
+    const QString &toolId,
+    const QString &toolName,
+    const QJsonObject &arguments) // stored in the history block and forwarded via toolCallEnd
 {
     if (id != m_activeId)
         return;
     ensureAssistantOpen();
     if (m_history)
         m_history->appendBlockToLast(
-            std::make_unique<LLMQore::ToolUseContent>(toolId, toolName));
+            std::make_unique<LLMQore::ToolUseContent>(toolId, toolName, arguments));
     emit event(ResponseEvent::toolCallStart(toolId, toolName));
+    emit event(ResponseEvent::toolCallEnd(toolId, arguments)); // start and end are emitted back to back
 }
 
 void ResponseRouter::onToolResultReady(
@@ -124,7 +128,6 @@ void ResponseRouter::onToolResultReady(
     const QString &toolName,
     const QString &result)
 {
-    Q_UNUSED(toolName);
     if (id != m_activeId)
         return;
 
@@ -141,7 +144,7 @@ void ResponseRouter::onToolResultReady(
 
     m_assistantOpen = false;
     m_inToolResults = true;
-    emit event(ResponseEvent::toolResult(toolId, result, /*isError=*/false));
+    emit event(ResponseEvent::toolResult(toolId, toolName, result, /*isError=*/false));
 }
 
 void ResponseRouter::onFinalized(
@@ -149,6 +152,13 @@ void ResponseRouter::onFinalized(
 {
     if (id != m_activeId)
         return;
+    if (info.usage) {
+        emit event(ResponseEvent::usage(
+            info.usage->promptTokens,
+            info.usage->completionTokens,
+            info.usage->cachedPromptTokens,
+            info.usage->reasoningTokens));
+    }
     emit event(ResponseEvent::messageStop(info.stopReason));
     endRequest();
 }
@@ -157,7 +167,7 @@ void ResponseRouter::onFailed(const LLMQore::RequestID &id, const QString &err)
 {
     if (id != m_activeId)
         return;
-    emit event(ResponseEvent::error(err));
+    emit event(ResponseEvent::error(err, categorizeProviderError(err)));
     endRequest();
 }
 
diff --git a/sources/Session/ResponseRouter.hpp b/sources/Session/ResponseRouter.hpp
index 1512ace..5a7ec3d 100644
--- a/sources/Session/ResponseRouter.hpp
+++ b/sources/Session/ResponseRouter.hpp
@@ -6,6 +6,7 @@
 
 #include <LLMQore/BaseClient.hpp>
 
+#include <QJsonObject>
 #include <QObject>
 #include <QPointer>
 #include <QString>
@@ -41,7 +42,10 @@ private slots:
     void onThinking(
         const LLMQore::RequestID &id, const QString &thinking, const QString &signature);
     void onToolStarted(
-        const LLMQore::RequestID &id, const QString &toolId, const QString &toolName);
+        const LLMQore::RequestID &id,
+        const QString &toolId,
+        const QString &toolName,
+        const QJsonObject &arguments);
     void onToolResultReady(
         const LLMQore::RequestID &id,
         const QString &toolId,
diff --git a/sources/Session/Session.cpp b/sources/Session/Session.cpp
index 23df74b..03c72f7 100644
--- a/sources/Session/Session.cpp
+++ b/sources/Session/Session.cpp
@@ -36,15 +36,9 @@ QString roleToLegacyString(Message::Role role)
     return QStringLiteral("user");
 }
 
-} // namespace
+[[maybe_unused]] const int kErrorInfoMetaTypeId = qRegisterMetaType<QodeAssist::ErrorInfo>();
 
-Session::Session(QObject *parent)
-    : QObject(parent)
-    , m_history(new ConversationHistory(this))
-    , m_systemPrompt(new SystemPromptBuilder(this))
-{
-    m_invalidReason = QStringLiteral("Session: no agent attached");
-}
+} // namespace
 
 Session::Session(Agent *agent, QObject *parent)
     : Session(agent, /*externalHistory=*/nullptr, parent)
@@ -86,7 +80,7 @@ Session::Session(Agent *agent, ConversationHistory *externalHistory, QObject *pa
 Session::~Session()
 {
     if (isInFlight())
-        cancel();
+        teardownInFlight();
 }
 
 bool Session::isValid() const noexcept
@@ -104,6 +98,11 @@ bool Session::isInFlight() const noexcept
     return !m_inFlight.isEmpty();
 }
 
+const ErrorInfo &Session::lastError() const noexcept // Read-only view of the most recent error.
+{
+    return m_lastError; // reference to a member that later sends overwrite; copy it to keep it
+}
+
 LLMQore::BaseClient *Session::client() const noexcept
 {
     auto *provider = m_agent ? m_agent->provider() : nullptr;
@@ -127,21 +126,6 @@ void Session::setContextBindings(Templates::ContextRenderer::Bindings bindings)
     m_contextBindings = std::move(bindings);
 }
 
-QString Session::renderAgentContext() const
-{
-    if (!m_agent)
-        return {};
-    const auto &cfg = m_agent->config();
-    if (cfg.systemPrompt.isEmpty())
-        return {};
-    QString err;
-    QString rendered
-        = Templates::ContextRenderer::render(cfg.systemPrompt, m_contextBindings, &err);
-    if (!err.isEmpty())
-        qWarning("[QodeAssist] agent.system render failed: %s", qUtf8Printable(err));
-    return rendered;
-}
-
 LLMQore::RequestID Session::sendText(const QString &text)
 {
     std::vector<std::unique_ptr<LLMQore::ContentBlock>> blocks;
@@ -152,22 +136,27 @@ LLMQore::RequestID Session::sendText(const QString &text)
 
 LLMQore::RequestID Session::sendCompletion(Templates::ContextData ctx)
 {
-    if (!isValid())
+    if (!isValid()) {
+        m_lastError = makeError(ErrorCategory::Config, invalidReason());
         return {};
+    }
     if (isInFlight())
         cancel();
-    return dispatchContext(std::move(ctx), /*tools=*/false, /*thinking=*/false);
+    return dispatchContext(std::move(ctx), /*tools=*/false);
 }
 
 LLMQore::RequestID Session::send(
     std::vector<std::unique_ptr<LLMQore::ContentBlock>> userBlocks,
-    std::optional<bool> toolsOverride,
-    std::optional<bool> thinkingOverride)
+    std::optional<bool> toolsOverride)
 {
-    if (!isValid() || userBlocks.empty())
+    if (!isValid()) {
+        m_lastError = makeError(ErrorCategory::Config, invalidReason());
         return {};
-    if (!m_history)
+    }
+    if (userBlocks.empty() || !m_history) {
+        m_lastError = makeError(ErrorCategory::Validation, QStringLiteral("Session: nothing to send"));
         return {};
+    }
 
     if (isInFlight())
         cancel();
@@ -177,10 +166,20 @@ LLMQore::RequestID Session::send(
         msg.appendBlock(std::move(b));
     m_history->append(std::move(msg));
 
-    return dispatch(toolsOverride, thinkingOverride);
+    return dispatch(toolsOverride);
 }
 
 void Session::cancel()
+{ // Aborts the in-flight request, if any, and announces it through cancelled().
+    if (m_inFlight.isEmpty())
+        return; // nothing in flight: no signal is emitted
+
+    const auto id = m_inFlight; // copied first; teardown is expected to clear m_inFlight (confirm)
+    teardownInFlight();
+    emit cancelled(id);
+}
+
+void Session::teardownInFlight()
 {
     if (m_inFlight.isEmpty())
         return;
@@ -191,41 +190,61 @@ void Session::cancel()
         m_router->endRequest();
     if (m_agent && m_agent->provider())
         m_agent->provider()->cancelRequest(id);
-    emit failed(id, QStringLiteral("Cancelled by user"));
 }
 
-LLMQore::RequestID Session::dispatch(
-    std::optional<bool> toolsOverride, std::optional<bool> thinkingOverride)
+LLMQore::RequestID Session::dispatch(std::optional<bool> toolsOverride) // empty id means failure
 {
     const auto &cfg = m_agent->config();
 
-    const QString renderedContext = renderAgentContext();
-    if (renderedContext.isEmpty())
+    if (cfg.systemPrompt.isEmpty()) { // no agent prompt configured: drop the layer
         m_systemPrompt->clearLayer(QStringLiteral("agent.system"));
-    else
-        m_systemPrompt->setLayer(QStringLiteral("agent.system"), renderedContext);
+    } else {
+        QString renderErr;
+        const QString renderedContext = Templates::ContextRenderer::render(
+            cfg.systemPrompt, m_contextBindings, &renderErr);
+        if (!renderErr.isEmpty()) { // a render failure aborts the send and is kept in m_lastError
+            m_lastError = makeError(
+                ErrorCategory::Validation,
+                QStringLiteral("Agent '%1' system_prompt render failed: %2")
+                    .arg(cfg.name, renderErr));
+            qWarning("[QodeAssist] %s", qUtf8Printable(m_lastError.message));
+            return {};
+        }
+        if (renderedContext.isEmpty()) // rendered to nothing: same as having no agent prompt
+            m_systemPrompt->clearLayer(QStringLiteral("agent.system"));
+        else
+            m_systemPrompt->setLayer(
+                QStringLiteral("agent.system"), renderedContext, SystemPromptBuilder::kAgentPriority);
+    }
 
     const bool tools = toolsOverride.value_or(cfg.enableTools);
-    const bool thinking = thinkingOverride.value_or(cfg.enableThinking);
-    return dispatchContext(toLegacyContext(), tools, thinking);
+    return dispatchContext(toLegacyContext(), tools); // the override, when set, beats cfg.enableTools
 }
 
-LLMQore::RequestID Session::dispatchContext(
-    Templates::ContextData ctx, bool tools, bool thinking)
+LLMQore::RequestID Session::dispatchContext(Templates::ContextData ctx, bool tools)
 {
+    m_lastError = {};
+
     auto *provider = m_agent->provider();
     auto *tmpl = m_agent->promptTemplate();
     const auto &cfg = m_agent->config();
 
     QJsonObject payload{{QStringLiteral("model"), cfg.model}};
-    if (!provider->prepareRequest(payload, tmpl, ctx, tools, thinking))
+    QString prepareErr;
+    if (!provider->prepareRequest(payload, tmpl, ctx, tools, &prepareErr)) {
+        m_lastError = makeError(ErrorCategory::Validation, prepareErr, prepareErr);
         return {};
+    }
 
     QString endpoint = cfg.endpoint;
     endpoint.replace(QStringLiteral("${MODEL}"), cfg.model);
     const auto id = provider->sendRequest(QUrl(provider->url()), payload, endpoint);
-    if (id.isEmpty())
+    if (id.isEmpty()) {
+        m_lastError = makeError(
+            ErrorCategory::Provider,
+            QStringLiteral("Provider '%1' failed to start the request").arg(provider->name()));
         return {};
+    }
 
     m_inFlight = id;
     if (m_router)
@@ -389,9 +408,11 @@ void Session::onRouterEvent(const ResponseEvent &ev)
     } else if (ev.kind() == ResponseEvent::Kind::Error) {
         const auto *err = ev.as<ResponseEvents::Error>();
         const QString msg = err ? err->message : QStringLiteral("unknown error");
+        const ErrorCategory category = err ? err->category : ErrorCategory::Provider;
+        m_lastError = makeError(category, msg, msg);
         const auto id = m_inFlight;
         m_inFlight.clear();
-        emit failed(id, msg);
+        emit failed(id, m_lastError);
     }
 }
 
diff --git a/sources/Session/Session.hpp b/sources/Session/Session.hpp
index 351d53d..9500d2b 100644
--- a/sources/Session/Session.hpp
+++ b/sources/Session/Session.hpp
@@ -20,6 +20,7 @@
 #include <vector>
 
 #include "ConversationHistory.hpp"
+#include "ErrorInfo.hpp"
 #include "ResponseEvent.hpp"
 
 namespace QodeAssist {
@@ -33,8 +34,6 @@ class Session : public QObject
     Q_OBJECT
     Q_DISABLE_COPY_MOVE(Session)
 public:
-    explicit Session(QObject *parent = nullptr);
-
     Session(
         Agent *agent,
         ConversationHistory *externalHistory = nullptr,
@@ -47,6 +46,7 @@ public:
     bool isValid() const noexcept;
     QString invalidReason() const;
     bool isInFlight() const noexcept;
+    const ErrorInfo &lastError() const noexcept;
 
     using ContentLoader = std::function<QString(const QString &storedPath)>;
     void setContentLoader(ContentLoader loader);
@@ -60,12 +60,9 @@ public:
 
     void setContextBindings(Templates::ContextRenderer::Bindings bindings);
 
-    QString renderAgentContext() const;
-
     LLMQore::RequestID send(
         std::vector<std::unique_ptr<LLMQore::ContentBlock>> userBlocks,
-        std::optional<bool> toolsOverride = std::nullopt,
-        std::optional<bool> thinkingOverride = std::nullopt);
+        std::optional<bool> toolsOverride = std::nullopt);
 
     LLMQore::RequestID sendText(const QString &text);
 
@@ -78,16 +75,16 @@ signals:
 
     void started(const LLMQore::RequestID &id);
     void finished(const LLMQore::RequestID &id, const QString &stopReason);
-    void failed(const LLMQore::RequestID &id, const QString &error);
+    void failed(const LLMQore::RequestID &id, const QodeAssist::ErrorInfo &error);
+    void cancelled(const LLMQore::RequestID &id);
 
 private slots:
     void onRouterEvent(const QodeAssist::ResponseEvent &ev);
 
 private:
-    LLMQore::RequestID dispatch(
-        std::optional<bool> toolsOverride = std::nullopt,
-        std::optional<bool> thinkingOverride = std::nullopt);
-    LLMQore::RequestID dispatchContext(Templates::ContextData ctx, bool tools, bool thinking);
+    LLMQore::RequestID dispatch(std::optional<bool> toolsOverride = std::nullopt);
+    LLMQore::RequestID dispatchContext(Templates::ContextData ctx, bool tools);
+    void teardownInFlight();
     Templates::ContextData toLegacyContext() const;
 
     Agent *m_agent = nullptr;                              // child if non-null
@@ -97,17 +94,16 @@ private:
 
     LLMQore::RequestID m_inFlight;
     QString m_invalidReason;
+    ErrorInfo m_lastError;
 
     Templates::ContextRenderer::Bindings m_contextBindings;
+    ContentLoader m_contentLoader;
 
 public:
     static Templates::ContextData buildLegacyContext(
         const std::vector<Message> &history,
         const QString &systemPrompt,
         const ContentLoader &loader = ContentLoader{});
-
-private:
-    ContentLoader m_contentLoader;
 };
 
 } // namespace QodeAssist
diff --git a/sources/Session/SessionManager.cpp b/sources/Session/SessionManager.cpp
index 5af412f..dd77222 100644
--- a/sources/Session/SessionManager.cpp
+++ b/sources/Session/SessionManager.cpp
@@ -10,10 +10,6 @@
 
 namespace QodeAssist {
 
-SessionManager::SessionManager(QObject *parent)
-    : QObject(parent)
-{}
-
 SessionManager::SessionManager(AgentFactory *agentFactory, QObject *parent)
     : QObject(parent)
     , m_agentFactory(agentFactory)
@@ -21,14 +17,6 @@ SessionManager::SessionManager(AgentFactory *agentFactory, QObject *parent)
 
 SessionManager::~SessionManager() = default;
 
-Session *SessionManager::createSession()
-{
-    auto *session = new Session(this);
-    m_sessions.append(session);
-    emit sessionCreated(session);
-    return session;
-}
-
 Session *SessionManager::createSession(const QString &agentName, QString *errorOut)
 {
     return createSession(agentName, /*externalHistory=*/nullptr, errorOut);
diff --git a/sources/Session/SessionManager.hpp b/sources/Session/SessionManager.hpp
index 61085a5..52b35df 100644
--- a/sources/Session/SessionManager.hpp
+++ b/sources/Session/SessionManager.hpp
@@ -22,14 +22,10 @@ class SessionManager : public QObject
     Q_OBJECT
     Q_DISABLE_COPY_MOVE(SessionManager)
 public:
-    explicit SessionManager(QObject *parent = nullptr);
-
-    SessionManager(AgentFactory *agentFactory, QObject *parent = nullptr);
+    explicit SessionManager(AgentFactory *agentFactory, QObject *parent = nullptr);
 
     ~SessionManager() override;
 
-    Session *createSession();
-
     Session *createSession(const QString &agentName, QString *errorOut = nullptr);
 
     Session *createSession(
diff --git a/sources/Session/SystemPromptBuilder.cpp b/sources/Session/SystemPromptBuilder.cpp
index 1573695..05fb023 100644
--- a/sources/Session/SystemPromptBuilder.cpp
+++ b/sources/Session/SystemPromptBuilder.cpp
@@ -4,30 +4,34 @@
 
 #include "SystemPromptBuilder.hpp"
 
+#include <algorithm>
+
 namespace QodeAssist {
 
 SystemPromptBuilder::SystemPromptBuilder(QObject *parent)
     : QObject(parent)
 {}
 
-void SystemPromptBuilder::setLayer(const QString &name, const QString &text)
+void SystemPromptBuilder::setLayer(const QString &name, const QString &text, int priority)
 {
-    for (auto &pair : m_layers) {
-        if (pair.first == name) {
-            if (pair.second == text) return;
-            pair.second = text;
+    for (auto &layer : m_layers) { // update in place when a layer with this name already exists
+        if (layer.name == name) {
+            if (layer.text == text && layer.priority == priority)
+                return; // nothing changed: layersChanged is not emitted
+            layer.text = text;
+            layer.priority = priority;
             emit layersChanged();
             return;
         }
     }
-    m_layers.append({name, text});
+    m_layers.append({name, text, priority}); // stored in insertion order; compose() orders by priority
     emit layersChanged();
 }
 
 void SystemPromptBuilder::clearLayer(const QString &name)
 {
     for (auto it = m_layers.begin(); it != m_layers.end(); ++it) {
-        if (it->first == name) {
+        if (it->name == name) {
             m_layers.erase(it);
             emit layersChanged();
             return;
@@ -44,8 +48,8 @@ void SystemPromptBuilder::clear()
 
 QString SystemPromptBuilder::layer(const QString &name) const
 {
-    for (const auto &pair : m_layers) {
-        if (pair.first == name) return pair.second;
+    for (const auto &l : m_layers) {
+        if (l.name == name) return l.text;
     }
     return {};
 }
@@ -54,17 +58,22 @@ QStringList SystemPromptBuilder::layerNames() const
 {
     QStringList out;
     out.reserve(m_layers.size());
-    for (const auto &pair : m_layers) out.append(pair.first);
+    for (const auto &l : m_layers) out.append(l.name);
     return out;
 }
 
 QString SystemPromptBuilder::compose(const QString &separator) const
 {
+    QVector<Layer> ordered = m_layers; // sort a copy so the stored insertion order is untouched
+    std::stable_sort( // stable: layers with equal priority keep their insertion order
+        ordered.begin(), ordered.end(),
+        [](const Layer &a, const Layer &b) { return a.priority < b.priority; }); // lower value first
+
     QStringList parts;
-    parts.reserve(m_layers.size());
-    for (const auto &pair : m_layers) {
-        if (!pair.second.isEmpty())
-            parts.append(pair.second);
+    parts.reserve(ordered.size());
+    for (const auto &l : ordered) {
+        if (!l.text.isEmpty()) // empty layers are skipped so no doubled separators appear
+            parts.append(l.text);
     }
     return parts.join(separator);
 }
diff --git a/sources/Session/SystemPromptBuilder.hpp b/sources/Session/SystemPromptBuilder.hpp
index 85c414a..e1c271d 100644
--- a/sources/Session/SystemPromptBuilder.hpp
+++ b/sources/Session/SystemPromptBuilder.hpp
@@ -15,9 +15,12 @@ class SystemPromptBuilder : public QObject
 {
     Q_OBJECT
 public:
+    static constexpr int kAgentPriority = 0;
+    static constexpr int kDefaultPriority = 100;
+
     explicit SystemPromptBuilder(QObject *parent = nullptr);
 
-    void setLayer(const QString &name, const QString &text);
+    void setLayer(const QString &name, const QString &text, int priority = kDefaultPriority);
     void clearLayer(const QString &name);
     void clear();
 
@@ -31,7 +34,14 @@ signals:
     void layersChanged();
 
 private:
-    QVector<QPair<QString, QString>> m_layers;
+    struct Layer
+    {
+        QString name;
+        QString text;
+        int priority = kDefaultPriority;
+    };
+
+    QVector<Layer> m_layers;
 };
 
 } // namespace QodeAssist
diff --git a/sources/agents/Agent.cpp b/sources/agents/Agent.cpp
index d9c4a21..ee86d54 100644
--- a/sources/agents/Agent.cpp
+++ b/sources/agents/Agent.cpp
@@ -55,6 +55,8 @@ Agent::Agent(AgentConfig config, Providers::Provider *providerOwned, QObject *pa
         return;
     }
     m_provider->setParent(this);
+    m_provider->setPromptCaching(
+        m_config.cachePrompt, m_config.cacheTtl == QLatin1StringView{"1h"});
 
     QString tmplErr;
     m_promptTemplate = JsonPromptTemplate::fromConfig(m_config, &tmplErr);
diff --git a/sources/agents/AgentConfig.hpp b/sources/agents/AgentConfig.hpp
index f1decb7..c986475 100644
--- a/sources/agents/AgentConfig.hpp
+++ b/sources/agents/AgentConfig.hpp
@@ -39,6 +39,8 @@ struct AgentConfig
 
     bool enableThinking = false;
     bool enableTools = false;
+    bool cachePrompt = false;
+    QString cacheTtl;
 
     QJsonObject body;
     QString extendsName;
diff --git a/sources/agents/AgentFactory.cpp b/sources/agents/AgentFactory.cpp
index 54ecfcd..1641270 100644
--- a/sources/agents/AgentFactory.cpp
+++ b/sources/agents/AgentFactory.cpp
@@ -194,7 +194,7 @@ Agent *AgentFactory::createFromFile(
 {
     QString parseErr;
     QStringList warnings;
-    auto cfgOpt = Agents::AgentLoader::parseFile(tomlPath, &parseErr, &warnings);
+    auto cfgOpt = Agents::AgentLoader::parseFile(tomlPath, agentQrcPrefix(), &parseErr, &warnings);
     if (!cfgOpt) {
         if (errorOut) *errorOut = parseErr;
         return nullptr;
diff --git a/sources/agents/AgentLoader.cpp b/sources/agents/AgentLoader.cpp
index 12e399d..f7066be 100644
--- a/sources/agents/AgentLoader.cpp
+++ b/sources/agents/AgentLoader.cpp
@@ -6,6 +6,7 @@
 
 #include <QDir>
 #include <QFile>
+#include <QFileInfo>
 #include <QHash>
 #include <QJsonArray>
 #include <QJsonDocument>
@@ -123,6 +124,8 @@ AgentConfig configFromMerged(const QJsonObject &obj)
     cfg.systemPrompt = obj.value("system_prompt").toString();
     cfg.enableThinking = obj.value("enable_thinking").toBool(false);
     cfg.enableTools    = obj.value("enable_tools").toBool(false);
+    cfg.cachePrompt    = obj.value("cache_prompt").toBool(false);
+    cfg.cacheTtl       = obj.value("cache_ttl").toString();
     cfg.tags        = stringArray(obj.value("tags"));
 
     const QJsonObject matchObj = obj.value("match").toObject();
@@ -147,6 +150,34 @@ struct RawEntry
 
 constexpr int kMaxExtendsDepth = 32;
 
+void scanDir( // Parses every *.toml directly inside `dir` into `raw`, keyed by the agent name.
+    const QString &dir,
+    bool isUserLayer,
+    QHash<QString, RawEntry> &raw,
+    QStringList &errors)
+{
+    if (dir.isEmpty()) return; // an empty path is skipped without reporting anything
+    QDir d(dir);
+    if (!d.exists()) return; // a missing directory is not treated as an error
+    const QStringList files = d.entryList({"*.toml"}, QDir::Files); // this directory only
+    for (const QString &fname : files) {
+        const QString fullPath = d.filePath(fname);
+        QString err;
+        auto objOpt = parseTomlFile(fullPath, &err);
+        if (!objOpt) { // unparsable file: record the error and keep scanning
+            errors.append(err);
+            continue;
+        }
+        const QString name = objOpt->value("name").toString();
+        if (name.isEmpty()) { // nameless agents cannot be keyed, so they are reported and skipped
+            errors.append(QStringLiteral("Agent at %1 has no 'name'").arg(fullPath));
+            continue;
+        }
+        const bool overrides = isUserLayer && raw.contains(name); // user entry shadowing an earlier one
+        raw.insert(name, {*objOpt, fullPath, overrides}); // QHash::insert replaces a same-name entry
+    }
+}
+
 QJsonObject resolveExtends(
     const QString &name,
     const QHash<QString, RawEntry> &raw,
@@ -190,12 +221,47 @@ QJsonObject resolveExtends(
 } // namespace
 
 std::optional<AgentConfig> AgentLoader::parseFile(
-    const QString &path, QString *error, QStringList * /*warnings*/)
+    const QString &path,
+    const QString &qrcPrefix,
+    QString *error,
+    QStringList *warnings) // optional sink for non-fatal problems found while scanning siblings
 {
     auto objOpt = parseTomlFile(path, error);
     if (!objOpt) return std::nullopt;
-    AgentConfig cfg = configFromMerged(*objOpt);
+
+    const QString name = objOpt->value("name").toString();
+    if (name.isEmpty()) {
+        if (error) *error = QStringLiteral("Agent at %1 has no 'name'").arg(path);
+        return std::nullopt;
+    }
+
+    QHash<QString, RawEntry> raw; // extends candidates: qrcPrefix agents plus the file's own directory
+    QStringList scanErrors;
+    scanDir(qrcPrefix, /*isUserLayer=*/false, raw, scanErrors);
+    scanDir(QFileInfo(path).absolutePath(), /*isUserLayer=*/true, raw, scanErrors);
+    raw.insert(name, {*objOpt, path, raw.contains(name)}); // the requested file wins for its own name
+    if (warnings) warnings->append(scanErrors); // report broken sibling files instead of dropping them
+    QSet<QString> visiting;
+    QStringList resolveErrors;
+    const QJsonObject merged = resolveExtends(name, raw, visiting, resolveErrors);
+    if (!resolveErrors.isEmpty() || merged.isEmpty()) { // any resolve error is fatal for a single file
+        if (error) {
+            *error = resolveErrors.isEmpty()
+                         ? QStringLiteral("Agent '%1' resolved to an empty config").arg(name)
+                         : resolveErrors.join(QStringLiteral("; "));
+        }
+        return std::nullopt;
+    }
+
+    AgentConfig cfg = configFromMerged(merged);
     cfg.sourcePath = path;
+    if (cfg.abstract) { // abstract agents are only valid as parents, never as a loadable agent
+        if (error) {
+            *error = QStringLiteral("Agent '%1' is abstract — extend it instead of "
+                                    "loading it directly").arg(name);
+        }
+        return std::nullopt;
+    }
     return cfg;
 }
 
@@ -204,31 +270,8 @@ AgentLoader::LoadResult AgentLoader::load(const QString &qrcPrefix, const QStrin
     LoadResult result;
     QHash<QString, RawEntry> raw;
 
-    auto scan = [&](const QString &dir, bool isUserLayer) {
-        if (dir.isEmpty()) return;
-        QDir d(dir);
-        if (!d.exists()) return;
-        const QStringList files = d.entryList({"*.toml"}, QDir::Files);
-        for (const QString &fname : files) {
-            const QString fullPath = d.filePath(fname);
-            QString err;
-            auto objOpt = parseTomlFile(fullPath, &err);
-            if (!objOpt) {
-                result.errors.append(err);
-                continue;
-            }
-            const QString name = objOpt->value("name").toString();
-            if (name.isEmpty()) {
-                result.errors.append(QStringLiteral("Agent at %1 has no 'name'").arg(fullPath));
-                continue;
-            }
-            const bool overrides = isUserLayer && raw.contains(name);
-            raw.insert(name, {*objOpt, fullPath, overrides});
-        }
-    };
-
-    scan(qrcPrefix, /*isUserLayer=*/false);
-    scan(userDir,   /*isUserLayer=*/true);
+    scanDir(qrcPrefix, /*isUserLayer=*/false, raw, result.errors);
+    scanDir(userDir,   /*isUserLayer=*/true,  raw, result.errors);
 
     for (auto it = raw.constBegin(); it != raw.constEnd(); ++it) {
         const QString &name = it.key();
diff --git a/sources/agents/AgentLoader.hpp b/sources/agents/AgentLoader.hpp
index 9f26eca..4f5a5fe 100644
--- a/sources/agents/AgentLoader.hpp
+++ b/sources/agents/AgentLoader.hpp
@@ -25,7 +25,10 @@ public:
     static LoadResult load(const QString &qrcPrefix, const QString &userDir);
 
     static std::optional<AgentConfig> parseFile(
-        const QString &path, QString *error, QStringList *warnings = nullptr);
+        const QString &path,
+        const QString &qrcPrefix,
+        QString *error,
+        QStringList *warnings = nullptr);
 };
 
 } // namespace QodeAssist::Agents
diff --git a/sources/agents/anthropic_base_chat.toml b/sources/agents/anthropic_base_chat.toml
index 5f7703b..6de5c7e 100644
--- a/sources/agents/anthropic_base_chat.toml
+++ b/sources/agents/anthropic_base_chat.toml
@@ -7,6 +7,7 @@ abstract    = true
 provider_instance = "Claude"
 endpoint          = "/v1/messages"
 enable_tools      = true
+cache_prompt      = true
 tags = ["chat", "claude", "anthropic", "cloud"]
 
 system_prompt = """{{ agent_role() }}"""
diff --git a/sources/agents/partials/anthropic_messages.jinja b/sources/agents/partials/anthropic_messages.jinja
index 7338c5a..2f7355b 100644
--- a/sources/agents/partials/anthropic_messages.jinja
+++ b/sources/agents/partials/anthropic_messages.jinja
@@ -3,8 +3,17 @@
   "role": {{ tojson(msg.role) }},
   "content": [
     {% for b in msg.content_blocks %}
-      {% if b.type == "image" %}{% include "partials/anthropic_image.jinja" %}
-      {% else %}{{ tojson(b) }},
+      {% if b.type == "text" %}
+      { "type": "text", "text": {{ tojson(b.text) }} },
+      {% else if b.type == "thinking" %}
+      { "type": "thinking", "thinking": {{ tojson(b.thinking) }}, "signature": {{ tojson(b.signature) }} },
+      {% else if b.type == "redacted_thinking" %}
+      { "type": "redacted_thinking", "data": {{ tojson(b.data) }} },
+      {% else if b.type == "tool_use" %}
+      { "type": "tool_use", "id": {{ tojson(b.id) }}, "name": {{ tojson(b.name) }}, "input": {{ tojson(b.input) }} },
+      {% else if b.type == "tool_result" %}
+      { "type": "tool_result", "tool_use_id": {{ tojson(b.tool_use_id) }}, "content": {{ tojson(b.content) }} },
+      {% else if b.type == "image" %}{% include "partials/anthropic_image.jinja" %}
       {% endif %}
     {% endfor %}
   ]
diff --git a/sources/agents/partials/ollama_messages.jinja b/sources/agents/partials/ollama_messages.jinja
index 9b91bd4..af561b7 100644
--- a/sources/agents/partials/ollama_messages.jinja
+++ b/sources/agents/partials/ollama_messages.jinja
@@ -2,15 +2,36 @@
 { "role": "system", "content": {{ tojson(ctx.system_prompt) }} },
 {% endif %}
 {% for msg in ctx.history %}
-{
-  "role": {{ tojson(msg.role) }},
-  "content": {{ tojson(msg.content) }}
-  {% if existsIn(msg, "images") %}
-  , "images": [
-    {% for img in msg.images %}
-    {{ tojson(img.data) }},
+  {% set tcalls = filter_by_type(msg.content_blocks, "tool_use") %}
+  {% set tresults = filter_by_type(msg.content_blocks, "tool_result") %}
+  {% if length(tresults) > 0 %}
+    {% for b in tresults %}
+    {
+      "role": "tool",
+      "content": {{ tojson(b.content) }}
+      {% if b.name != "" %}
+      , "tool_name": {{ tojson(b.name) }}
+      {% endif %}
+    },
     {% endfor %}
-  ]
+  {% else %}
+  {
+    "role": {{ tojson(msg.role) }},
+    "content": {{ tojson(msg.content) }}
+    {% if length(tcalls) > 0 %}
+    , "tool_calls": [
+      {% for b in tcalls %}
+      { "type": "function", "function": { "name": {{ tojson(b.name) }}, "arguments": {{ tojson(b.input) }} } },
+      {% endfor %}
+    ]
+    {% endif %}
+    {% if existsIn(msg, "images") %}
+    , "images": [
+      {% for img in msg.images %}
+      {{ tojson(img.data) }},
+      {% endfor %}
+    ]
+    {% endif %}
+  },
   {% endif %}
-},
 {% endfor %}
diff --git a/sources/agents/partials/openai_assistant.jinja b/sources/agents/partials/openai_assistant.jinja
index 2f6f0a4..b065c90 100644
--- a/sources/agents/partials/openai_assistant.jinja
+++ b/sources/agents/partials/openai_assistant.jinja
@@ -1,7 +1,7 @@
 {% set tcalls = filter_by_type(msg.content_blocks, "tool_use") %}
 {
   "role": "assistant",
-  "content": {{ tojson(msg.content) }}
+  "content": {% if msg.content != "" %}{{ tojson(msg.content) }}{% else %}null{% endif %}
   {% if length(tcalls) > 0 %}
   , "tool_calls": [
     {% for b in tcalls %}
diff --git a/sources/agents/partials/openai_image_content.jinja b/sources/agents/partials/openai_image_content.jinja
index f40e89a..5489a8f 100644
--- a/sources/agents/partials/openai_image_content.jinja
+++ b/sources/agents/partials/openai_image_content.jinja
@@ -1,11 +1,12 @@
 [
-  { "type": "text", "text": {{ tojson(msg.content) }} }
+  {% if msg.content != "" %}
+  { "type": "text", "text": {{ tojson(msg.content) }} },
+  {% endif %}
   {% for img in msg.images %}
-  ,
   {% if img.is_url %}
-  { "type": "image_url", "image_url": { "url": {{ tojson(img.data) }} } }
+  { "type": "image_url", "image_url": { "url": {{ tojson(img.data) }} } },
   {% else %}
-  { "type": "image_url", "image_url": { "url": "data:{{ img.media_type }};base64,{{ img.data }}" } }
+  { "type": "image_url", "image_url": { "url": "data:{{ img.media_type }};base64,{{ img.data }}" } },
   {% endif %}
   {% endfor %}
 ]
diff --git a/sources/providers/CMakeLists.txt b/sources/providers/CMakeLists.txt
index 1a0d40f..ea622b4 100644
--- a/sources/providers/CMakeLists.txt
+++ b/sources/providers/CMakeLists.txt
@@ -3,6 +3,7 @@ add_library(Providers STATIC
     Provider.hpp Provider.cpp
     ProviderFactory.hpp ProviderFactory.cpp
     GenericProvider.hpp GenericProvider.cpp
+    ClaudeCacheControl.hpp
 )
 
 target_link_libraries(Providers
diff --git a/sources/providers/ClaudeCacheControl.hpp b/sources/providers/ClaudeCacheControl.hpp
new file mode 100644
index 0000000..f116375
--- /dev/null
+++ b/sources/providers/ClaudeCacheControl.hpp
@@ -0,0 +1,129 @@
+// Copyright (C) 2024-2026 Petr Mironychev
+// SPDX-License-Identifier: GPL-3.0-or-later
+// Additional attribution terms under GPLv3 §7(b) apply — see LICENSE
+
+#pragma once
+
+#include <QJsonArray>
+#include <QJsonObject>
+#include <QJsonValue>
+#include <QString>
+
+// Helpers that add prompt-caching breakpoints ("cache_control" objects) to an
+// already built JSON request body with "system", "tools" and "messages" keys.
+namespace QodeAssist::Providers::ClaudeCacheControl {
+
+// Returns the breakpoint object: {"type": "ephemeral"}, plus "ttl": "1h"
+// when extendedTtl is set.
+inline QJsonObject buildBreakpoint(bool extendedTtl)
+{
+    QJsonObject cacheControl{{"type", "ephemeral"}};
+    if (extendedTtl)
+        cacheControl["ttl"] = "1h";
+    return cacheControl;
+}
+
+// True when `block` may carry a breakpoint. Anthropic's prompt-caching
+// documentation lists thinking blocks and empty text blocks as not
+// cacheable, so "thinking", "redacted_thinking" and empty "text" are excluded.
+inline bool canCarryBreakpoint(const QJsonValue &block)
+{
+    const QJsonObject obj = block.toObject();
+    const QString type = obj.value("type").toString();
+    if (type == QLatin1String("thinking") || type == QLatin1String("redacted_thinking"))
+        return false;
+    return !(type == QLatin1String("text") && obj.value("text").toString().isEmpty());
+}
+
+// Sets "cache_control" on the last element of `blocks` that may carry it.
+// Leaves `blocks` untouched when it is empty or has no eligible element.
+inline void markLastBlock(QJsonArray &blocks, const QJsonObject &cacheControl)
+{
+    for (auto i = blocks.size() - 1; i >= 0; --i) {
+        if (!canCarryBreakpoint(blocks.at(i)))
+            continue;
+        QJsonObject marked = blocks.at(i).toObject();
+        marked["cache_control"] = cacheControl;
+        blocks.replace(i, marked);
+        return;
+    }
+}
+
+// Adds the breakpoint to the "system" prompt. A non-empty string prompt is
+// converted into a single text block, since a plain string has no place for
+// "cache_control"; an array prompt gets its last eligible block marked.
+// A missing or empty prompt is left unchanged.
+inline void applyToSystem(QJsonObject &request, const QJsonObject &cacheControl)
+{
+    if (!request.contains("system"))
+        return;
+
+    const QJsonValue sys = request.value("system");
+    if (sys.isString()) {
+        const QString text = sys.toString();
+        if (!text.isEmpty()) {
+            request["system"] = QJsonArray{QJsonObject{
+                {"type", "text"}, {"text", text}, {"cache_control", cacheControl}}};
+        }
+    } else if (sys.isArray()) {
+        QJsonArray blocks = sys.toArray();
+        markLastBlock(blocks, cacheControl);
+        request["system"] = blocks;
+    }
+}
+
+// Adds the breakpoint to the last eligible entry of the "tools" array.
+// Does nothing when the request has no "tools" key.
+inline void applyToTools(QJsonObject &request, const QJsonObject &cacheControl)
+{
+    if (!request.contains("tools"))
+        return;
+    QJsonArray tools = request.value("tools").toArray();
+    markLastBlock(tools, cacheControl);
+    request["tools"] = tools;
+}
+
+// Adds the breakpoint to the second-to-last entry of "messages", i.e. the
+// message just before the newest one. Does nothing with fewer than two
+// messages. String content is converted into a single text block; empty
+// string content is left alone, matching applyToSystem, so that no empty
+// text block is produced. Content of any other JSON type is not modified.
+inline void applyToHistory(QJsonObject &request, const QJsonObject &cacheControl)
+{
+    if (!request.contains("messages"))
+        return;
+    QJsonArray messages = request.value("messages").toArray();
+    if (messages.size() < 2)
+        return;
+
+    const auto idx = messages.size() - 2;
+    QJsonObject msg = messages[idx].toObject();
+    const QJsonValue content = msg.value("content");
+    if (content.isString()) {
+        const QString text = content.toString();
+        if (text.isEmpty())
+            return;
+        msg["content"] = QJsonArray{QJsonObject{
+            {"type", "text"}, {"text", text}, {"cache_control", cacheControl}}};
+    } else if (content.isArray()) {
+        QJsonArray blocks = content.toArray();
+        markLastBlock(blocks, cacheControl);
+        msg["content"] = blocks;
+    } else {
+        return;
+    }
+    messages.replace(idx, msg);
+    request["messages"] = messages;
+}
+
+// Entry point: builds one breakpoint object and applies it to the system
+// prompt, the tool list and the message history of `request`, in that order.
+inline void apply(QJsonObject &request, bool extendedTtl)
+{
+    const QJsonObject cacheControl = buildBreakpoint(extendedTtl);
+    applyToSystem(request, cacheControl);
+    applyToTools(request, cacheControl);
+    applyToHistory(request, cacheControl);
+}
+
+} // namespace QodeAssist::Providers::ClaudeCacheControl
diff --git a/sources/providers/Provider.cpp b/sources/providers/Provider.cpp
index a83c785..99aafac 100644
--- a/sources/providers/Provider.cpp
+++ b/sources/providers/Provider.cpp
@@ -4,9 +4,11 @@
 
 #include "Provider.hpp"
 
+#include "ClaudeCacheControl.hpp"
 #include "PromptTemplate.hpp"
 
 #include <LLMQore/BaseClient.hpp>
+#include <LLMQore/ClaudeClient.hpp>
 #include <LLMQore/ToolsManager.hpp>
 
 #include <QJsonArray>
@@ -25,24 +27,27 @@ bool Provider::prepareRequest(
     PromptTemplate *prompt,
     const ContextData &context,
     bool isToolsEnabled,
-    bool isThinkingEnabled)
+    QString *errorOut)
 {
-    if (!prompt) {
-        LOG_MESSAGE(QString("Provider '%1': null template").arg(name()));
+    const auto fail = [errorOut](const QString &message) {
+        LOG_MESSAGE(message);
+        if (errorOut)
+            *errorOut = message;
         return false;
-    }
+    };
+
+    if (!prompt)
+        return fail(QString("Provider '%1': null template").arg(name()));
 
     if (!prompt->isSupportProvider(providerID())) {
-        LOG_MESSAGE(QString("Template '%1' doesn't support provider '%2'")
+        return fail(QString("Template '%1' doesn't support provider '%2'")
                         .arg(prompt->name(), name()));
-        return false;
     }
 
-    if (!prompt->buildFullRequest(request, context, isThinkingEnabled)) {
-        LOG_MESSAGE(
-            QString("Provider '%1': template '%2' failed to build request")
+    if (!prompt->buildFullRequest(request, context)) {
+        return fail(
+            QString("Provider '%1': template '%2' failed to build request (see log)")
                 .arg(name(), prompt->name()));
-        return false;
     }
 
     if (isToolsEnabled) {
@@ -51,9 +56,21 @@ bool Provider::prepareRequest(
             request["tools"] = toolsDefinitions;
         }
     }
+
+    if (m_promptCachingEnabled)
+        ClaudeCacheControl::apply(request, m_promptCachingExtendedTtl);
+
     return true;
 }
 
+void Provider::setPromptCaching(bool enabled, bool extendedTtl) // stores the flags read by prepareRequest
+{
+    m_promptCachingEnabled = enabled;
+    m_promptCachingExtendedTtl = enabled && extendedTtl; // extended TTL is kept only while caching is on
+    if (auto *claude = qobject_cast<::LLMQore::ClaudeClient *>(client())) // skipped for other client types
+        claude->setUseExtendedCacheTTL(m_promptCachingExtendedTtl); // pass the effective TTL flag on
+}
+
 RequestID Provider::sendRequest(
     const QUrl &url, const QJsonObject &payload, const QString &endpoint)
 {
diff --git a/sources/providers/Provider.hpp b/sources/providers/Provider.hpp
index 633035a..fbc3204 100644
--- a/sources/providers/Provider.hpp
+++ b/sources/providers/Provider.hpp
@@ -61,7 +61,7 @@ public:
         PromptTemplate *prompt,
         const ContextData &context,
         bool isToolsEnabled,
-        bool isThinkingEnabled);
+        QString *errorOut = nullptr);
     virtual QFuture<QList<QString>> getInstalledModels(const QString &url) = 0;
     virtual ProviderID providerID() const = 0;
     virtual ProviderCapabilities capabilities() const { return {}; }
@@ -73,9 +73,13 @@ public:
     void cancelRequest(const RequestID &requestId);
     ::LLMQore::ToolsManager *toolsManager() const;
 
+    void setPromptCaching(bool enabled, bool extendedTtl);
+
 private:
     QString m_url;
     QString m_apiKey;
+    bool m_promptCachingEnabled = false;
+    bool m_promptCachingExtendedTtl = false;
 };
 
 } // namespace QodeAssist::Providers
diff --git a/sources/templates/JsonPromptTemplate.cpp b/sources/templates/JsonPromptTemplate.cpp
index a854474..7d81f01 100644
--- a/sources/templates/JsonPromptTemplate.cpp
+++ b/sources/templates/JsonPromptTemplate.cpp
@@ -310,6 +310,15 @@ ContextData makeValidationContext()
     Message asst;
     asst.role = QStringLiteral("assistant");
     {
+        ContentBlockEntry th;
+        th.kind = ContentBlockEntry::Kind::Thinking;
+        th.thinking = QStringLiteral("reasoning");
+        th.signature = QStringLiteral("sig");
+        asst.blocks.append(th);
+        ContentBlockEntry rth;
+        rth.kind = ContentBlockEntry::Kind::RedactedThinking;
+        rth.signature = QStringLiteral("sig");
+        asst.blocks.append(rth);
         ContentBlockEntry t;
         t.kind = ContentBlockEntry::Kind::Text;
         t.text = QStringLiteral("hi");
@@ -516,9 +525,7 @@ void JsonPromptTemplate::prepareRequest(QJsonObject &request, const ContextData
 }
 
 bool JsonPromptTemplate::buildFullRequest(
-    QJsonObject &request,
-    const ContextData &context,
-    bool /*thinkingEnabled*/) const
+    QJsonObject &request, const ContextData &context) const
 {
     return mergeRenderedBody(request, renderBody(context));
 }
diff --git a/sources/templates/JsonPromptTemplate.hpp b/sources/templates/JsonPromptTemplate.hpp
index 1d45968..92ac4ce 100644
--- a/sources/templates/JsonPromptTemplate.hpp
+++ b/sources/templates/JsonPromptTemplate.hpp
@@ -47,9 +47,7 @@ public:
     void prepareRequest(QJsonObject &request, const ContextData &context) const override;
 
     [[nodiscard]] bool buildFullRequest(
-        QJsonObject &request,
-        const ContextData &context,
-        bool thinkingEnabled = false) const override;
+        QJsonObject &request, const ContextData &context) const override;
 
 private:
     JsonPromptTemplate() = default;
diff --git a/sources/templates/PromptTemplate.hpp b/sources/templates/PromptTemplate.hpp
index ad39ef0..581a9f5 100644
--- a/sources/templates/PromptTemplate.hpp
+++ b/sources/templates/PromptTemplate.hpp
@@ -40,9 +40,7 @@ public:
     virtual bool isSupportModel(const QString & /*modelName*/) const { return true; }
 
     [[nodiscard]] virtual bool buildFullRequest(
-        QJsonObject &request,
-        const ContextData &context,
-        bool /*thinkingEnabled*/ = false) const
+        QJsonObject &request, const ContextData &context) const
     {
         prepareRequest(request, context);
         return true;