From 5b296442b3d6250154457c0a5d1fd9c1a309cca0 Mon Sep 17 00:00:00 2001
From: danipiza <dpizarrogallego@gmail.com>
Date: Tue, 24 Feb 2026 08:59:06 +0100
Subject: [PATCH 1/6] [#24196] Added tests for 'custom_log_test_area.py'

Signed-off-by: danipiza <dpizarrogallego@gmail.com>
---
 tests/unittest/test_custom_log_text_area.py | 120 ++++++++++++++++++++
 1 file changed, 120 insertions(+)
 create mode 100644 tests/unittest/test_custom_log_text_area.py
diff --git a/tests/unittest/test_custom_log_text_area.py b/tests/unittest/test_custom_log_text_area.py
new file mode 100644
index 0000000..053dfe8
--- /dev/null
+++ b/tests/unittest/test_custom_log_text_area.py
@@ -0,0 +1,120 @@
+# Copyright 2026 Proyectos y Sistemas de Mantenimiento SL (eProsima).
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import os
+import sys
+import unittest
+from unittest.mock import patch
+
+from vulcanai.console.widget_custom_log_text_area import CustomLogTextArea
+
+# Make src-layout importable
+CURRENT_DIR = os.path.dirname(__file__)
+SRC_DIR = os.path.abspath(os.path.join(CURRENT_DIR, os.path.pardir, os.path.pardir, "src"))
+if SRC_DIR not in sys.path:
+    sys.path.insert(0, SRC_DIR)
+
+
+class TestCustomLogTextArea(unittest.TestCase):
+    def setUp(self):
+        self.widget = CustomLogTextArea()
+
+    def test_join_nested_tags(self):
+        text = "<red>first <bold>second</bold> third</red>"
+        expected = "<red>first </red><red bold>second</red bold><red> third</red>"
+        self.assertEqual(self.widget.join_nested_tags(text), expected)
+
+    def test_append_line_stores_plain_text_and_styles(self):
+        result = self.widget.append_line("prefix <red>error</red> suffix")
+        self.assertTrue(result)
+        self.assertEqual(self.widget.document.text, "prefix error suffix")
+        self.assertEqual(list(self.widget._lines_styles)[0], [(7, 12, "red")])
+        self.assertEqual(self.widget._highlights[0], [(7, 12, "red")])
+
+    def test_append_line_rejects_multiline_input(self):
+        self.assertFalse(self.widget.append_line("line 1\nline 2"))
+        self.assertEqual(self.widget.document.text, "")
+        self.assertEqual(self.widget._line_count, 0)
+        self.assertEqual(len(self.widget._lines_styles), 0)
+
+    def test_append_line_trims_max_lines_and_reindexes_highlights(self):
+        max_lines = self.widget.MAX_LINES
+        extra_lines = 5
+
+        for idx in range(max_lines + extra_lines):
+            if idx % 100 == 0:
+                self.widget.append_line(f"<red>line-{idx}</red>")
+            else:
+                self.widget.append_line(f"line-{idx}")
+
+        self.assertEqual(self.widget._line_count, max_lines)
+        self.assertEqual(len(self.widget.document.text.splitlines()), max_lines)
+        self.assertEqual(self.widget.document.get_line(0), f"line-{extra_lines}")
+        self.assertEqual(self.widget.document.get_line(max_lines - 1), f"line-{max_lines + extra_lines - 1}")
+
+        kept_colored_indexes = [i for i in range(max_lines + extra_lines) if i % 100 == 0 and i >= extra_lines]
+        expected_rows = [i - extra_lines for i in kept_colored_indexes]
+        self.assertEqual(sorted(self.widget._highlights.keys()), expected_rows)
+
+        for original_idx, row in zip(kept_colored_indexes, expected_rows):
+            self.assertEqual(self.widget._highlights[row], [(0, len(f"line-{original_idx}"), "red")])
+
+    def test_delete_last_row(self):
+        self.widget.append_line("first")
+        self.widget.append_line("second")
+
+        self.widget.delete_last_row()
+        self.assertEqual(self.widget.document.text, "first")
+        self.assertEqual(self.widget._line_count, 1)
+
+        self.widget.delete_last_row()
+        self.assertEqual(self.widget.document.text, "")
+        self.assertEqual(self.widget._line_count, 0)
+
+        self.widget.delete_last_row()
+        self.assertEqual(self.widget.document.text, "")
+        self.assertEqual(self.widget._line_count, 0)
+
+    def test_clear_console(self):
+        self.widget.append_line("<red>first</red>")
+        self.widget.append_line("second")
+
+        self.widget.clear_console()
+        self.assertEqual(self.widget.document.text, "")
+        self.assertEqual(self.widget._line_count, 0)
+        self.assertEqual(len(self.widget._lines_styles), 0)
+        self.assertEqual(dict(self.widget._highlights), {})
+
+    def test_action_copy_selection_no_selected_text(self):
+        notifications = []
+        self.widget.notify = notifications.append
+
+        with patch("vulcanai.console.widget_custom_log_text_area.pyperclip.copy") as clipboard_copy:
+            self.widget.action_copy_selection()
+
+        clipboard_copy.assert_not_called()
+        self.assertEqual(notifications, ["No text selected to copy!"])
+
+    def test_action_copy_selection_with_selected_text(self):
+        self.widget.append_line("copy this")
+        self.widget.select_all()
+
+        notifications = []
+        self.widget.notify = notifications.append
+
+        with patch("vulcanai.console.widget_custom_log_text_area.pyperclip.copy") as clipboard_copy:
+            self.widget.action_copy_selection()
+
+        clipboard_copy.assert_called_once_with("copy this")
+        self.assertEqual(notifications, ["Selected area copied to clipboard!"])

From 578f8d982a9678738d7417a71c85667d27a53e84 Mon Sep 17 00:00:00 2001
From: danipiza <dpizarrogallego@gmail.com>
Date: Tue, 24 Feb 2026 09:03:04 +0100
Subject: [PATCH 2/6] [#24196] Added textual tests - Terminal input

Signed-off-by: danipiza <dpizarrogallego@gmail.com>
---
 src/vulcanai/console/utils.py  |   15 +-
 tests/unittest/test_console.py | 1176 ++++++++++++++++++++++++++++++++
 2 files changed, 1188 insertions(+), 3 deletions(-)
 create mode 100644 tests/unittest/test_console.py

diff --git a/src/vulcanai/console/utils.py b/src/vulcanai/console/utils.py
index a6e72b7..cde39ce 100644
--- a/src/vulcanai/console/utils.py
+++ b/src/vulcanai/console/utils.py
@@ -38,9 +38,18 @@ def write(self, data: str):
             return
 
         if data.strip():
-            # Ensure update happens on the app thread
-            # self.app.call_from_thread(self.app.append_log_text, data)
-            self.app.call_from_thread(self.app.add_line, data)
+            # Try cross-thread UI update first; if already on app thread,
+            # Textual raises RuntimeError and we can write directly.
+            try:
+                self.app.call_from_thread(self.app.add_line, data)
+            except RuntimeError as e:
+                if "must run in a different thread" in str(e):
+                    try:
+                        self.app.add_line(data)
+                    except Exception:
+                        self.real_stream.write(data)
+                else:
+                    self.real_stream.write(data)
 
     def flush(self):
         self.real_stream.flush()
diff --git a/tests/unittest/test_console.py b/tests/unittest/test_console.py
new file mode 100644
index 0000000..5bd3dcc
--- /dev/null
+++ b/tests/unittest/test_console.py
@@ -0,0 +1,1176 @@
+import importlib.util
+import os
+import re
+import sys
+import time
+import types
+import unittest
+from unittest.mock import patch
+
+from textual.widgets import Input
+
+from vulcanai.console.console import VulcanConsole
+from vulcanai.console.logger import VulcanAILogger
+from vulcanai.core.executor import Blackboard
+
+
+# Stub sentence_transformers to avoid heavyweight imports when loading tools from files
+class _DummySentenceTransformer:
+    def __init__(self, *args, **kwargs):
+        pass
+
+    def encode(self, text, convert_to_numpy=True):
+        return None
+
+    def similarity(self, a, b):
+        return None
+
+
+sys.modules.setdefault("sentence_transformers", types.SimpleNamespace(SentenceTransformer=_DummySentenceTransformer))
+
+
+# Make src-layout importable
+CURRENT_DIR = os.path.dirname(__file__)
+SRC_DIR = os.path.abspath(os.path.join(CURRENT_DIR, os.path.pardir, os.path.pardir, "src"))
+if SRC_DIR not in sys.path:
+    sys.path.insert(0, SRC_DIR)
+RESOURCES_DIR = os.path.abspath(os.path.join(CURRENT_DIR, os.path.pardir, "resources"))
+
+# region TOOLS
+
+tools_mod = importlib.import_module("vulcanai.tools.tools")
+
+
+class FakeTool(tools_mod.AtomicTool):
+    """Small tool descriptor used by FakeRegistry for /tools output tests."""
+
+    def __init__(self, name: str, description: str = "Fake tool description",
+                 is_validation_tool=True, provide_images=True):
+        self.name = name
+        self.description = description
+        self.tags = ["empty", "fake", "tool", "move"]
+        self.input_schema = [("input", "string")]
+        self.output_schema = {"output": "bool"}
+        self.version = "0.1"
+        self.is_validation_tool = is_validation_tool
+        self.provide_images = provide_images
+
+    def run(self, **kwargs):
+        return {"arrived": True}
+
+
+# endregion
+
+# region LLM
+
+class FakeLLM:
+    def __init__(self, logger=None):
+        self.logger = logger
+
+        self.goal_return = None
+        self.goal_error = None
+        self.validation_return = None
+        self.validation_error = None
+
+    def inference_goal(self, system_prompt, user_prompt, history):
+        if self.goal_error:
+            raise self.goal_error
+        return self.goal_return
+
+    def inference_validation(self, system_prompt, user_prompt, images, history):
+        if self.validation_error:
+            raise self.validation_error
+        return self.validation_return
+
+    def set_hooks(self, _hooks) -> None:
+        self.logger.log_manager("LLM hooks set.")
+
+# region REGISTRY
+
+
+class FakeRegistry:
+    """In-memory registry used to avoid real tool discovery in most command tests."""
+
+    def __init__(self):
+        self.tools = {
+            "nav": FakeTool("nav", "Navigate to target pose."),
+            "scan": FakeTool("scan", "Scan surroundings."),
+        }
+        self.deactivated_tools = {
+            "old_tool": FakeTool("old_tool", "Deprecated tool."),
+        }
+
+    def activate_tool(self, _tool) -> bool:
+        return True
+
+    def deactivate_tool(self, _tool) -> bool:
+        return True
+
+
+class FileToolsRegistry:
+    """Registry that discovers @vulcanai_tool classes from a Python file."""
+
+    def __init__(self):
+        self.tools = {}
+        self.deactivated_tools = {}
+
+    def discover_tools_from_file(self, path: str) -> None:
+        spec = importlib.util.spec_from_file_location(f"file_tools_{id(self)}", path)
+        if spec is None or spec.loader is None:
+            raise ImportError(f"Cannot import {path}")
+
+        module = importlib.util.module_from_spec(spec)
+        spec.loader.exec_module(module)
+
+        for symbol_name in dir(module):
+            symbol = getattr(module, symbol_name)
+            if isinstance(symbol, type) and getattr(symbol, "__is_vulcanai_tool__", False):
+                tool = symbol()
+                self.tools[tool.name] = tool
+
+    def activate_tool(self, _tool) -> bool:
+        return True
+
+    def deactivate_tool(self, _tool) -> bool:
+        return True
+
+
+class ThreeToolsStatefulRegistry:
+    """In-memory registry with real activate/deactivate state transitions."""
+
+    def __init__(self):
+        self.tools = {
+            "nav": FakeTool("nav", "Navigate to target pose."),
+            "scan": FakeTool("scan", "Scan surroundings."),
+            "pick": FakeTool("pick", "Pick an object."),
+        }
+        self.deactivated_tools = {}
+
+    def activate_tool(self, tool_name) -> bool:
+        if tool_name in self.tools:
+            return False
+        if tool_name not in self.deactivated_tools:
+            return False
+        self.tools[tool_name] = self.deactivated_tools[tool_name]
+        del self.deactivated_tools[tool_name]
+        return True
+
+    def deactivate_tool(self, tool_name) -> bool:
+        if tool_name in self.deactivated_tools:
+            return False
+        if tool_name not in self.tools:
+            return False
+        self.deactivated_tools[tool_name] = self.tools[tool_name]
+        del self.tools[tool_name]
+        return True
+
+
+# region MANAGER
+
+
+class FakeManager:
+    """Minimal manager API expected by VulcanConsole command handlers."""
+
+    def __init__(self, model: str, k: int, logger):
+        self.k = k
+        self.logger = logger
+        self.history = []
+        self.history_depth = 0
+        self.bb = {}
+        self.registry = FakeRegistry()
+        self.llm = FakeLLM(logger)
+        self.logger.log_manager(f"Using OpenAI API with model: {model}")
+
+    def register_tools_from_file(self, _tool_file_path: str) -> None:
+        return
+
+    def register_tools_from_entry_points(self, _entry_point: str) -> None:
+        return
+
+    def add_user_context(self, _context: str) -> None:
+        return
+
+    def update_k_index(self, value: int) -> None:
+        self.k = value
+
+    def update_history_depth(self, value: int) -> None:
+        self.history_depth = value
+
+
+class QuietFakeManager(FakeManager):
+    """Fake manager variant that avoids logging during __init__."""
+
+    def __init__(self, model: str, k: int, logger):
+        class _FakeExecutor:
+            def run(self, _plan, _bb):
+                return {"blackboard": {"ok": True}}
+
+        self.k = k
+        self.logger = logger
+        self.history = []
+        self.history_depth = 0
+        self.bb = {}
+        self.registry = FakeRegistry()
+        self.llm = FakeLLM(logger)
+        self.executor = _FakeExecutor()
+
+
+class FileToolsFakeManager(FakeManager):
+    """Fake manager that supports file-based tool discovery and query logging."""
+
+    def __init__(self, model: str, k: int, logger):
+        super().__init__(model=model, k=k, logger=logger)
+        self.registry = FileToolsRegistry()
+
+    def register_tools_from_file(self, path: str) -> None:
+        self.registry.discover_tools_from_file(path)
+
+    def handle_user_request(self, user_text: str, context):
+        self.logger.log_manager(f"Fake LLM received query: {user_text}")
+        bb = Blackboard()
+        bb["fake_query"] = user_text
+        return {"plan": {"summary": "fake"}, "success": True, "blackboard": bb}
+
+
+class QuietFileToolsFakeManager(FileToolsFakeManager):
+    """File-tools manager variant without threaded logging side effects."""
+
+    def __init__(self, model: str, k: int, logger):
+        self.k = k
+        self.logger = logger
+        self.history = []
+        self.history_depth = 0
+        self.bb = {}
+        self.registry = FileToolsRegistry()
+        self.llm = FakeLLM(logger)
+
+    def handle_user_request(self, user_text: str, context):
+        bb = Blackboard()
+        bb["fake_query"] = user_text
+        return {"plan": {"summary": "fake"}, "success": True, "blackboard": bb}
+
+
+# region TESTS
+
+def normalize_log(msg: str) -> str:
+    """
+    Remove rich/style markup while preserving human-readable content.
+    """
+    ret = re.sub(r"\[/?#[0-9a-fA-F]{6}\]", "", msg)
+    ret = re.sub(r"\[/?(?:bold|italic|underline|reverse|dim)\]", "", ret)
+    ret = re.sub(r"<[^>]+>", "", ret)
+    ret = re.sub(r"\s+", " ", ret).strip()
+    return ret
+
+
+class FakeSink:
+    def __init__(self):
+        self.messages = []
+
+    def write(self, msg: str, color: str = "") -> None:
+        self.messages.append(msg)
+
+
+# tests helper
+class StartupTestVulcanConsole(VulcanConsole):
+    """Console variant that boots deterministically for command/startup tests."""
+
+    async def bootstrap(self) -> None:
+        # -- Initialize manager -----------------------------------------------
+
+        # Emit the same user-facing startup lines the real app emits.
+        self.logger.log_console("Initializing Manager <bold>'PlanManager'</bold>...")
+        self.manager = FakeManager(model=self.model, k=self.k, logger=self.logger)
+        self.logger.log_console(f"Manager initialized with model <bold>'{self.model.replace('ollama-', '')}</bold>'")
+        self._update_variables_panel()
+
+        # -- Add the commands (non-blocking, runs in event loop) --------------
+
+        self.commands = {
+            "/help": self.cmd_help,
+            "/tools": self.cmd_tools,
+            "/edit_tools": self.cmd_edit_tools,
+            "/change_k": self.cmd_change_k,
+            "/history": self.cmd_history_index,
+            "/show_history": self.cmd_show_history,
+            "/clear_history": self.cmd_clear_history,
+            "/plan": self.cmd_plan,
+            "/rerun": self.cmd_rerun,
+            "/bb": self.cmd_blackboard_state,
+            "/clear": self.cmd_clear,
+            "/exit": self.cmd_quit,
+        }
+
+        # Tab matches initialization
+        self.tab_matches = []
+        self.tab_index = 0
+
+        # -- Spinner controller --
+        try:
+            self.manager.llm.set_hooks(self.hooks)
+        except Exception:
+            pass
+
+        # Add user context (non-blocking)
+        self.manager.add_user_context(self.user_context)
+        # Add console to blackboard
+        self.manager.bb["console"] = self
+
+        self.is_ready = True
+        self.logger.log_console("VulcanAI Interactive Console")
+        self.logger.log_console("Use <bold>'Ctrl+Q'</bold> to quit.")
+
+        # Activate the terminal input
+        self.set_input_enabled(True)
+
+    def cmd_rerun(self, args) -> None:
+        # Test-safe /rerun implementation that avoids threaded worker complexity.
+        selected_plan = 0
+        if len(args) == 0:
+            # No index specified. Last plan selected
+            selected_plan = len(self.plans_list) - 1
+        elif len(args) != 1 or not args[0].isdigit():
+            self.logger.log_console("Usage: /rerun 'int'")
+            return
+        else:
+            selected_plan = int(args[0])
+            if selected_plan < -1:
+                self.logger.log_console("Usage: /rerun 'int' [int >= -1].")
+                return
+
+        if not self.plans_list:
+            self.logger.log_console("No plan to rerun.")
+            return
+
+        self.logger.log_console(f"Rerunning {selected_plan}-th plan...")
+        # Simulate rerun of the latest plan
+        self.logger.log_console("Output of rerun: {'ok': True}")
+
+
+# tests helper
+class FileToolsConsole(VulcanConsole):
+    """Console variant that loads tools from file and handles a fake user query."""
+
+    async def bootstrap(self) -> None:
+        self.manager = FileToolsFakeManager(model=self.model, k=self.k, logger=self.logger)
+        self.commands = {
+            "/help": self.cmd_help,
+            "/tools": self.cmd_tools,
+            "/edit_tools": self.cmd_edit_tools,
+            "/change_k": self.cmd_change_k,
+            "/history": self.cmd_history_index,
+            "/show_history": self.cmd_show_history,
+            "/clear_history": self.cmd_clear_history,
+            "/plan": self.cmd_plan,
+            "/rerun": self.cmd_rerun,
+            "/bb": self.cmd_blackboard_state,
+            "/clear": self.cmd_clear,
+            "/exit": self.cmd_quit,
+        }
+        self.tab_matches = []
+        self.tab_index = 0
+
+        for tool_file_path in self.register_from_file:
+            self.manager.register_tools_from_file(tool_file_path)
+
+        self.manager.llm.set_hooks(self.hooks)
+        self.manager.add_user_context(self.user_context)
+        self.manager.bb["console"] = self
+
+        self.is_ready = True
+        self.logger.log_console("VulcanAI Interactive Console")
+        self.logger.log_console("Use <bold>'Ctrl+Q'</bold> to quit.")
+        self.set_input_enabled(True)
+
+# TERMINAL INPUT
+class TestConsoleInputOutput(unittest.IsolatedAsyncioTestCase):
+    """End-to-end Textual UI tests focused on terminal output behavior."""
+
+    def _new_lines(self, app, start_index: int) -> list[str]:
+        """Return only the lines appended after a known index."""
+        return app.left_pannel.document.text.splitlines()[start_index:]
+
+    def _assert_new_lines_contains(self, app, start_index: int, expected_text: str) -> None:
+        """Assertion helper to check incremental log output."""
+        new_lines = self._new_lines(app, start_index)
+        self.assertTrue(
+            any(expected_text in line for line in new_lines),
+            f"Expected '{expected_text}' in new lines, got: {new_lines}",
+        )
+
+    @staticmethod
+    def _fake_init_manager_for_real_console(console) -> None:
+        # Keep startup behavior deterministic without external manager dependencies.
+        console.call_from_thread(console.logger.log_console, "Initializing Manager <bold>'PlanManager'</bold>...")
+        console.manager = QuietFakeManager(model=console.model, k=console.k, logger=console.logger)
+        console.call_from_thread(console.logger.log_manager, f"Using OpenAI API with model: {console.model}")
+        console.call_from_thread(
+            console.logger.log_console,
+            f"Manager initialized with model <bold>'{console.model.replace('ollama-', '')}</bold>'",
+        )
+        console.call_from_thread(console._update_variables_panel)
+
+    @staticmethod
+    def _fake_init_manager_for_real_console_file_tools(console) -> None:
+        # Deterministic startup with file-tools discovery support.
+        console.call_from_thread(console.logger.log_console, "Initializing Manager <bold>'PlanManager'</bold>...")
+        console.manager = QuietFileToolsFakeManager(model=console.model, k=console.k, logger=console.logger)
+        console.call_from_thread(console.logger.log_manager, f"Using OpenAI API with model: {console.model}")
+        console.call_from_thread(
+            console.logger.log_console,
+            f"Manager initialized with model <bold>'{console.model.replace('ollama-', '')}</bold>'",
+        )
+        console.call_from_thread(console._update_variables_panel)
+
+    async def test_simple_input(self):
+        # Simulate typing into the input widget and verify unknown-command output in log panel.
+        # cmd input: /echo hello
+        # expected output: "Unknown command: ..."
+        app = StartupTestVulcanConsole(model="gpt-5-nano")
+
+        # Textual test runner
+        async with app.run_test() as pilot:
+            # Lets the event loop process pending startup work
+            await pilot.pause()
+            # Waits one more cycle so async bootstrap updates finish before assertions.
+            await pilot.pause()
+            # Store the Initialization of the manager to check the terminal input logs
+            start = len(app.left_pannel.document.text.splitlines())
+            await pilot.click("#cmd")
+            await pilot.press("/", "e", "c", "h", "o", "space", "h", "e", "l", "l", "o", "enter")
+            # Wait for the command to finish
+            await pilot.pause()
+
+        lines = self._new_lines(app, start)
+        self.assertEqual(lines[0], "[USER] >>> /echo hello")
+        self.assertEqual(lines[1], "Unknown command: /echo. Type '/help'.")
+
+    async def test_simple_startup(self):
+        # Validate startup (manager initilization)
+        app = StartupTestVulcanConsole(model="gpt-5-nano")
+        cmd_disabled = True
+
+        async with app.run_test() as pilot:
+            await pilot.pause()
+            await pilot.pause()
+            cmd_disabled = app.query_one("#cmd", Input).disabled
+
+        lines = app.left_pannel.document.text.splitlines()
+        expected_subsequence = [
+            "Initializing Manager 'PlanManager'...",
+            "[MANAGER] Using OpenAI API with model: gpt-5-nano",
+            "Manager initialized with model 'gpt-5-nano'",
+            "[MANAGER] LLM hooks set.",
+            "VulcanAI Interactive Console",
+            "Use 'Ctrl+Q' to quit.",
+        ]
+
+        line_idx = 0
+        for expected in expected_subsequence:
+            while line_idx < len(lines) and lines[line_idx] != expected:
+                line_idx += 1
+            self.assertLess(line_idx, len(lines), f"Missing startup line: {expected}")
+            line_idx += 1
+
+        self.assertTrue(app.is_ready)
+        self.assertFalse(cmd_disabled)
+
+    async def test_simple_command_help(self):
+        app = StartupTestVulcanConsole(model="gpt-5-nano")
+        async with app.run_test() as pilot:
+            await pilot.pause()
+            await pilot.pause()
+
+            # Store the Initialization of the manager to check the terminal input logs
+            start = len(app.left_pannel.document.text.splitlines())
+            # Tool testing
+            app.handle_command("/help")
+            await pilot.pause()
+            # Textual log
+            self._assert_new_lines_contains(app, start, "Available commands:")
+
+    async def test_simple_command_tools(self):
+        app = StartupTestVulcanConsole(model="gpt-5-nano")
+        async with app.run_test() as pilot:
+            await pilot.pause()
+            await pilot.pause()
+
+            # Store the Initialization of the manager to check the terminal input logs
+            start = len(app.left_pannel.document.text.splitlines())
+            # Tool testing
+            app.handle_command("/tools")
+            await pilot.pause()
+            # Textual log
+            self._assert_new_lines_contains(app, start, "Available tools:")
+            self._assert_new_lines_contains(app, start, "nav:")
+            self._assert_new_lines_contains(app, start, "scan:")
+
+    async def test_simple_command_tools_from_file(self):
+        # Ensure tools decorated in tests/resources/test_tools.py are shown by /tools.
+        # Then submit a free-text query and assert manager/query output lines.
+        app = FileToolsConsole(
+            model="gpt-5-nano",
+            register_from_file=[os.path.join(RESOURCES_DIR, "test_tools.py")],
+        )
+
+        async with app.run_test() as pilot:
+            await pilot.pause()
+            await pilot.pause()
+
+            # Store the Initialization of the manager to check the terminal input logs
+            start = len(app.left_pannel.document.text.splitlines())
+            # Tool testing
+            app.handle_command("/tools")
+            await pilot.pause()
+            # Textual log
+            self._assert_new_lines_contains(app, start, "file_tool:")
+            self._assert_new_lines_contains(app, start, "new_file_tool:")
+            self._assert_new_lines_contains(app, start, "other_file_tool:")
+            self._assert_new_lines_contains(app, start, "another_validation_tool:")
+
+    async def test_simple_command_edit_tools(self):
+        app = StartupTestVulcanConsole(model="gpt-5-nano")
+        async with app.run_test() as pilot:
+            await pilot.pause()
+            await pilot.pause()
+            with patch.object(app, "open_checklist") as checklist_mock:
+                # Tool testing
+                app.handle_command("/edit_tools")
+                checklist_mock.assert_called_once()
+                call_args = checklist_mock.call_args.args
+                self.assertEqual(call_args[0], ["- nav", "- scan", "- old_tool"])
+                self.assertEqual(call_args[1], 2)
+
+    async def test_simple_command_tools_deactivate_and_activate(self):
+        app = StartupTestVulcanConsole(model="gpt-5-nano")
+        async with app.run_test() as pilot:
+            await pilot.pause()
+            await pilot.pause()
+            app.manager.registry = ThreeToolsStatefulRegistry()
+
+            start = len(app.left_pannel.document.text.splitlines())
+            app.handle_command("/tools")
+            await pilot.pause()
+            # Textual log
+            self._assert_new_lines_contains(app, start, "Available tools:")
+            self._assert_new_lines_contains(app, start, "nav:")
+            self._assert_new_lines_contains(app, start, "scan:")
+            self._assert_new_lines_contains(app, start, "pick:")
+
+            self.assertTrue(app.manager.registry.deactivate_tool("scan"))
+            self.assertIn("scan", app.manager.registry.deactivated_tools)
+            self.assertNotIn("scan", app.manager.registry.tools)
+
+            start = len(app.left_pannel.document.text.splitlines())
+            app.handle_command("/tools")
+            await pilot.pause()
+            deactivated_tools_lines = "\n".join(self._new_lines(app, start))
+            self.assertIn("nav:", deactivated_tools_lines)
+            self.assertIn("pick:", deactivated_tools_lines)
+            self.assertNotIn("scan:", deactivated_tools_lines)
+
+            self.assertTrue(app.manager.registry.activate_tool("scan"))
+            self.assertIn("scan", app.manager.registry.tools)
+            self.assertNotIn("scan", app.manager.registry.deactivated_tools)
+
+            start = len(app.left_pannel.document.text.splitlines())
+            app.handle_command("/tools")
+            await pilot.pause()
+            # Textual log
+            self._assert_new_lines_contains(app, start, "nav:")
+            self._assert_new_lines_contains(app, start, "scan:")
+            self._assert_new_lines_contains(app, start, "pick:")
+
+    async def test_simple_command_change_k(self):
+        app = StartupTestVulcanConsole(model="gpt-5-nano")
+        async with app.run_test() as pilot:
+            await pilot.pause()
+            await pilot.pause()
+
+            # Store the Initialization of the manager to check the terminal input logs
+            start = len(app.left_pannel.document.text.splitlines())
+            # Tool testing
+            app.handle_command("/change_k")
+            await pilot.pause()
+            # Textual log
+            self._assert_new_lines_contains(app, start, "Current 'k' is 7")
+
+            start = len(app.left_pannel.document.text.splitlines())
+            app.handle_command("/change_k bad")
+            await pilot.pause()
+            # Textual log
+            self._assert_new_lines_contains(app, start, "Usage: /change_k 'int'")
+
+            app.handle_command("/change_k 3")
+            await pilot.pause()
+            self.assertEqual(app.manager.k, 3)
+
+    async def test_simple_command_history(self):
+        app = StartupTestVulcanConsole(model="gpt-5-nano")
+        async with app.run_test() as pilot:
+            await pilot.pause()
+            await pilot.pause()
+
+            # Store the Initialization of the manager to check the terminal input logs
+            start = len(app.left_pannel.document.text.splitlines())
+            # Tool testing
+            app.handle_command("/history")
+            await pilot.pause()
+            # Textual log
+            self._assert_new_lines_contains(app, start, "Current 'history depth' is 0")
+
+            start = len(app.left_pannel.document.text.splitlines())
+            app.handle_command("/history bad")
+            await pilot.pause()
+            # Textual log
+            self._assert_new_lines_contains(app, start, "Usage: /history 'int'")
+
+            app.handle_command("/history 4")
+            await pilot.pause()
+            self.assertEqual(app.manager.history_depth, 4)
+
+    async def test_simple_command_show_history(self):
+        app = StartupTestVulcanConsole(model="gpt-5-nano")
+        async with app.run_test() as pilot:
+            await pilot.pause()
+            await pilot.pause()
+            app.manager.history = []
+
+            # Store the Initialization of the manager to check the terminal input logs
+            start = len(app.left_pannel.document.text.splitlines())
+            # Tool testing
+            app.handle_command("/show_history")
+            await pilot.pause()
+            # Textual log
+            self._assert_new_lines_contains(app, start, "No history available.")
+
+            app.manager.history = [("ignored_line\nPick object", "Sample plan summary")]
+            start = len(app.left_pannel.document.text.splitlines())
+            app.handle_command("/show_history")
+            await pilot.pause()
+            # Textual log
+            self._assert_new_lines_contains(app, start, "Current history:")
+            self._assert_new_lines_contains(app, start, "[USER] >>> Pick object")
+            self._assert_new_lines_contains(app, start, "Plan summary: Sample plan summary")
+
+    async def test_simple_command_clear_history(self):
+        app = StartupTestVulcanConsole(model="gpt-5-nano")
+        async with app.run_test() as pilot:
+            await pilot.pause()
+            await pilot.pause()
+            app.history = ["/help", "/tools"]
+            app.history_index = 1
+            app.plans_list = [{"plan": 1}]
+
+            # Tool testing
+            app.handle_command("/clear_history")
+            await pilot.pause()
+
+            self.assertEqual(app.history, [])
+            self.assertIsNone(app.history_index)
+            self.assertEqual(app.plans_list, [])
+            # Textual log
+            self._assert_new_lines_contains(app, 0, "History cleared.")
+
+    async def test_simple_command_plan(self):
+        app = StartupTestVulcanConsole(model="gpt-5-nano")
+        async with app.run_test() as pilot:
+            await pilot.pause()
+            await pilot.pause()
+            app.plans_list = []
+
+            # Store the Initialization of the manager to check the terminal input logs
+            start = len(app.left_pannel.document.text.splitlines())
+            # Tool testing
+            app.handle_command("/plan")
+            await pilot.pause()
+            # Textual log
+            self._assert_new_lines_contains(app, start, "No plan has been generated yet.")
+
+            app.plans_list = [{"step": "demo"}]
+            start = len(app.left_pannel.document.text.splitlines())
+            app.handle_command("/plan")
+            await pilot.pause()
+            # Textual log
+            self._assert_new_lines_contains(app, start, "Last generated plan:")
+            self._assert_new_lines_contains(app, start, "{'step': 'demo'}")
+
+    async def test_simple_command_rerun(self):
+        app = StartupTestVulcanConsole(model="gpt-5-nano")
+        async with app.run_test() as pilot:
+            await pilot.pause()
+            await pilot.pause()
+            app.plans_list = []
+
+            # Store the Initialization of the manager to check the terminal input logs
+            start = len(app.left_pannel.document.text.splitlines())
+            # Tool testing
+            app.handle_command("/rerun")
+            await pilot.pause()
+            # Textual log
+            self._assert_new_lines_contains(app, start, "No plan to rerun.")
+
+            app.plans_list = [{"step": "demo"}]
+            start = len(app.left_pannel.document.text.splitlines())
+            app.handle_command("/rerun")
+            await pilot.pause()
+            # Textual log
+            self._assert_new_lines_contains(app, start, "Rerunning 0-th plan...")
+            self._assert_new_lines_contains(app, start, "Output of rerun: {'ok': True}")
+
+    async def test_simple_command_bb(self):
+        app = StartupTestVulcanConsole(model="gpt-5-nano")
+        async with app.run_test() as pilot:
+            await pilot.pause()
+            await pilot.pause()
+            app.last_bb = None
+
+            # Store the Initialization of the manager to check the terminal input logs
+            start = len(app.left_pannel.document.text.splitlines())
+            # Tool testing
+            app.handle_command("/bb")
+            await pilot.pause()
+            # Textual log
+            self._assert_new_lines_contains(app, start, "No blackboard available.")
+
+            app.last_bb = {"key": "<value>"}
+            start = len(app.left_pannel.document.text.splitlines())
+            app.handle_command("/bb")
+            await pilot.pause()
+            # Textual log
+            self._assert_new_lines_contains(app, start, "Lastest blackboard state:")
+            self._assert_new_lines_contains(app, start, "key")
+            self._assert_new_lines_contains(app, start, "value")
+
+    async def test_simple_command_clear(self):
+        app = StartupTestVulcanConsole(model="gpt-5-nano")
+        async with app.run_test() as pilot:
+            await pilot.pause()
+            await pilot.pause()
+            app.logger.log_console("Temporary output before clear")
+            await pilot.pause()
+            self.assertTrue(len(app.left_pannel.document.text) > 0)
+
+            # Tool testing
+            app.handle_command("/clear")
+            await pilot.pause()
+            self.assertEqual(app.left_pannel.document.text, "")
+
+    async def test_simple_command_exit(self):
+        app = StartupTestVulcanConsole(model="gpt-5-nano")
+        async with app.run_test() as pilot:
+            await pilot.pause()
+            await pilot.pause()
+            with patch.object(app, "exit") as exit_mock:
+                app.handle_command("/exit")
+                exit_mock.assert_called_once()
+
+    async def test_simple_query_output(self):
+        # Ensure tools decorated in tests/resources/test_tools.py are shown by /tools.
+        # Then submit a free-text query and assert manager/query output lines.
+        app = FileToolsConsole(
+            model="gpt-5-nano",
+            register_from_file=[os.path.join(RESOURCES_DIR, "test_tools.py")],
+        )
+
+        async with app.run_test() as pilot:
+            await pilot.pause()
+            await pilot.pause()
+
+            await pilot.click("#cmd")
+            await pilot.press(
+                "t",
+                "h",
+                "i",
+                "s",
+                "space",
+                "i",
+                "s",
+                "space",
+                "a",
+                "space",
+                "q",
+                "u",
+                "e",
+                "r",
+                "y",
+                "enter",
+            )
+            await pilot.pause()
+            await pilot.pause()
+
+        lines = app.left_pannel.document.text.splitlines()
+        self.assertIn("[USER] >>> this is a query", lines)
+        self.assertIn("[MANAGER] Fake LLM received query: this is a query", lines)
+        self.assertIn("Output of plan: {'fake_query': 'this is a query'}", lines)
+
+    async def test_vulcanai_input(self):
+        app = VulcanConsole(model="gpt-5-nano")
+
+        with patch.object(VulcanConsole, "init_manager", self._fake_init_manager_for_real_console):
+            async with app.run_test(headless=True) as pilot:
+                # Lets the event loop process pending startup work
+                await pilot.pause()
+                # Waits one more cycle so async bootstrap updates finish before assertions.
+                await pilot.pause()
+
+                # Store the Initialization of the manager to check the terminal input logs
+                start = len(app.left_pannel.document.text.splitlines())
+                await pilot.click("#cmd")
+                await pilot.press("/", "e", "c", "h", "o", "space", "h", "e", "l", "l", "o", "enter")
+                # Wait for the command to finish
+                await pilot.pause()
+
+        lines = self._new_lines(app, start)
+        self.assertEqual(lines[0], "[USER] >>> /echo hello")
+        self.assertEqual(lines[1], "Unknown command: /echo. Type '/help'.")
+
+    async def test_vulcanai_startup(self):
+        # Validate startup logs using the real VulcanConsole in headless mode.
+        app = VulcanConsole(model="gpt-5-nano")
+        cmd_disabled = True
+
+        with patch.object(VulcanConsole, "init_manager", self._fake_init_manager_for_real_console):
+            async with app.run_test(headless=True) as pilot:
+                await pilot.pause()
+                await pilot.pause()
+                cmd_disabled = app.query_one("#cmd", Input).disabled
+
+        lines = app.left_pannel.document.text.splitlines()
+        expected_subsequence = [
+            "Initializing Manager 'PlanManager'...",
+            "[MANAGER] Using OpenAI API with model: gpt-5-nano",
+            "Manager initialized with model 'gpt-5-nano'",
+            "[MANAGER] LLM hooks set.",
+            "VulcanAI Interactive Console",
+            "Use 'Ctrl+Q' to quit.",
+        ]
+
+        line_idx = 0
+        for expected in expected_subsequence:
+            while line_idx < len(lines) and lines[line_idx] != expected:
+                line_idx += 1
+            self.assertLess(line_idx, len(lines), f"Missing startup line: {expected}")
+            line_idx += 1
+
+        self.assertTrue(app.is_ready)
+        self.assertFalse(cmd_disabled)
+
+    async def test_vulcanai_command_help(self):
+        app = VulcanConsole(model="gpt-5-nano")
+
+        with patch.object(VulcanConsole, "init_manager", self._fake_init_manager_for_real_console):
+            async with app.run_test(headless=True) as pilot:
+                await pilot.pause()
+                await pilot.pause()
+
+                # Store the Initialization of the manager to check the terminal input logs
+                start = len(app.left_pannel.document.text.splitlines())
+                # Tool testing
+                app.handle_command("/help")
+                await pilot.pause()
+                # Textual log
+                self._assert_new_lines_contains(app, start, "Available commands:")
+
+    async def test_vulcanai_command_tools(self):
+        app = VulcanConsole(model="gpt-5-nano")
+
+        with patch.object(VulcanConsole, "init_manager", self._fake_init_manager_for_real_console):
+            async with app.run_test(headless=True) as pilot:
+                await pilot.pause()
+                await pilot.pause()
+
+                # Store the Initialization of the manager to check the terminal input logs
+                start = len(app.left_pannel.document.text.splitlines())
+                # Tool testing
+                app.handle_command("/tools")
+                await pilot.pause()
+                # Textual log
+                self._assert_new_lines_contains(app, start, "Available tools:")
+                self._assert_new_lines_contains(app, start, "nav:")
+                self._assert_new_lines_contains(app, start, "scan:")
+
+    async def test_vulcanai_command_tools_from_file(self):
+        app = VulcanConsole(
+            model="gpt-5-nano",
+            register_from_file=[os.path.join(RESOURCES_DIR, "test_tools.py")],
+        )
+
+        with patch.object(VulcanConsole, "init_manager", self._fake_init_manager_for_real_console_file_tools):
+            async with app.run_test(headless=True) as pilot:
+                await pilot.pause()
+                await pilot.pause()
+
+                # Store the Initialization of the manager to check the terminal input logs
+                start = len(app.left_pannel.document.text.splitlines())
+                # Tool testing
+                app.handle_command("/tools")
+                await pilot.pause()
+                # Textual log
+                self._assert_new_lines_contains(app, start, "file_tool:")
+                self._assert_new_lines_contains(app, start, "new_file_tool:")
+                self._assert_new_lines_contains(app, start, "other_file_tool:")
+                self._assert_new_lines_contains(app, start, "another_validation_tool:")
+                self.assertNotIn("no_decorator_tool", app.left_pannel.document.text)
+
+    async def test_vulcanai_command_change_k(self):
+        app = VulcanConsole(model="gpt-5-nano")
+
+        with patch.object(VulcanConsole, "init_manager", self._fake_init_manager_for_real_console):
+            async with app.run_test(headless=True) as pilot:
+                await pilot.pause()
+                await pilot.pause()
+
+                # Store the Initialization of the manager to check the terminal input logs
+                start = len(app.left_pannel.document.text.splitlines())
+                # Tool testing
+                app.handle_command("/change_k")
+                await pilot.pause()
+                # Textual log
+                self._assert_new_lines_contains(app, start, "Current 'k' is 7")
+
+                start = len(app.left_pannel.document.text.splitlines())
+                app.handle_command("/change_k bad")
+                await pilot.pause()
+                # Textual log
+                self._assert_new_lines_contains(app, start, "Usage: /change_k 'int'")
+
+                app.handle_command("/change_k 3")
+                await pilot.pause()
+                self.assertEqual(app.manager.k, 3)
+
+    async def test_vulcanai_command_edit_tools(self):
+        app = VulcanConsole(model="gpt-5-nano")
+
+        with patch.object(VulcanConsole, "init_manager", self._fake_init_manager_for_real_console):
+            async with app.run_test(headless=True) as pilot:
+                await pilot.pause()
+                await pilot.pause()
+                with patch.object(app, "open_checklist") as checklist_mock:
+                    app.handle_command("/edit_tools")
+                    checklist_mock.assert_called_once()
+                    call_args = checklist_mock.call_args.args
+                    self.assertEqual(call_args[0], ["- nav", "- scan", "- old_tool"])
+                    self.assertEqual(call_args[1], 2)
+
+    async def test_vulcanai_command_history(self):
+        app = VulcanConsole(model="gpt-5-nano")
+
+        with patch.object(VulcanConsole, "init_manager", self._fake_init_manager_for_real_console):
+            async with app.run_test(headless=True) as pilot:
+                await pilot.pause()
+                await pilot.pause()
+
+                # Store the Initialization of the manager to check the terminal input logs
+                start = len(app.left_pannel.document.text.splitlines())
+                # Tool testing
+                app.handle_command("/history")
+                await pilot.pause()
+                # Textual log
+                self._assert_new_lines_contains(app, start, "Current 'history depth' is 0")
+
+                start = len(app.left_pannel.document.text.splitlines())
+                app.handle_command("/history bad")
+                await pilot.pause()
+                # Textual log
+                self._assert_new_lines_contains(app, start, "Usage: /history 'int'")
+
+                app.handle_command("/history 4")
+                await pilot.pause()
+                self.assertEqual(app.manager.history_depth, 4)
+
+    async def test_vulcanai_command_show_history(self):
+        app = VulcanConsole(model="gpt-5-nano")
+
+        with patch.object(VulcanConsole, "init_manager", self._fake_init_manager_for_real_console):
+            async with app.run_test(headless=True) as pilot:
+                await pilot.pause()
+                await pilot.pause()
+                app.manager.history = []
+
+                # Store the Initialization of the manager to check the terminal input logs
+                start = len(app.left_pannel.document.text.splitlines())
+                # Tool testing
+                app.handle_command("/show_history")
+                await pilot.pause()
+                # Textual log
+                self._assert_new_lines_contains(app, start, "No history available.")
+
+                app.manager.history = [("ignored_line\nPick object", "Sample plan summary")]
+                start = len(app.left_pannel.document.text.splitlines())
+                app.handle_command("/show_history")
+                await pilot.pause()
+                # Textual log
+                self._assert_new_lines_contains(app, start, "Current history:")
+                self._assert_new_lines_contains(app, start, "[USER] >>> Pick object")
+                self._assert_new_lines_contains(app, start, "Plan summary: Sample plan summary")
+
+    async def test_vulcanai_command_clear_history(self):
+        app = VulcanConsole(model="gpt-5-nano")
+
+        with patch.object(VulcanConsole, "init_manager", self._fake_init_manager_for_real_console):
+            async with app.run_test(headless=True) as pilot:
+                await pilot.pause()
+                await pilot.pause()
+                app.history = ["/help", "/tools"]
+                app.history_index = 1
+                app.plans_list = [{"plan": 1}]
+
+                app.handle_command("/clear_history")
+                await pilot.pause()
+
+                self.assertEqual(app.history, [])
+                self.assertIsNone(app.history_index)
+                self.assertEqual(app.plans_list, [])
+                # Textual log
+                self._assert_new_lines_contains(app, 0, "History cleared.")
+
+    async def test_vulcanai_command_plan(self):
+        app = VulcanConsole(model="gpt-5-nano")
+
+        with patch.object(VulcanConsole, "init_manager", self._fake_init_manager_for_real_console):
+            async with app.run_test(headless=True) as pilot:
+                await pilot.pause()
+                await pilot.pause()
+                app.plans_list = []
+
+                # Store the Initialization of the manager to check the terminal input logs
+                start = len(app.left_pannel.document.text.splitlines())
+                # Tool testing
+                app.handle_command("/plan")
+                await pilot.pause()
+                # Textual log
+                self._assert_new_lines_contains(app, start, "No plan has been generated yet.")
+
+                app.plans_list = [{"step": "demo"}]
+                start = len(app.left_pannel.document.text.splitlines())
+                app.handle_command("/plan")
+                await pilot.pause()
+                # Textual log
+                self._assert_new_lines_contains(app, start, "Last generated plan:")
+                self._assert_new_lines_contains(app, start, "{'step': 'demo'}")
+
+    async def test_vulcanai_command_rerun(self):
+        app = VulcanConsole(model="gpt-5-nano")
+
+        with patch.object(VulcanConsole, "init_manager", self._fake_init_manager_for_real_console):
+            async with app.run_test(headless=True) as pilot:
+                await pilot.pause()
+                await pilot.pause()
+                app.plans_list = []
+
+                # Store the Initialization of the manager to check the terminal input logs
+                start = len(app.left_pannel.document.text.splitlines())
+                # Tool testing
+                app.handle_command("/rerun")
+                await pilot.pause()
+                await pilot.pause()
+                # Textual log
+                self._assert_new_lines_contains(app, start, "No plan to rerun.")
+
+                app.plans_list = [{"step": "demo"}]
+                start = len(app.left_pannel.document.text.splitlines())
+                app.handle_command("/rerun")
+                await pilot.pause()
+                await pilot.pause()
+                # Textual log
+                self._assert_new_lines_contains(app, start, "Rerunning 0-th plan...")
+                self._assert_new_lines_contains(app, start, "Output of rerun: {'ok': True}")
+
+    async def test_vulcanai_command_bb(self):
+        app = VulcanConsole(model="gpt-5-nano")
+
+        with patch.object(VulcanConsole, "init_manager", self._fake_init_manager_for_real_console):
+            async with app.run_test(headless=True) as pilot:
+                await pilot.pause()
+                await pilot.pause()
+                app.last_bb = None
+
+                # Store the Initialization of the manager to check the terminal input logs
+                start = len(app.left_pannel.document.text.splitlines())
+                # Tool testing
+                app.handle_command("/bb")
+                await pilot.pause()
+                # Textual log
+                self._assert_new_lines_contains(app, start, "No blackboard available.")
+
+                app.last_bb = {"key": "<value>"}
+                start = len(app.left_pannel.document.text.splitlines())
+                app.handle_command("/bb")
+                await pilot.pause()
+                # Textual log
+                self._assert_new_lines_contains(app, start, "Lastest blackboard state:")
+                self._assert_new_lines_contains(app, start, "key")
+                self._assert_new_lines_contains(app, start, "value")
+
+    async def test_vulcanai_command_clear(self):
+        app = VulcanConsole(model="gpt-5-nano")
+
+        with patch.object(VulcanConsole, "init_manager", self._fake_init_manager_for_real_console):
+            async with app.run_test(headless=True) as pilot:
+                await pilot.pause()
+                await pilot.pause()
+                app.logger.log_console("Temporary output before clear")
+                await pilot.pause()
+                self.assertTrue(len(app.left_pannel.document.text) > 0)
+
+                app.handle_command("/clear")
+                await pilot.pause()
+                self.assertEqual(app.left_pannel.document.text, "")
+
+    async def test_vulcanai_command_exit(self):
+        app = VulcanConsole(model="gpt-5-nano")
+
+        with patch.object(VulcanConsole, "init_manager", self._fake_init_manager_for_real_console):
+            async with app.run_test(headless=True) as pilot:
+                await pilot.pause()
+                await pilot.pause()
+                with patch.object(app, "exit") as exit_mock:
+                    app.handle_command("/exit")
+                    exit_mock.assert_called_once()
+
+    async def test_vulcanai_query_output(self):
+        app = VulcanConsole(
+            model="gpt-5-nano",
+            register_from_file=[os.path.join(RESOURCES_DIR, "test_tools.py")],
+        )
+
+        with patch.object(VulcanConsole, "init_manager", self._fake_init_manager_for_real_console_file_tools):
+            async with app.run_test(headless=True) as pilot:
+                await pilot.pause()
+                await pilot.pause()
+                await pilot.click("#cmd")
+                await pilot.press(
+                    "t",
+                    "h",
+                    "i",
+                    "s",
+                    "space",
+                    "i",
+                    "s",
+                    "space",
+                    "a",
+                    "space",
+                    "q",
+                    "u",
+                    "e",
+                    "r",
+                    "y",
+                    "enter",
+                )
+                await pilot.pause()
+                await pilot.pause()
+
+        lines = app.left_pannel.document.text.splitlines()
+        self.assertIn("[USER] >>> this is a query", lines)
+        self.assertIn("Output of plan: {'fake_query': 'this is a query'}", lines)
+
+    # TODO.
+    # async def test_vulcanai_save_plan(self):
+    #
+    # async def test_vulcanai_load_plan(self):
+    #  gpt-5-nano, ollama-llama3.1:8b
+    #  default_tools?
+
+# endregion
+

From 49f5c530f411fb7d24f0f8b9f2e9a216d3e41c65 Mon Sep 17 00:00:00 2001
From: danipiza <dpizarrogallego@gmail.com>
Date: Tue, 24 Feb 2026 09:03:39 +0100
Subject: [PATCH 3/6] [#24196] Added textual tests - Console executor logs

Signed-off-by: danipiza <dpizarrogallego@gmail.com>
---
 tests/unittest/test_console.py | 216 +++++++++++++++++++++++++++++++++
 1 file changed, 216 insertions(+)

diff --git a/tests/unittest/test_console.py b/tests/unittest/test_console.py
index 5bd3dcc..6c500b0 100644
--- a/tests/unittest/test_console.py
+++ b/tests/unittest/test_console.py
@@ -382,6 +382,222 @@ async def bootstrap(self) -> None:
         self.logger.log_console("Use <bold>'Ctrl+Q'</bold> to quit.")
         self.set_input_enabled(True)
 
+
+# EXECUTOR PRINTS
+class TestExecutorLoggingInConsoleFile(unittest.TestCase):
+    """Executor logging-path tests kept in this console-focused test module."""
+
+    class SimpleRegistry:
+        def __init__(self):
+            self.tools = {}
+
+    class PrintTool(tools_mod.AtomicTool):
+        name = "print_tool"
+        input_schema = []
+
+        def run(self, **kwargs):
+            print("tool output")
+            return {"ok": True}
+
+    class SleepTool(tools_mod.AtomicTool):
+        name = "sleep_tool"
+        input_schema = [("duration", "float")]
+
+        def run(self, **kwargs):
+            time.sleep(kwargs.get("duration", 0.01))
+            return {"ok": True}
+
+    class ErrorTool(tools_mod.AtomicTool):
+        name = "error_tool"
+        input_schema = []
+
+        def run(self, **kwargs):
+            raise RuntimeError("boom")
+
+    def setUp(self):
+        executor_mod = importlib.import_module("vulcanai.core.executor")
+        plan_types_mod = importlib.import_module("vulcanai.core.plan_types")
+
+        self.PlanExecutor = executor_mod.PlanExecutor
+        self.Arg = plan_types_mod.ArgValue
+        self.Step = plan_types_mod.Step
+        self.PlanNode = plan_types_mod.PlanNode
+        self.PlanBase = plan_types_mod.PlanBase
+
+        # Test changes
+        self.sink = FakeSink()
+        self.logger = VulcanAILogger(sink=self.sink)
+        self.registry = self.SimpleRegistry()
+        self.exec = self.PlanExecutor(self.registry, logger=self.logger)
+
+    def _assert_executor_log_contains(self, text: str, error: bool | None = None):
+        """
+        Check if 'text' is written in the logger
+        """
+        normalized_logs = [normalize_log(m) for m in self.sink.messages]
+        executor_logs = [m for m in normalized_logs if "[EXECUTOR]" in m]
+
+        if error is None:
+            found = any(text in msg for msg in executor_logs)
+        else:
+            found = any((text in msg and ("[ERROR]" in msg) == error) for msg in executor_logs)
+
+        self.assertTrue(found, f"Missing executor log '{text}'. Logs: {executor_logs}")
+
+    def test_log_executor_plan_node_skipped_due_condition(self):
+        node = self.PlanNode(kind="SEQUENCE", steps=[], condition="False")
+        self.assertTrue(self.exec._run_plan_node(node, {}))
+        self._assert_executor_log_contains("Skipping PlanNode SEQUENCE due to not fulfilled condition=False")
+
+    def test_log_executor_plan_node_succeeded_on_attempt(self):
+        self.registry.tools["noop"] = FakeTool("noop", "No operation tool.")
+        node = self.PlanNode(kind="SEQUENCE", steps=[self.Step(tool="noop", args=[])])
+
+        # VulcanAI function
+        self.assertTrue(self.exec._run_plan_node(node, {}))
+        # Textual log
+        self._assert_executor_log_contains("PlanNode SEQUENCE succeeded on attempt")
+
+    def test_log_executor_plan_node_failed_on_attempt(self):
+        node = self.PlanNode(kind="SEQUENCE", steps=[self.Step(tool="missing", args=[])])
+        self.assertFalse(self.exec._run_plan_node(node, {}))
+        self._assert_executor_log_contains("PlanNode SEQUENCE failed on attempt", error=True)
+
+    def test_log_executor_plan_node_timeout(self):
+        self.registry.tools["sleep_tool"] = self.SleepTool()
+        node = self.PlanNode(
+            kind="SEQUENCE",
+            steps=[self.Step(tool="sleep_tool", args=[self.Arg(key="duration", val=0.05)])],
+            timeout_ms=1,
+        )
+
+        # VulcanAI function
+        self.assertFalse(self.exec._execute_plan_node_with_timeout(node, {}))
+        # Textual log
+        self._assert_executor_log_contains("PlanNode SEQUENCE timed out", error=True)
+
+    def test_log_executor_plan_node_kind_unknown(self):
+        unknown_node = type("UnknownNode", (), {"kind": "UNKNOWN", "steps": []})()
+        self.assertTrue(self.exec._execute_plan_node(unknown_node, {}))
+        self._assert_executor_log_contains("Unknown PlanNode kind UNKNOWN, skipping", error=True)
+
+    def test_log_executor_executing_on_fail_branch(self):
+        self.registry.tools["noop"] = FakeTool("noop", "No operation tool.")
+        node = self.PlanNode(
+            kind="SEQUENCE",
+            steps=[self.Step(tool="missing", args=[])],
+            on_fail=self.PlanBase(kind="SEQUENCE", steps=[self.Step(tool="noop", args=[])]),
+        )
+
+        # VulcanAI function
+        self.assertFalse(self.exec._run_plan_node(node, {}))
+        # Textual log
+        self._assert_executor_log_contains("Executing on_fail branch for PlanNode SEQUENCE")
+
+    def test_log_executor_step_skipped_due_to_condition(self):
+        self.registry.tools["noop"] = FakeTool("noop", "No operation tool.")
+        step = self.Step(tool="noop", args=[], condition="False")
+
+        # VulcanAI function
+        self.assertTrue(self.exec._run_step(step, {}))
+        # Textual log
+        self._assert_executor_log_contains("Skipping step 'noop' due to condition=False")
+
+    def test_log_executor_step_attempt_failed(self):
+        step = self.Step(tool="missing", args=[], retry=1)
+
+        # VulcanAI function
+        self.assertFalse(self.exec._run_step(step, {}))
+        # Textual log
+        self._assert_executor_log_contains("Step 'missing' attempt 1/2 failed")
+
+    def test_log_executor_step_entity_succeeded_with_criteria(self):
+        step = self.Step(tool="noop", args=[], success_criteria="True")
+
+        # VulcanAI function
+        self.assertTrue(self.exec._check_success(step, {}, is_step=True))
+        # Textual log
+        self._assert_executor_log_contains("Entity 'noop' succeeded with criteria=True")
+
+    def test_log_executor_step_entity_failed_with_criteria(self):
+        step = self.Step(tool="noop", args=[], success_criteria="False")
+
+        # VulcanAI function
+        self.assertFalse(self.exec._check_success(step, {}, is_step=True))
+        # Textual log
+        self._assert_executor_log_contains("Entity 'noop' failed with criteria=False")
+
+    def test_log_executor_condition_evaluation_failed(self):
+        # VulcanAI function
+        self.assertFalse(self.exec.safe_eval("{{", {}))
+        # Textual log
+        self._assert_executor_log_contains("Condition evaluation failed: {{", error=True)
+
+    def test_log_executor_blackboard_substitution_failed(self):
+        with patch.object(self.exec, "_get_from_bb", side_effect=RuntimeError("boom")):
+            out = self.exec._make_bb_subs("{{bb.value}}", {})
+
+        # VulcanAI function
+        self.assertEqual(out, "{{bb.value}}")
+        # Textual log
+        self._assert_executor_log_contains("Blackboard substitution failed: {{bb.value}} (boom)", error=True)
+
+    def test_log_executor_tool_not_found(self):
+        # VulcanAI function
+        ok, out = self.exec._call_tool("missing", args=[])
+        self.assertFalse(ok)
+        self.assertIsNone(out)
+        # Textual log
+        self._assert_executor_log_contains("Tool 'missing' not found", error=True)
+
+    def test_log_executor_tool_invoking(self):
+        self.registry.tools["noop"] = FakeTool("noop", "No operation tool.")
+        args = [self.Arg(key="value", val="abc")]
+
+        # VulcanAI function
+        self.exec._call_tool("noop", args=args, bb={})
+        # Textual log
+        self._assert_executor_log_contains("Invoking 'noop' with args:")
+
+    def test_log_executor_tool_stdout_log(self):
+        self.registry.tools["print_tool"] = self.PrintTool()
+
+        # VulcanAI function
+        self.exec._call_tool("print_tool", args=[], bb={})
+        # Textual log
+        self._assert_executor_log_contains("tool output: print_tool")
+
+    def test_log_executor_tool_executed_duration(self):
+        self.registry.tools["noop"] = FakeTool("noop", "No operation tool.")
+
+        # VulcanAI function
+        self.exec._call_tool("noop", args=[self.Arg(key="value", val="abc")], bb={})
+        # Textual log
+        self._assert_executor_log_contains("Executed 'noop' in")
+
+    def test_log_executor_tool_execution_timeout(self):
+        self.registry.tools["sleep_tool"] = self.SleepTool()
+
+        args = [self.Arg(key="duration", val=0.05)]
+        # VulcanAI function
+        ok, out = self.exec._call_tool("sleep_tool", args=args, timeout_ms=1, bb={})
+        self.assertFalse(ok)
+        self.assertIsNone(out)
+
+        # Textual log
+        self._assert_executor_log_contains("Execution of 'sleep_tool' timed out after 1 ms", error=False)
+
+    def test_log_executor_tool_execution_failed(self):
+        self.registry.tools["error_tool"] = self.ErrorTool()
+
+        # VulcanAI function
+        ok, out = self.exec._call_tool("error_tool", args=[], bb={})
+        self.assertFalse(ok)
+        self.assertIsNone(out)
+
+        # Textual log
+        self._assert_executor_log_contains("Execution failed for 'error_tool': boom")
+
 # TERMINAL INPUT
 class TestConsoleInputOutput(unittest.IsolatedAsyncioTestCase):
     """End-to-end Textual UI tests focused on terminal output behavior."""

From e78aec411d5d9abb987c9a9bd61b698ff71d6118 Mon Sep 17 00:00:00 2001
From: danipiza <dpizarrogallego@gmail.com>
Date: Tue, 24 Feb 2026 09:04:51 +0100
Subject: [PATCH 4/6] [#24196] Added textual tests - Console manager logs

Signed-off-by: danipiza <dpizarrogallego@gmail.com>
---
 tests/unittest/test_console.py | 368 +++++++++++++++++++++++++++++++++
 1 file changed, 368 insertions(+)

diff --git a/tests/unittest/test_console.py b/tests/unittest/test_console.py
index 6c500b0..c5afc0f 100644
--- a/tests/unittest/test_console.py
+++ b/tests/unittest/test_console.py
@@ -598,6 +598,374 @@ def test_log_executor_tool_execution_failed(self):
         # Textual log
         self._assert_executor_log_contains("Execution failed for 'error_tool': boom")
 
+# MANAGER PRINTS
+class TestManagerLoggingInConsoleFile(unittest.TestCase):
+    """Iterative manager tests kept in this console-focused test module."""
+
+    class _FakeExecutor:
+        def safe_eval(self, expr, bb):
+            if expr == "True":
+                return True
+            if expr == "False":
+                return False
+            return False
+
+    class _FakeRegistry:
+        def __init__(self, tools=None, topk_action=None, topk_validation=None):
+            self.tools = tools or {}
+            self._topk_action = topk_action if topk_action is not None else list(self.tools.values())
+            self._topk_validation = topk_validation if topk_validation is not None else []
+
+        def top_k(self, query, k, validation=False):
+            if validation:
+                return list(self._topk_validation)
+            return list(self._topk_action)
+
+    class _FakeValidator:
+        def __init__(self, side_effects):
+            self._side_effects = list(side_effects)
+
+        def validate(self, plan):
+            if not self._side_effects:
+                return
+            nxt = self._side_effects.pop(0)
+            if isinstance(nxt, Exception):
+                raise nxt
+
+    def setUp(self):
+        executor_mod = importlib.import_module("vulcanai.core.executor")
+        manager_iterator_mod = importlib.import_module("vulcanai.core.manager_iterator")
+        plan_types_mod = importlib.import_module("vulcanai.core.plan_types")
+
+        self.Blackboard = executor_mod.Blackboard
+        self.IterativeManager = manager_iterator_mod.IterativeManager
+        self.TimelineEvent = manager_iterator_mod.TimelineEvent
+        self.Step = plan_types_mod.Step
+        self.GoalSpec = plan_types_mod.GoalSpec
+        self.AIValidation = plan_types_mod.AIValidation
+
+    def _assert_manager_log_contains(self, manager, text: str, error: bool | None = None):
+        normalized_logs = [normalize_log(m) for m in manager._sink.messages]
+        manager_logs = [m for m in normalized_logs if "[MANAGER]" in m]
+        if error is None:
+            found = any(text in msg for msg in manager_logs)
+        else:
+            found = any((text in msg and ("[ERROR]" in msg) == error) for msg in manager_logs)
+        self.assertTrue(found, f"Missing manager log '{text}'. Logs: {manager_logs}")
+
+    def _new_manager(self, max_iters=2):
+        manager = self.IterativeManager.__new__(self.IterativeManager)
+        manager._sink = FakeSink()
+        manager.logger = VulcanAILogger(sink=manager._sink)
+        manager.k = 3
+        manager.history_depth = 5
+        manager.history = []
+        manager.user_context = ""
+        manager.registry = self._FakeRegistry()
+        manager.validator = None
+        manager.executor = self._FakeExecutor()
+        manager.llm = FakeLLM()
+        manager.bb = self.Blackboard()
+        manager.iter = 0
+        manager.max_iters = max_iters
+        manager.step_timeout_ms = 10000
+        manager.goal = None
+        manager._used_plans = set()
+        manager._timeline = []
+        manager._timeline_events_printed = 3
+        manager._single_tool_plan = self.IterativeManager._init_single_tool_plan(manager)
+        return manager
+
+    def _sample_plan(self, summary: str = "sample"):
+        plan_types_mod = importlib.import_module("vulcanai.core.plan_types")
+        return plan_types_mod.GlobalPlan(
+            summary=summary,
+            plan=[plan_types_mod.PlanNode(kind="SEQUENCE", steps=[plan_types_mod.Step(tool="noop", args=[])])],
+        )
+
+    def test_log_manager_error_getting_goal_from_user_request(self):
+        manager = self._new_manager(max_iters=1)
+
+        # Temporarily replaces manager._get_goal_from_user_request so it always raises RuntimeError("goal boom").
+        with patch.object(manager, "_get_goal_from_user_request", side_effect=RuntimeError("goal boom")):
+            # VulcanAI function
+            ret = manager.handle_user_request("user req", {})
+
+        self.assertIn("error", ret)
+        # Textual log
+        self._assert_manager_log_contains(manager, "Error getting goal from user request: goal boom", error=True)
+
+    def test_log_manager_iteration_banner(self):
+        manager = self._new_manager(max_iters=1)
+
+        # Temporarily replaces all other functions in manager.handle_user_request()
+        # to only print the iteration banner
+        with patch.object(manager, "_get_goal_from_user_request", return_value=self.GoalSpec(summary="g")):
+            with patch.object(manager, "_verify_progress", return_value=False):
+                with patch.object(manager, "get_plan_from_user_request", return_value=self._sample_plan("p1")):
+                    with patch.object(manager, "execute_plan", return_value={"success": True}):
+                        # VulcanAI function
+                        manager.handle_user_request("user req", {})
+        # Textual log
+        self._assert_manager_log_contains(manager, "--- Iteration 1 ---")
+
+    def test_log_manager_error_getting_plan_from_model(self):
+        manager = self._new_manager(max_iters=2)
+
+        # Temporarily replaces all other functions in manager.handle_user_request()
+        # get_plan_from_user_request returns None, then try to get another plan and then suceeds.
+        with patch.object(manager, "_get_goal_from_user_request", return_value=self.GoalSpec(summary="g")):
+            with patch.object(manager, "_verify_progress", return_value=False):
+                with patch.object(manager, "get_plan_from_user_request", side_effect=[None, self._sample_plan("p2")]):
+                    with patch.object(manager, "execute_plan", return_value={"success": True}):
+                        # VulcanAI function
+                        ret = manager.handle_user_request("user req", {})
+        self.assertIn("plan", ret)
+        # Textual log
+        self._assert_manager_log_contains(manager, "Error getting plan from model", error=True)
+
+    def test_log_manager_repeated_plan(self):
+        manager = self._new_manager(max_iters=2)
+        # Create a plan and add it to the used plans
+        repeated = self._sample_plan("repeat")
+        manager._used_plans.add(str(repeated.plan))
+
+        # Temporarily replaces all other functions in manager.handle_user_request()
+        # get_plan_from_user_request returns a repeated plan
+        with patch.object(manager, "_get_goal_from_user_request", return_value=self.GoalSpec(summary="g")):
+            with patch.object(manager, "_verify_progress", return_value=False):
+                with patch.object(manager, "get_plan_from_user_request", side_effect=[repeated, self._sample_plan("new")]):
+                    with patch.object(manager, "execute_plan", return_value={"success": True}):
+                        # VulcanAI function
+                        manager.handle_user_request("user req", {})
+        # Textual log
+        self._assert_manager_log_contains(manager, "LLM produced a repeated plan. Stopping iterations.", error=True)
+
+    def test_log_manager_plan_validation_error(self):
+        manager = self._new_manager(max_iters=2)
+        manager.validator = self._FakeValidator([RuntimeError("invalid plan"), None])
+
+        # TODO. danip
+        with patch.object(manager, "_get_goal_from_user_request", return_value=self.GoalSpec(summary="g")):
+            with patch.object(manager, "_verify_progress", return_value=False):
+                with patch.object(
+                    manager,
+                    "get_plan_from_user_request",
+                    side_effect=[self._sample_plan("p1"), self._sample_plan("p2")],
+                ):
+                    with patch.object(manager, "execute_plan", return_value={"success": True}):
+                        # VulcanAI function
+                        manager.handle_user_request("user req", {})
+        # Textual log
+        self._assert_manager_log_contains(manager, "Plan validation error. Asking for new plan: invalid plan")
+
+    def test_log_manager_iteration_failed(self):
+        manager = self._new_manager(max_iters=1)
+
+        # Temporarily replaces all other functions in manager.handle_user_request()
+        # Change the output of execute_plan() with 'False' and see the print
+        with patch.object(manager, "_get_goal_from_user_request", return_value=self.GoalSpec(summary="g")):
+            with patch.object(manager, "_verify_progress", return_value=False):
+                with patch.object(manager, "get_plan_from_user_request", return_value=self._sample_plan("p1")):
+                    with patch.object(manager, "execute_plan", return_value={"success": False}):
+                        # VulcanAI function
+                        manager.handle_user_request("user req", {})
+        # Textual log
+        self._assert_manager_log_contains(manager, "Iteration 1 failed.", error=True)
+
+    def test_log_manager_error_handling_user_request(self):
+        manager = self._new_manager(max_iters=1)
+
+        # Temporarily replaces all other functions in manager.handle_user_request()
+        # Change execute_plan() to throw an exception and see the print
+        with patch.object(manager, "_get_goal_from_user_request", return_value=self.GoalSpec(summary="g")):
+            with patch.object(manager, "_verify_progress", return_value=False):
+                with patch.object(manager, "get_plan_from_user_request", return_value=self._sample_plan("p1")):
+                    with patch.object(manager, "execute_plan", side_effect=RuntimeError("execute boom")):
+                        # VulcanAI function
+                        ret = manager.handle_user_request("user req", {})
+        self.assertEqual(ret["error"], "execute boom")
+        # Textual log
+        self._assert_manager_log_contains(manager, "Error handling user request: execute boom", error=True)
+
+    def test_log_manager_no_tools_available_in_build_prompt(self):
+        manager = self._new_manager()
+        # No tools
+        manager.registry = self._FakeRegistry(tools={}, topk_action=[])
+
+        # VulcanAI function
+        sys_prompt, user_prompt = manager._build_prompt("test", {})
+        self.assertEqual(sys_prompt, "")
+        self.assertEqual(user_prompt, "")
+        # Textual log
+        self._assert_manager_log_contains(manager, "No tools available in the registry.", error=True)
+
+    def test_log_manager_goal_received(self):
+        manager = self._new_manager()
+        manager.llm.goal_return = self.GoalSpec(summary="goal from llm")
+
+        # Temporarily replaces _build_goal_prompt() to return a tuple without executing the functions inside of it
+        with patch.object(manager, "_build_goal_prompt", return_value=("sys", "user")):
+            # VulcanAI function
+            goal = manager._get_goal_from_user_request("req", {})
+        self.assertEqual(goal.summary, "goal from llm")
+        # Textual log
+        self._assert_manager_log_contains(manager, "Goal received:")
+
+    def test_log_manager_single_tool_plan_not_initialized(self):
+        manager = self._new_manager()
+        manager._single_tool_plan = None
+
+        # VulcanAI function
+        manager._set_single_tool_params("verify_tool", [])
+        # Textual log
+        self._assert_manager_log_contains(manager, "Single tool plan is not initialized properly.", error=True)
+
+    def test_log_manager_goal_achieved_objective_mode(self):
+        manager = self._new_manager()
+        manager.goal = self.GoalSpec(summary="g", mode="objective", success_predicates=["True"], verify_tools=[])
+
+        # Temporarily replaces _run_verification_tools() to return None without executing the functions inside of it
+        with patch.object(manager, "_run_verification_tools", return_value=None):
+            # VulcanAI function
+            achieved = manager._verify_progress()
+        self.assertTrue(achieved)
+        self.assertTrue(manager.bb["goal_achieved"])
+        # Textual log
+        self._assert_manager_log_contains(manager, "Goal achieved in objective mode. Stopping iterations.")
+
+    def test_log_manager_perceptual_verification(self):
+        manager = self._new_manager()
+        verify_step = self.Step(tool="verify_tool", args=[])
+        manager.goal = self.GoalSpec(summary="g", mode="perceptual", verify_tools=[verify_step], evidence_bb_keys=["k1"])
+        manager.registry.tools["verify_tool"] = FakeTool("verify_tool", is_validation_tool=True, provide_images=True)
+        manager.bb["verify_tool"] = {"images": ["/tmp/image.png"]}
+        # No achieved (Not yet)
+        manager.llm.validation_return = self.AIValidation(success=False, confidence=0.2, explanation="not yet")
+
+        # Temporarily replaces all other functions in manager._verify_progress()
+        # And prints no instructions
+        with patch.object(manager, "_run_verification_tools", return_value=None):
+            with patch.object(manager, "_build_validation_prompt", return_value=("sys", "user")):
+                # VulcanAI function
+                manager._verify_progress()
+        # Textual log
+        self._assert_manager_log_contains(manager, "Running perceptual verification with instruction:")
+
+    def test_log_manager_perceptual_goal_achieved(self):
+        manager = self._new_manager()
+        manager.goal = self.GoalSpec(summary="g", mode="perceptual", verify_tools=[])
+        # Achieved
+        manager.llm.validation_return = self.AIValidation(success=True, confidence=0.9, explanation="done")
+
+        # Temporarily replaces all other functions in manager._verify_progress()
+        with patch.object(manager, "_run_verification_tools", return_value=None):
+            with patch.object(manager, "_build_validation_prompt", return_value=("sys", "user")):
+                # VulcanAI function
+                achieved = manager._verify_progress()
+        self.assertTrue(achieved)
+        # Textual log
+        self._assert_manager_log_contains(manager, "Goal achieved in perceptual mode. Stopping iterations.")
+
+    def test_log_manager_perceptual_goal_not_achieved(self):
+        manager = self._new_manager()
+        manager.goal = self.GoalSpec(summary="g", mode="perceptual", verify_tools=[])
+        # No achieved (No)
+        manager.llm.validation_return = self.AIValidation(success=False, confidence=0.4, explanation="no")
+
+        # Temporarily replaces all other functions in manager._verify_progress()
+        with patch.object(manager, "_run_verification_tools", return_value=None):
+            with patch.object(manager, "_build_validation_prompt", return_value=("sys", "user")):
+                # VulcanAI function
+                achieved = manager._verify_progress()
+        self.assertFalse(achieved)
+        # Textual log
+        self._assert_manager_log_contains(manager, "Goal not achieved in perceptual mode.")
+
+    def test_log_manager_perceptual_error_during_verification(self):
+        manager = self._new_manager()
+        manager.goal = self.GoalSpec(summary="g", mode="perceptual", verify_tools=[])
+        # No achieved (Exception)
+        manager.llm.validation_error = RuntimeError("validation boom")
+
+        # Temporarily replaces all other functions in manager._verify_progress()
+        with patch.object(manager, "_run_verification_tools", return_value=None):
+            with patch.object(manager, "_build_validation_prompt", return_value=("sys", "user")):
+                # VulcanAI function
+                achieved = manager._verify_progress()
+        self.assertFalse(achieved)
+        # Textual log
+        self._assert_manager_log_contains(manager, "Error during perceptual verification: validation boom", error=True)
+
+    def test_log_manager_verification_tools_skip(self):
+        manager = self._new_manager()
+        manager._timeline = [{"iteration": 1, "event": self.TimelineEvent.PLAN_REPEATED.value}]
+        tool_name = "verify_tool"
+        manager.goal = self.GoalSpec(summary="g", verify_tools=[self.Step(tool=tool_name, args=[])])
+
+        # VulcanAI function
+        manager._run_verification_tools()
+        # Textual log
+        self._assert_manager_log_contains(
+            manager, "Skipping verification tools as no plan has been executed in this iteration."
+        )
+
+    def test_log_manager_verification_tools_not_found(self):
+        manager = self._new_manager()
+        manager._timeline = [{"iteration": 0, "event": self.TimelineEvent.GOAL_SET.value}]
+        tool_name = "missing_tool"
+        manager.goal = self.GoalSpec(summary="g", verify_tools=[self.Step(tool=tool_name, args=[])])
+
+        # VulcanAI function
+        manager._run_verification_tools()
+        # Textual log
+        self._assert_manager_log_contains(manager, f"Verification tool '{tool_name}' not found in registry.", error=True)
+
+    def test_log_manager_verification_tools_running(self):
+        manager = self._new_manager()
+        manager._timeline = [{"iteration": 0, "event": self.TimelineEvent.GOAL_SET.value}]
+        tool_name = "verify_tool"
+        manager.registry.tools[tool_name] = FakeTool(tool_name)
+        manager.goal = self.GoalSpec(summary="g", verify_tools=[self.Step(tool=tool_name, args=[])])
+
+        # Temporarily replaces _run_verification_tools() to return True without executing the functions inside of it
+        with patch.object(manager, "execute_plan", return_value={"success": True}):
+            # VulcanAI function
+            manager._run_verification_tools()
+        # Textual log
+        self._assert_manager_log_contains(manager, f"Running verification tool: {tool_name}")
+
+    def test_log_manager_verification_tools_running_error(self):
+        manager = self._new_manager()
+        manager._timeline = [{"iteration": 0, "event": self.TimelineEvent.GOAL_SET.value}]
+        tool_name = "verify_tool"
+        manager.registry.tools[tool_name] = FakeTool(tool_name)
+        manager.goal = self.GoalSpec(summary="g", verify_tools=[self.Step(tool=tool_name, args=[])])
+
+        # Temporarily replaces _run_verification_tools() to return False without executing the functions inside of it
+        with patch.object(manager, "execute_plan", return_value={"success": False}):
+            # VulcanAI function
+            manager._run_verification_tools()
+        self.assertEqual(manager.bb[tool_name]["error"], "Validation tool execution failed")
+        # Textual log
+        self._assert_manager_log_contains(
+            manager, f"Error running verification tool '{tool_name}'. BB entry of this tool will be empty.", error=True
+        )
+
+    def test_log_manager_verification_tools_running_exception(self):
+        manager = self._new_manager()
+        manager._timeline = [{"iteration": 0, "event": self.TimelineEvent.GOAL_SET.value}]
+        tool_name = "verify_tool"
+        manager.registry.tools["verify_tool"] = FakeTool(tool_name)
+        manager.goal = self.GoalSpec(summary="g", verify_tools=[self.Step(tool=tool_name, args=[])])
+
+        # Temporarily replaces execute_plan() to throw an exeception without executing the functions inside of it
+        with patch.object(manager, "execute_plan", side_effect=RuntimeError("exec crash")):
+            # VulcanAI function
+            manager._run_verification_tools()
+        # Textual log
+        self._assert_manager_log_contains(manager, f"Error running verification tool '{tool_name}': exec crash", error=True)
+
 # TERMINAL INPUT
 class TestConsoleInputOutput(unittest.IsolatedAsyncioTestCase):
     """End-to-end Textual UI tests focused on terminal output behavior."""

From 67aa857747c1756d030045fc026cc2797d6ce99f Mon Sep 17 00:00:00 2001
From: danipiza <dpizarrogallego@gmail.com>
Date: Tue, 24 Feb 2026 11:03:33 +0100
Subject: [PATCH 5/6] [#24196] Added textual tests - Console queries logs

Signed-off-by: danipiza <dpizarrogallego@gmail.com>
---
 src/vulcanai/core/validator.py |  12 +-
 tests/unittest/test_console.py | 438 ++++++++++++++++++++++++++++++---
 2 files changed, 406 insertions(+), 44 deletions(-)

diff --git a/src/vulcanai/core/validator.py b/src/vulcanai/core/validator.py
index 9cf5122..8b66871 100644
--- a/src/vulcanai/core/validator.py
+++ b/src/vulcanai/core/validator.py
@@ -14,6 +14,7 @@
 
 import re
 
+from vulcanai.console.logger import VulcanAILogger
 from vulcanai.core.plan_types import GlobalPlan, PlanNode, Step
 
 TYPE_ALIAS = {"int": int, "integer": int, "float": float, "bool": bool, "boolean": bool, "str": str, "string": str}
@@ -22,8 +23,11 @@
 class PlanValidator:
     """Validates and optionally augments a plan before execution."""
 
-    def __init__(self, registry):
+    def __init__(self, registry, logger=None):
         self.registry = registry
+        # Use an isolated logger instance by default to avoid sharing sinks across
+        # unrelated contexts (e.g. Textual app tests vs plain unittest).
+        self.logger = logger or VulcanAILogger().default()
 
     def validate(self, plan: GlobalPlan):
         """
@@ -89,12 +93,12 @@ def _validate_step(self, step: Step):
                     expected_type = None
                     for schema in tool.input_schema:
                         if arg.key in schema:
-                            print(f"Schema for arg '{arg.key}' in tool '{tool.name}': {schema}")  # Debug print
+                            self.logger.log_validator(f"Schema for arg '{arg.key}' in tool '{tool.name}': {schema}")
                             # Use TYPE_ALIAS to map string type names to actual types
                             expected_type = TYPE_ALIAS.get(schema[1])
-                            print(
+                            self.logger.log_validator(
                                 f"Expected type for arg '{arg.key}' in tool '{tool.name}': {expected_type}"
-                            )  # Debug print
+                            )
                             break
                     if expected_type and not isinstance(arg.val, expected_type):
                         if expected_type is float and isinstance(arg.val, int):
diff --git a/tests/unittest/test_console.py b/tests/unittest/test_console.py
index c5afc0f..3dac489 100644
--- a/tests/unittest/test_console.py
+++ b/tests/unittest/test_console.py
@@ -44,8 +44,9 @@ def similarity(self, a, b):
 class FakeTool(tools_mod.AtomicTool):
     """Small tool descriptor used by FakeRegistry for /tools output tests."""
 
-    def __init__(self, name: str, description: str = "Fake tool description",
-                 is_validation_tool=True, provide_images=True):
+    def __init__(
+        self, name: str, description: str = "Fake tool description", is_validation_tool=True, provide_images=True
+    ):
         self.name = name
         self.description = description
         self.tags = ["empty", "fake", "tool", "move"]
@@ -63,6 +64,7 @@ def run(self, **kwargs):
 
 # region LLM
 
+
 class FakeLLM:
     def __init__(self, logger=None):
         self.logger = logger
@@ -85,20 +87,39 @@ def inference_validation(self, system_prompt, user_prompt, images, history):
     def set_hooks(self, _hooks) -> None:
         self.logger.log_manager("LLM hooks set.")
 
+
+# endregion
+
 # region REGISTRY
 
 
 class FakeRegistry:
     """In-memory registry used to avoid real tool discovery in most command tests."""
 
-    def __init__(self):
-        self.tools = {
-            "nav": FakeTool("nav", "Navigate to target pose."),
-            "scan": FakeTool("scan", "Scan surroundings."),
-        }
-        self.deactivated_tools = {
-            "old_tool": FakeTool("old_tool", "Deprecated tool."),
-        }
+    def __init__(self, tools=None, topk_action=None, topk_validation=None):
+        if tools is None:
+            self.tools = {
+                "nav": FakeTool("nav", "Navigate to target pose."),
+                "scan": FakeTool("scan", "Scan surroundings."),
+            }
+            self.deactivated_tools = {
+                "old_tool": FakeTool("old_tool", "Deprecated tool."),
+            }
+            self.validation_tools = []
+        else:
+            self.tools = tools
+
+        self._topk_action = topk_action if topk_action is not None else list(self.tools.values())
+        self._topk_validation = topk_validation if topk_validation is not None else []
+
+    def register_tool(self, tool, solve_deps: bool = True) -> None:
+        """Register a tool in-memory for tests."""
+        del solve_deps  # Unused in fake registry, kept for API compatibility
+        if tool.name in self.tools:
+            return
+        self.tools[tool.name] = tool
+        if getattr(tool, "is_validation_tool", False):
+            self.validation_tools.append(tool.name)
 
     def activate_tool(self, _tool) -> bool:
         return True
@@ -106,6 +127,11 @@ def activate_tool(self, _tool) -> bool:
     def deactivate_tool(self, _tool) -> bool:
         return True
 
+    def top_k(self, query, k, validation=False):
+        if validation:
+            return list(self._topk_validation)
+        return list(self._topk_action)
+
 
 class FileToolsRegistry:
     """Registry that discovers @vulcanai_tool classes from a Python file."""
@@ -165,6 +191,8 @@ def deactivate_tool(self, tool_name) -> bool:
         return True
 
 
+# endregion
+
 # region MANAGER
 
 
@@ -250,8 +278,11 @@ def handle_user_request(self, user_text: str, context):
         return {"plan": {"summary": "fake"}, "success": True, "blackboard": bb}
 
 
+# endregion
+
 # region TESTS
 
+
 def normalize_log(msg: str) -> str:
     """
     Remove rich/style markup while preserving human-readable content.
@@ -387,10 +418,6 @@ async def bootstrap(self) -> None:
 class TestExecutorLoggingInConsoleFile(unittest.TestCase):
     """Executor logging-path tests kept in this console-focused test module."""
 
-    class SimpleRegistry:
-        def __init__(self):
-            self.tools = {}
-
     class PrintTool(tools_mod.AtomicTool):
         name = "print_tool"
         input_schema = []
@@ -427,7 +454,7 @@ def setUp(self):
         # Test changes
         self.sink = FakeSink()
         self.logger = VulcanAILogger(sink=self.sink)
-        self.registry = self.SimpleRegistry()
+        self.registry = FakeRegistry()
         self.exec = self.PlanExecutor(self.registry, logger=self.logger)
 
     def _assert_executor_log_contains(self, text: str, error: bool | None = None):
@@ -598,6 +625,7 @@ def test_log_executor_tool_execution_failed(self):
         # Textual log
         self._assert_executor_log_contains("Execution failed for 'error_tool': boom")
 
+
 # MANAGER PRINTS
 class TestManagerLoggingInConsoleFile(unittest.TestCase):
     """Iterative manager tests kept in this console-focused test module."""
@@ -610,17 +638,6 @@ def safe_eval(self, expr, bb):
                 return False
             return False
 
-    class _FakeRegistry:
-        def __init__(self, tools=None, topk_action=None, topk_validation=None):
-            self.tools = tools or {}
-            self._topk_action = topk_action if topk_action is not None else list(self.tools.values())
-            self._topk_validation = topk_validation if topk_validation is not None else []
-
-        def top_k(self, query, k, validation=False):
-            if validation:
-                return list(self._topk_validation)
-            return list(self._topk_action)
-
     class _FakeValidator:
         def __init__(self, side_effects):
             self._side_effects = list(side_effects)
@@ -661,7 +678,7 @@ def _new_manager(self, max_iters=2):
         manager.history_depth = 5
         manager.history = []
         manager.user_context = ""
-        manager.registry = self._FakeRegistry()
+        manager.registry = FakeRegistry()
         manager.validator = None
         manager.executor = self._FakeExecutor()
         manager.llm = FakeLLM()
@@ -734,7 +751,9 @@ def test_log_manager_repeated_plan(self):
         # get_plan_from_user_request returns a repeated plan
         with patch.object(manager, "_get_goal_from_user_request", return_value=self.GoalSpec(summary="g")):
             with patch.object(manager, "_verify_progress", return_value=False):
-                with patch.object(manager, "get_plan_from_user_request", side_effect=[repeated, self._sample_plan("new")]):
+                with patch.object(
+                    manager, "get_plan_from_user_request", side_effect=[repeated, self._sample_plan("new")]
+                ):
                     with patch.object(manager, "execute_plan", return_value={"success": True}):
                         # VulcanAI function
                         manager.handle_user_request("user req", {})
@@ -745,7 +764,6 @@ def test_log_manager_plan_validation_error(self):
         manager = self._new_manager(max_iters=2)
         manager.validator = self._FakeValidator([RuntimeError("invalid plan"), None])
 
-        # TODO. danip
         with patch.object(manager, "_get_goal_from_user_request", return_value=self.GoalSpec(summary="g")):
             with patch.object(manager, "_verify_progress", return_value=False):
                 with patch.object(
@@ -791,7 +809,7 @@ def test_log_manager_error_handling_user_request(self):
     def test_log_manager_no_tools_available_in_build_prompt(self):
         manager = self._new_manager()
         # No tools
-        manager.registry = self._FakeRegistry(tools={}, topk_action=[])
+        manager.registry = FakeRegistry(tools={}, topk_action=[])
 
         # VulcanAI function
         sys_prompt, user_prompt = manager._build_prompt("test", {})
@@ -837,7 +855,9 @@ def test_log_manager_goal_achieved_objective_mode(self):
     def test_log_manager_perceptual_verification(self):
         manager = self._new_manager()
         verify_step = self.Step(tool="verify_tool", args=[])
-        manager.goal = self.GoalSpec(summary="g", mode="perceptual", verify_tools=[verify_step], evidence_bb_keys=["k1"])
+        manager.goal = self.GoalSpec(
+            summary="g", mode="perceptual", verify_tools=[verify_step], evidence_bb_keys=["k1"]
+        )
         manager.registry.tools["verify_tool"] = FakeTool("verify_tool", is_validation_tool=True, provide_images=True)
         manager.bb["verify_tool"] = {"images": ["/tmp/image.png"]}
         # No achieved (Not yet)
@@ -919,7 +939,9 @@ def test_log_manager_verification_tools_not_found(self):
         # VulcanAI function
         manager._run_verification_tools()
         # Textual log
-        self._assert_manager_log_contains(manager, f"Verification tool '{tool_name}' not found in registry.", error=True)
+        self._assert_manager_log_contains(
+            manager, f"Verification tool '{tool_name}' not found in registry.", error=True
+        )
 
     def test_log_manager_verification_tools_running(self):
         manager = self._new_manager()
@@ -964,7 +986,10 @@ def test_log_manager_verification_tools_running_exception(self):
             # VulcanAI function
             manager._run_verification_tools()
         # Textual log
-        self._assert_manager_log_contains(manager, f"Error running verification tool '{tool_name}': exec crash", error=True)
+        self._assert_manager_log_contains(
+            manager, f"Error running verification tool '{tool_name}': exec crash", error=True
+        )
+
 
 # TERMINAL INPUT
 class TestConsoleInputOutput(unittest.IsolatedAsyncioTestCase):
@@ -1749,12 +1774,345 @@ async def test_vulcanai_query_output(self):
         self.assertIn("[USER] >>> this is a query", lines)
         self.assertIn("Output of plan: {'fake_query': 'this is a query'}", lines)
 
-    # TODO.
-    # async def test_vulcanai_save_plan(self):
-    #
-    # async def test_vulcanai_load_plan(self):
-    #  gpt-5-nano, ollama-llama3.1:8b
-    #  default_tools?
 
-# endregion
+# TERMINAL PLANS
+class TestConsoleQueriesOutput(unittest.TestCase):
+    def setUp(self):
+        # Import package modules dynamically
+        tools_mod = importlib.import_module("vulcanai.tools.tools")
+        registry_mod = importlib.import_module("vulcanai.tools.tool_registry")
+        plan_types_mod = importlib.import_module("vulcanai.core.plan_types")
+        validator_mod = importlib.import_module("vulcanai.core.validator")
+        executor_mod = importlib.import_module("vulcanai.core.executor")
+
+        # Keep references
+        self.ToolRegistry = registry_mod.ToolRegistry
+        self.Validator = validator_mod.PlanValidator
+        self.PlanExecutor = executor_mod.PlanExecutor
+        self.Blackboard = executor_mod.Blackboard
+
+        # Expose for tests
+        self.GlobalPlan = plan_types_mod.GlobalPlan
+        self.PlanNode = plan_types_mod.PlanNode
+        self.PlanBase = plan_types_mod.PlanBase
+        self.Step = plan_types_mod.Step
+        self.Arg = plan_types_mod.ArgValue
+
+        self.sink = FakeSink()
+        self.logger = VulcanAILogger(sink=self.sink)
+        self.registry = FakeRegistry()
+
+        # Define and register tools
+        class EmptyTool(tools_mod.AtomicTool):
+            name = "empty"
+            description = "Empty tool."
+            input_schema = []
+            output_schema = {"result": "bool"}
+
+            def run(self):
+                return {"result": True}
+
+        class DetectTool(tools_mod.AtomicTool):
+            name = "detect_object"
+            description = "Detect an object in the environment"
+            tags = ["vision", "perception"]
+            input_schema = [("label", "string")]
+            output_schema = {"found": "bool", "pose": "dict(x: float, y: float, z: float)"}
+            version = "0.1"
+
+            def run(self, **kwargs):
+                return {"found": True, "pose": {"x": 4.0, "y": 2.0, "z": 0.0}}
+
+        class NavTool(tools_mod.AtomicTool):
+            name = "go_to_pose"
+            description = "Navigate robot to a target location"
+            tags = ["navigation", "goal", "go to", "move"]
+            input_schema = [("x", "float"), ("y", "float"), ("z", "float")]
+            output_schema = {"arrived": "bool"}
+            version = "0.1"
+
+            def run(self, **kwargs):
+                return {"arrived": True}
+
+        class SpeakTool(tools_mod.AtomicTool):
+            name = "speak"
+            description = "Speak a text string"
+            tags = ["speech", "text"]
+            input_schema = [("text", "string")]
+            output_schema = {"spoken": "bool"}
+            version = "0.1"
+
+            def run(self, **kwargs):
+                return {"spoken": True, "spoken_text": kwargs.get("text", "")}
+
+        class TypesTool(tools_mod.AtomicTool):
+            name = "types"
+            description = "Get the types of the non-string input arguments"
+            tags = ["type", "input"]
+            input_schema = [
+                ("int", "int"),
+                ("integer", "integer"),
+                ("float", "float"),
+                ("bool", "bool"),
+                ("boolean", "boolean"),
+            ]
+            output_schema = {"types": "bool"}
+            version = "0.1"
+
+            def run(self, **kwargs):
+                return {"types": True}
+
+        class FailingTool(tools_mod.AtomicTool):
+            name = "failing_tool"
+            description = "Tool that always fails at runtime"
+            input_schema = []
+            output_schema = {"ok": "bool"}
+            version = "0.1"
+
+            def run(self, **kwargs):
+                raise RuntimeError("forced failure")
+
+        self.registry.register_tool(EmptyTool())
+        self.registry.register_tool(DetectTool())
+        self.registry.register_tool(NavTool())
+        self.registry.register_tool(SpeakTool())
+        self.registry.register_tool(TypesTool())
+        self.registry.register_tool(FailingTool())
+
+        self.validator = self.Validator(self.registry, logger=self.logger)
+        self.exec = self.PlanExecutor(self.registry, logger=self.logger)
+
+    def _assert_log_contains(self, text: str, prefix: str | None = None):
+        logs = [normalize_log(msg) for msg in self.sink.messages]
+        if prefix:
+            logs = [msg for msg in logs if prefix in msg]
+        found = any(text in msg for msg in logs)
+        self.assertTrue(found, f"Missing log '{text}'. Logs: {logs}")
+
+    def _assert_log_not_contains(self, text: str):
+        logs = [normalize_log(msg) for msg in self.sink.messages]
+        self.assertFalse(any(text in msg for msg in logs), f"Unexpected log '{text}'. Logs: {logs}")
+
+    def _run_and_log_plan(self, plan):
+        self.validator.validate(plan)
+        self.logger.log_manager(f"Plan received:\n{plan}")
+        bb = self.Blackboard()
+        result = self.exec.run(plan, bb)
+        self.logger.log_console(f"Output of plan: {bb.text_snapshot()}")
+        return result
+
+    def test_log_query_correct_plan(self):
+        plan = self.GlobalPlan(
+            summary="Navigate to a location, detect an object, and speak the result",
+            plan=[
+                self.PlanNode(
+                    kind="SEQUENCE",
+                    steps=[
+                        self.Step(
+                            tool="go_to_pose",
+                            args=[self.Arg(key="x", val=1.0), self.Arg(key="y", val=2.0), self.Arg(key="z", val=0.0)],
+                        ),
+                        self.Step(tool="detect_object", args=[self.Arg(key="label", val="mug")]),
+                        self.Step(
+                            tool="go_to_pose",
+                            args=[self.Arg(key="x", val=3.0), self.Arg(key="y", val=4.0), self.Arg(key="z", val=0.0)],
+                        ),
+                        self.Step(tool="speak", args=[self.Arg(key="text", val="I have arrived and detected a mug.")]),
+                    ],
+                )
+            ],
+        )
+
+        ret = self._run_and_log_plan(plan)
+
+        self.assertTrue(ret["success"])
+
+        self._assert_log_contains("Plan received:", prefix="[MANAGER]")
+        self._assert_log_contains(
+            "Plan Summary: Navigate to a location, detect an object, and speak the result",
+            prefix="[MANAGER]",
+        )
+        self._assert_log_contains("PlanNode 1: kind=SEQUENCE", prefix="[MANAGER]")
+        self._assert_log_contains("Step 1: go_to_pose(x=1.0, y=2.0, z=0.0)", prefix="[MANAGER]")
+        self._assert_log_contains("Step 2: detect_object(label=mug)", prefix="[MANAGER]")
+        self._assert_log_contains("Step 3: go_to_pose(x=3.0, y=4.0, z=0.0)", prefix="[MANAGER]")
+        self._assert_log_contains("Step 4: speak(text=I have arrived and detected a mug.)", prefix="[MANAGER]")
+
+        self._assert_log_contains(
+            "Invoking 'go_to_pose' with args:'{'x': '1.0', 'y': '2.0', 'z': '0.0'}'",
+            prefix="[EXECUTOR]",
+        )
+        # ROS msgs
+
+        self._assert_log_contains("Invoking 'detect_object' with args:'{'label': 'mug'}'", prefix="[EXECUTOR]")
+        # ROS msgs
+        self._assert_log_contains(
+            "Invoking 'go_to_pose' with args:'{'x': '3.0', 'y': '4.0', 'z': '0.0'}'",
+            prefix="[EXECUTOR]",
+        )
+        # ROS msgs
+        self._assert_log_contains(
+            "Invoking 'speak' with args:'{'text': 'I have arrived and detected a mug.'}'",
+            prefix="[EXECUTOR]",
+        )
+        # ROS msgs
+        self._assert_log_contains("PlanNode SEQUENCE succeeded on attempt 1/1", prefix="[EXECUTOR]")
+
+        self._assert_log_contains("Output of plan: {")
+        self._assert_log_contains("'detect_object': {'found': True")
+        self._assert_log_contains("'speak': {'spoken': True")
+        self._assert_log_contains("'go_to_pose': {'arrived': True}")
+
+    def test_log_query_parallel_plan(self):
+        plan = self.GlobalPlan(
+            summary="Run detection and speech in parallel",
+            plan=[
+                self.PlanNode(
+                    kind="PARALLEL",
+                    steps=[
+                        self.Step(tool="detect_object", args=[self.Arg(key="label", val="book")]),
+                        self.Step(tool="speak", args=[self.Arg(key="text", val="Scanning now.")]),
+                    ],
+                )
+            ],
+        )
+
+        ret = self._run_and_log_plan(plan)
+
+        self.assertTrue(ret["success"])
+
+        self._assert_log_contains("PlanNode 1: kind=PARALLEL", prefix="[MANAGER]")
+        self._assert_log_contains("Step 1: detect_object(label=book)", prefix="[MANAGER]")
+        self._assert_log_contains("Step 2: speak(text=Scanning now.)", prefix="[MANAGER]")
+        self._assert_log_contains("Invoking 'detect_object' with args:'{'label': 'book'}'", prefix="[EXECUTOR]")
+        # ROS msgs
+        self._assert_log_contains("Invoking 'speak' with args:'{'text': 'Scanning now.'}'", prefix="[EXECUTOR]")
+        # ROS msgs
+        self._assert_log_contains("PlanNode PARALLEL succeeded on attempt 1/1", prefix="[EXECUTOR]")
+        self._assert_log_contains("'detect_object': {'found': True")
+        self._assert_log_contains("'speak': {'spoken': True")
+
+    def test_log_query_step_condition_skip(self):
+        plan = self.GlobalPlan(
+            summary="Move first and skip speech step",
+            plan=[
+                self.PlanNode(
+                    kind="SEQUENCE",
+                    steps=[
+                        self.Step(
+                            tool="go_to_pose",
+                            args=[self.Arg(key="x", val=1.0), self.Arg(key="y", val=1.5), self.Arg(key="z", val=0.0)],
+                        ),
+                        self.Step(
+                            tool="speak",
+                            args=[self.Arg(key="text", val="This should be skipped.")],
+                            condition="False",
+                        ),
+                    ],
+                )
+            ],
+        )
+
+        ret = self._run_and_log_plan(plan)
+
+        self.assertTrue(ret["success"])
+
+        self._assert_log_contains("PlanNode 1: kind=SEQUENCE", prefix="[MANAGER]")
+        self._assert_log_contains("Condition: False", prefix="[MANAGER]")
+        self._assert_log_contains("Skipping step 'speak' due to condition=False", prefix="[EXECUTOR]")
+        self._assert_log_contains("PlanNode SEQUENCE succeeded on attempt 1/1", prefix="[EXECUTOR]")
+        self._assert_log_contains("Output of plan: {'go_to_pose': {'arrived': True}}")
+        self._assert_log_not_contains("'speak': {'spoken': True")
+
+    def test_log_query_failing_runtime_error(self):
+        plan = self.GlobalPlan(
+            summary="Execute a tool that fails at runtime",
+            plan=[
+                self.PlanNode(
+                    kind="SEQUENCE",
+                    steps=[
+                        self.Step(tool="failing_tool", args=[]),
+                    ],
+                )
+            ],
+        )
+
+        ret = self._run_and_log_plan(plan)
+
+        self.assertFalse(ret["success"])
+
+        self._assert_log_contains("Plan received:", prefix="[MANAGER]")
+        self._assert_log_contains("Plan Summary: Execute a tool that fails at runtime", prefix="[MANAGER]")
+        self._assert_log_contains("PlanNode 1: kind=SEQUENCE", prefix="[MANAGER]")
+        self._assert_log_contains("Step 1: failing_tool(no args)", prefix="[MANAGER]")
+        self._assert_log_contains("Invoking 'failing_tool' with args:'{}'", prefix="[EXECUTOR]")
+        # ROS msgs
+        self._assert_log_contains("Execution failed for 'failing_tool': forced failure", prefix="[EXECUTOR]")
+        self._assert_log_contains("Step 'failing_tool' attempt 1/1 failed", prefix="[EXECUTOR]")
+        self._assert_log_contains("PlanNode SEQUENCE failed on attempt 1/1", prefix="[EXECUTOR]")
+        self._assert_log_contains("Output of plan: {'failing_tool': None}")
+
+    def test_log_query_failing_success_criteria(self):
+        plan = self.GlobalPlan(
+            summary="Navigate but force node-level failure criteria",
+            plan=[
+                self.PlanNode(
+                    kind="SEQUENCE",
+                    steps=[
+                        self.Step(
+                            tool="go_to_pose",
+                            args=[self.Arg(key="x", val=2.0), self.Arg(key="y", val=3.0), self.Arg(key="z", val=0.0)],
+                        ),
+                    ],
+                    success_criteria="False",
+                )
+            ],
+        )
+
+        ret = self._run_and_log_plan(plan)
 
+        self.assertFalse(ret["success"])
+
+        self._assert_log_contains("Plan received:", prefix="[MANAGER]")
+        self._assert_log_contains("Plan Summary: Navigate but force node-level failure criteria", prefix="[MANAGER]")
+        self._assert_log_contains("PlanNode 1: kind=SEQUENCE", prefix="[MANAGER]")
+        self._assert_log_contains("Success Criteria: False", prefix="[MANAGER]")
+        self._assert_log_contains(
+            "Invoking 'go_to_pose' with args:'{'x': '2.0', 'y': '3.0', 'z': '0.0'}'",
+            prefix="[EXECUTOR]",
+        )
+        # ROS msgs
+        self._assert_log_contains("Entity 'SEQUENCE' failed with criteria=False", prefix="[EXECUTOR]")
+        self._assert_log_contains("PlanNode SEQUENCE failed on attempt 1/1", prefix="[EXECUTOR]")
+        self._assert_log_contains("Output of plan: {'go_to_pose': {'arrived': True}}")
+
+    def test_log_query_failing_non_existent_tool(self):
+        # Intentionally bypass validator to exercise executor "tool not found" path.
+        plan = self.GlobalPlan(
+            summary="Try invoking a non-existent tool",
+            plan=[
+                self.PlanNode(
+                    kind="SEQUENCE",
+                    steps=[self.Step(tool="non_existent_tool", args=[])],
+                )
+            ],
+        )
+
+        self.logger.log_manager(f"Plan received:\n{plan}")
+        bb = self.Blackboard()
+        ret = self.exec.run(plan, bb)
+        self.logger.log_console(f"Output of plan: {bb.text_snapshot()}")
+
+        self.assertFalse(ret["success"])
+
+        self._assert_log_contains("Plan received:", prefix="[MANAGER]")
+        self._assert_log_contains("Plan Summary: Try invoking a non-existent tool", prefix="[MANAGER]")
+        self._assert_log_contains("PlanNode 1: kind=SEQUENCE", prefix="[MANAGER]")
+        self._assert_log_contains("Step 1: non_existent_tool(no args)", prefix="[MANAGER]")
+        self._assert_log_contains("Tool 'non_existent_tool' not found", prefix="[EXECUTOR]")
+        self._assert_log_contains("Step 'non_existent_tool' attempt 1/1 failed", prefix="[EXECUTOR]")
+        self._assert_log_contains("PlanNode SEQUENCE failed on attempt 1/1", prefix="[EXECUTOR]")
+        self._assert_log_contains("Output of plan: {'non_existent_tool': None}")
+
+
+# endregion

From 3736c415883b3f459d4216491388d7a457c91731 Mon Sep 17 00:00:00 2001
From: danipiza <dpizarrogallego@gmail.com>
Date: Tue, 24 Feb 2026 11:36:39 +0100
Subject: [PATCH 6/6] [#24196] Redirect logger from VulcanAILogger.default() to
 tests sinks

Signed-off-by: danipiza <dpizarrogallego@gmail.com>
---
 tests/unittest/test_executor.py      | 6 ++++++
 tests/unittest/test_tool_registry.py | 5 +++++
 tests/unittest/test_validator.py     | 5 +++++
 3 files changed, 16 insertions(+)

diff --git a/tests/unittest/test_executor.py b/tests/unittest/test_executor.py
index 54b2de3..ab935aa 100644
--- a/tests/unittest/test_executor.py
+++ b/tests/unittest/test_executor.py
@@ -47,6 +47,12 @@ def similarity(self, a, b):
 
 class TestPlanExecutor(unittest.TestCase):
     def setUp(self):
+        logger_mod = importlib.import_module("vulcanai.console.logger")
+        # Avoid cross-test leakage from console tests that rebind the default logger
+        # to a Textual sink requiring an active app context.
+        logger_mod.VulcanAILogger._default_instance = None
+        logger_mod.VulcanAILogger._rich_markup = True
+
         # Import package modules dynamically
         tools_mod = importlib.import_module("vulcanai.tools.tools")
         registry_mod = importlib.import_module("vulcanai.tools.tool_registry")
diff --git a/tests/unittest/test_tool_registry.py b/tests/unittest/test_tool_registry.py
index 9dc09ca..d973a28 100644
--- a/tests/unittest/test_tool_registry.py
+++ b/tests/unittest/test_tool_registry.py
@@ -49,6 +49,11 @@ def similarity(self, a, b):
 
 class TestToolRegistry(unittest.TestCase):
     def setUp(self):
+        logger_mod = importlib.import_module("vulcanai.console.logger")
+        # Avoid shared default logger state from console tests (Textual sink).
+        logger_mod.VulcanAILogger._default_instance = None
+        logger_mod.VulcanAILogger._rich_markup = True
+
         # Import package modules dynamically to avoid static import issues
         tool_registry_mod = importlib.import_module("vulcanai.tools.tool_registry")
         tools_mod = importlib.import_module("vulcanai.tools.tools")
diff --git a/tests/unittest/test_validator.py b/tests/unittest/test_validator.py
index 611ac4f..4e37d8e 100644
--- a/tests/unittest/test_validator.py
+++ b/tests/unittest/test_validator.py
@@ -46,6 +46,11 @@ def similarity(self, a, b):
 
 class TestPlanValidator(unittest.TestCase):
     def setUp(self):
+        logger_mod = importlib.import_module("vulcanai.console.logger")
+        # Avoid cross-test default logger contamination from Textual-bound sinks.
+        logger_mod.VulcanAILogger._default_instance = None
+        logger_mod.VulcanAILogger._rich_markup = True
+
         # Import package modules dynamically
         tools_mod = importlib.import_module("vulcanai.tools.tools")
         registry_mod = importlib.import_module("vulcanai.tools.tool_registry")