diff --git a/.github/workflows/run-tests-all-dbs.yml b/.github/workflows/run-tests-all-dbs.yml
index ac2efbe4..53c30de9 100644
--- a/.github/workflows/run-tests-all-dbs.yml
+++ b/.github/workflows/run-tests-all-dbs.yml
@@ -57,7 +57,7 @@ jobs:
           python -c "from flowcept.configs import MONGO_ENABLED, LMDB_ENABLED; print('MONGO?', MONGO_ENABLED); print('LMDB?', LMDB_ENABLED)"
           flowcept --init-settings --full -y
           flowcept --config-profile full-online -y
-          pytest tests --timeout=600 --ignore=tests/adapters/test_tensorboard.py --ignore=tests/misc_tests/telemetry_test.py -k "not test_decorated_function_timed"
+          pytest tests --timeout=600 --ignore=tests/adapters/test_tensorboard.py --ignore=tests/misc_tests/telemetry_test.py -m "not llm" -k "not test_decorated_function_timed"
 
       - name: Test notebooks with pytest and redis
         run: |
diff --git a/.github/workflows/run-tests-kafka-and-rabbit-mq.yml b/.github/workflows/run-tests-kafka-and-rabbit-mq.yml
new file mode 100644
index 00000000..11210c09
--- /dev/null
+++ b/.github/workflows/run-tests-kafka-and-rabbit-mq.yml
@@ -0,0 +1,166 @@
+name: (With Mongo) Tests on Kafka and RabbitMQ MQ
+on:
+  pull_request:
+    branches: [ "dev", "main" ]
+    types: [opened, synchronize, reopened]
+
+jobs:
+
+  build:
+    runs-on: ubuntu-latest
+    strategy:
+      matrix:
+        python-version: [ "3.11", "3.12" ]
+    env:
+      MONGO_ENABLED: true
+      LMDB_ENABLED: false
+    timeout-minutes: 50
+    if: "!contains(github.event.head_commit.message, 'CI Bot')"
+
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          fetch-depth: 1
+
+      - name: Set up Python ${{ matrix.python-version }}
+        uses: actions/setup-python@v5
+        with:
+          python-version: ${{ matrix.python-version }}
+          # cache: "pip"
+
+      - name: Run docker compose
+        run: docker compose -f deployment/compose-kafka.yml up -d
+
+      - name: Upgrade pip
+        run: python -m pip install --upgrade pip
+
+      - name: Show Python version
+        run: python --version && pip --version
+
+      - name: Test examples
+        run: bash .github/workflows/run_examples.sh examples true # with mongo
+
+      - name: Install all dependencies
+        run: |
+          python -m pip install .[all]
+          python -m pip install .[ml_dev]
+
+      - name: Check liveness
+        run: |
+          export MQ_TYPE=kafka
+          export MQ_PORT=9092
+          python -c 'from flowcept.configs import MQ_TYPE, MQ_PORT; print(f"MQ_TYPE={MQ_TYPE}"); print(f"MQ_PORT={MQ_PORT}")'
+          python -c 'from flowcept import Flowcept; assert Flowcept.services_alive()'
+
+      - name: Run tests with kafka
+        run: |
+          export MQ_TYPE=kafka
+          export MQ_PORT=9092
+          flowcept --init-settings --full -y
+          flowcept --config-profile full-online -y
+          pytest tests --timeout=600 --ignore=tests/adapters/test_tensorboard.py --ignore=tests/misc_tests/telemetry_test.py -m "not llm" -k "not test_decorated_function_timed"
+
+      - name: Test telemetry with kafka
+        run: |
+          export MQ_TYPE=kafka
+          export MQ_PORT=9092
+          flowcept --init-settings --full -y
+          flowcept --config-profile full-telemetry -y
+          pytest tests/misc_tests/telemetry_test.py -q
+
+      - name: Test notebooks
+        run: |
+          export MQ_TYPE=kafka
+          export MQ_PORT=9092
+          rm -f "${FLOWCEPT_SETTINGS_PATH:-$HOME/.flowcept/settings.yaml}"
+          flowcept --init-settings --full --dask --mlflow -y
+          flowcept --config-profile full-online -y
+          pytest --nbmake "notebooks/" --nbmake-timeout=600 --ignore=notebooks/dask_from_CLI.ipynb --ignore=notebooks/tensorboard.ipynb
+
+      - name: Stop services
+        run: docker compose -f deployment/compose-kafka.yml down
+
+      - name: Clean up
+        run: |
+          make clean
+          test -d /home/runner/runners/ && find /home/runner/runners/ -type f -name "*.log" -exec sh -c 'echo {}; >"{}"' \; || true
+          docker image prune -a -f
+
+  build-rabbitmq:
+    runs-on: ubuntu-latest
+    strategy:
+      matrix:
+        python-version: [ "3.11", "3.12" ]
+    env:
+      MONGO_ENABLED: true
+      LMDB_ENABLED: false
+    timeout-minutes: 50
+    if: "!contains(github.event.head_commit.message, 'CI Bot')"
+
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          fetch-depth: 1
+
+      - name: Set up Python ${{ matrix.python-version }}
+        uses: actions/setup-python@v5
+        with:
+          python-version: ${{ matrix.python-version }}
+
+      - name: Run docker compose
+        run: docker compose -f deployment/compose-rabbitmq.yml up -d
+
+      - name: Upgrade pip
+        run: python -m pip install --upgrade pip
+
+      - name: Show Python version
+        run: python --version && pip --version
+
+      - name: Test examples
+        run: bash .github/workflows/run_examples.sh examples true # with mongo
+
+      - name: Install all dependencies
+        run: |
+          python -m pip install .[all]
+          python -m pip install .[ml_dev]
+
+      - name: Check liveness
+        run: |
+          export MQ_TYPE=rabbitmq
+          export MQ_PORT=5672
+          python -c 'from flowcept.configs import MQ_TYPE, MQ_PORT; print(f"MQ_TYPE={MQ_TYPE}"); print(f"MQ_PORT={MQ_PORT}")'
+          python -c 'from flowcept import Flowcept; assert Flowcept.services_alive()'
+
+      - name: Run tests with RabbitMQ
+        run: |
+          export MQ_TYPE=rabbitmq
+          export MQ_PORT=5672
+          flowcept --init-settings --full -y
+          flowcept --config-profile full-online -y
+          pytest tests --timeout=600 --ignore=tests/adapters/test_tensorboard.py --ignore=tests/misc_tests/telemetry_test.py -m "not llm" -k "not test_decorated_function_timed"
+
+      - name: Test telemetry with RabbitMQ
+        run: |
+          export MQ_TYPE=rabbitmq
+          export MQ_PORT=5672
+          flowcept --init-settings --full -y
+          flowcept --config-profile full-telemetry -y
+          pytest tests/misc_tests/telemetry_test.py -q
+
+      - name: Test notebooks
+        run: |
+          export MQ_TYPE=rabbitmq
+          export MQ_PORT=5672
+          rm -f "${FLOWCEPT_SETTINGS_PATH:-$HOME/.flowcept/settings.yaml}"
+          flowcept --init-settings --full --dask --mlflow -y
+          flowcept --config-profile full-online -y
+          pytest --nbmake "notebooks/" --nbmake-timeout=600 --ignore=notebooks/dask_from_CLI.ipynb --ignore=notebooks/tensorboard.ipynb
+
+      - name: Stop services
+        run: docker compose -f deployment/compose-rabbitmq.yml down
+
+      - name: Clean up
+        run: |
+          make clean
+          test -d /home/runner/runners/ && find /home/runner/runners/ -type f -name "*.log" -exec sh -c 'echo {}; >"{}"' \; || true
+          docker image prune -a -f
diff --git a/.github/workflows/run-tests-kafka.yml b/.github/workflows/run-tests-kafka.yml
deleted file mode 100644
index 2d1a9add..00000000
--- a/.github/workflows/run-tests-kafka.yml
+++ /dev/null
@@ -1,87 +0,0 @@
-name: (With Mongo) Tests on Kafka MQ
-on:
-  pull_request:
-    branches: [ "dev", "main" ]
-    types: [opened, synchronize, reopened]
-
-jobs:
-
-  build:
-    runs-on: ubuntu-latest
-    strategy:
-      matrix:
-        python-version: [ "3.11", "3.12" ]
-    env:
-      MONGO_ENABLED: true
-      LMDB_ENABLED: false
-    timeout-minutes: 50
-    if: "!contains(github.event.head_commit.message, 'CI Bot')"
-
-    steps:
-      - uses: actions/checkout@v4
-        with:
-          fetch-depth: 1
-
-      - name: Set up Python ${{ matrix.python-version }}
-        uses: actions/setup-python@v5
-        with:
-          python-version: ${{ matrix.python-version }}
-          # cache: "pip"
-
-      - name: Run docker compose
-        run: docker compose -f deployment/compose-kafka.yml up -d
-
-      - name: Upgrade pip
-        run: python -m pip install --upgrade pip
-
-      - name: Show Python version
-        run: python --version && pip --version
-
-      - name: Test examples
-        run: bash .github/workflows/run_examples.sh examples true # with mongo
-
-      - name: Install all dependencies
-        run: |
-          python -m pip install .[all]
-          python -m pip install .[ml_dev]
-
-      - name: Check liveness
-        run: |
-          export MQ_TYPE=kafka
-          export MQ_PORT=9092
-          python -c 'from flowcept.configs import MQ_TYPE, MQ_PORT; print(f"MQ_TYPE={MQ_TYPE}"); print(f"MQ_PORT={MQ_PORT}")'
-          python -c 'from flowcept import Flowcept; assert Flowcept.services_alive()'
-
-      - name: Run tests with kafka
-        run: |
-          export MQ_TYPE=kafka
-          export MQ_PORT=9092
-          flowcept --init-settings --full -y
-          flowcept --config-profile full-online -y
-          pytest tests --timeout=600 --ignore=tests/adapters/test_tensorboard.py --ignore=tests/misc_tests/telemetry_test.py -k "not test_decorated_function_timed"
-
-      - name: Test telemetry with kafka
-        run: |
-          export MQ_TYPE=kafka
-          export MQ_PORT=9092
-          flowcept --init-settings --full -y
-          flowcept --config-profile full-telemetry -y
-          pytest tests/misc_tests/telemetry_test.py -q
-
-      - name: Test notebooks
-        run: |
-          export MQ_TYPE=kafka
-          export MQ_PORT=9092
-          rm -f "${FLOWCEPT_SETTINGS_PATH:-$HOME/.flowcept/settings.yaml}"
-          flowcept --init-settings --full --dask --mlflow -y
-          flowcept --config-profile full-online -y
-          pytest --nbmake "notebooks/" --nbmake-timeout=600 --ignore=notebooks/dask_from_CLI.ipynb --ignore=notebooks/tensorboard.ipynb
-
-      - name: Stop services
-        run: docker compose -f deployment/compose-kafka.yml down
-
-      - name: Clean up
-        run: |
-          make clean
-          test -d /home/runner/runners/ && find /home/runner/runners/ -type f -name "*.log" -exec sh -c 'echo {}; >"{}"' \; || true
-          docker image prune -a -f
diff --git a/.github/workflows/run-tests-py313.yml b/.github/workflows/run-tests-py313.yml
index 5f0373a4..54a98ac4 100644
--- a/.github/workflows/run-tests-py313.yml
+++ b/.github/workflows/run-tests-py313.yml
@@ -47,7 +47,7 @@ jobs:
         run: |
           flowcept --init-settings --full -y
           flowcept --config-profile full-online -y
-          pytest --ignore=tests/adapters/test_tensorboard.py --ignore=tests/adapters/test_broker.py --ignore=tests/instrumentation_tests/ml_tests/ --ignore=tests/misc_tests/telemetry_test.py -k "not test_decorated_function_timed"
+          pytest --ignore=tests/adapters/test_tensorboard.py --ignore=tests/adapters/test_broker.py --ignore=tests/instrumentation_tests/ml_tests/ --ignore=tests/misc_tests/telemetry_test.py -m "not llm" -k "not test_decorated_function_timed"
 
       - name: Shut down docker compose
         run: make services-stop-mongo
diff --git a/.github/workflows/run-tests-simple.yml b/.github/workflows/run-tests-simple.yml
index b27ed4bd..349e16a8 100644
--- a/.github/workflows/run-tests-simple.yml
+++ b/.github/workflows/run-tests-simple.yml
@@ -52,7 +52,7 @@ jobs:
         run: |
           flowcept --init-settings --full -y
           flowcept --config-profile full-online -y
-          pytest tests --timeout=600 --ignore=tests/adapters/test_tensorboard.py --ignore=tests/misc_tests/telemetry_test.py -k "not test_decorated_function_timed"
+          pytest tests --timeout=600 --ignore=tests/adapters/test_tensorboard.py --ignore=tests/misc_tests/telemetry_test.py -m "not llm" -k "not test_decorated_function_timed"
 
       - name: Test notebooks with pytest and redis
         run: |
diff --git a/.github/workflows/run-tests.yml b/.github/workflows/run-tests.yml
index 1fa2e78d..caef619e 100644
--- a/.github/workflows/run-tests.yml
+++ b/.github/workflows/run-tests.yml
@@ -51,10 +51,10 @@ jobs:
         run: |
           pip install .
           pip list
-          flowcept --init-settings -y
+          rm -f ~/.flowcept/settings.yaml flowcept_buffer.jsonl WORKFLOW_CARD.md
           python examples/start_here.py
           pip uninstall flowcept -y 
-          rm ~/.flowcept/settings.yaml
+          rm -f ~/.flowcept/settings.yaml flowcept_buffer.jsonl WORKFLOW_CARD.md
 
       - name: Start docker compose with redis
         run: make services-mongo
@@ -110,7 +110,8 @@ jobs:
           echo "=== inotify limits ==="
           cat /proc/sys/fs/inotify/max_user_watches || true
           cat /proc/sys/fs/inotify/max_user_instances || true
-          pytest tests --timeout=600 --ignore=tests/adapters/test_tensorboard.py --ignore=tests/misc_tests/telemetry_test.py -k "not test_decorated_function_timed"
+          # Below, ignoring tests that require an active LLM service provider:
+          pytest tests --timeout=600 --ignore=tests/adapters/test_tensorboard.py --ignore=tests/misc_tests/telemetry_test.py -m "not llm" -k "not test_decorated_function_timed"
 
       - name: Test decorator timing in isolated offline mode
         run: |
@@ -182,7 +183,7 @@ jobs:
           echo "=== inotify limits ==="
           cat /proc/sys/fs/inotify/max_user_watches || true
           cat /proc/sys/fs/inotify/max_user_instances || true
-          pytest tests --timeout=600 --ignore=tests/adapters/test_tensorboard.py --ignore=tests/misc_tests/telemetry_test.py -k "not test_decorated_function_timed"
+          pytest tests --timeout=600 --ignore=tests/adapters/test_tensorboard.py --ignore=tests/misc_tests/telemetry_test.py -m "not llm" -k "not test_decorated_function_timed"
 
       - name: Test telemetry in isolated telemetry mode with kafka
         run: |
diff --git a/.github/workflows/ui-checks.yml b/.github/workflows/run-ui-checks.yml
similarity index 92%
rename from .github/workflows/ui-checks.yml
rename to .github/workflows/run-ui-checks.yml
index fb15e517..995c195f 100644
--- a/.github/workflows/ui-checks.yml
+++ b/.github/workflows/run-ui-checks.yml
@@ -20,6 +20,9 @@ jobs:
       - name: Install UI dependencies
         run: make ui-install
 
+      - name: Run UI checks (lint)
+        run: make ui-checks
+
       - name: Run UI unit tests
         run: make ui-test
 
diff --git a/AGENTS.md b/AGENTS.md
index b96eb9c5..e5ec555c 100644
--- a/AGENTS.md
+++ b/AGENTS.md
@@ -3,15 +3,30 @@
 This file is the single source of truth for code-assistant behavior in this repository.
 Each major module and the UI also has its own `README.md` (under `src/flowcept/*/`, `ui/`, `tests/`, `deployment/`, `examples/`) with deeper subsystem context; read the relevant one before working in that area.
 
+## Agent Prompt Design Rule
+
+Prompts in `src/flowcept/agents/prompts/` must remain domain- and application-agnostic. Adding app-specific fields or activity names to fix one test is a design failure.
+
+Do not add few-shots to fix specific queries; revisit the prompting strategy instead.
+
+## Test Failure Rule
+
+Fix the system or the expectation — never the test data.
+
 Do not duplicate these rules in `CLAUDE.md`, `.cursor/rules`, `GEMINI.md`, `SKILL.md`, or other agent files.
 If a tool requires its own file, make that file (which should immediately go to .gitignore) a thin pointer to this one.
 
 ## 1. First Principles
 
 - Be surgical. Prefer small, reviewable changes.
-- Reuse above all. Avoid duplication and one-off fixes.
+- Before proposing any implementation or design strategy, find how the codebase already solves the same concern — same class type, same data flow, same operation. Replicate that solution exactly. If no existing pattern exists, flag it in the response before implementing.
+- Flowcept is extremely performance-sensitive, especially in the data producer path. Even small ifs, loops, or function calls in hot paths must be avoided at all costs.
+- Reuse above all. Avoid duplication and one-off fixes. Duplicating code or logic is a MAJOR problem. Avoid it at all costs. 
+- You often solve the main problem being addressed by silently injecting several other problems. Before editing a file, you need to assess the impact it will have in other parts of the code. One-off solutions bring more problems than resolve anything.
+- Separation of concerns is extremely important in this project. Mixing concerns is not acceptable. Each module in the project has a clear and separate concern. Report if you find violations.
 - Do not overengineer.
 - Prefer visible failures over fallback code that hides contract mismatches.
+- Never add defensive type checks, isinstance guards, or fallback values unless explicitly asked. Let the code break loudly.
 - Prefer `settings.yaml` over hardcoded behavior.
 - Avoid dependency pins unless there is a proven direct reason and no better practical fix.
 - Do not commit personal absolute paths.
@@ -21,11 +36,13 @@ If a tool requires its own file, make that file (which should immediately go to
 
 ## 2. Interaction Rules
 
+- Answer questions in text only. Questions ("why", "how", "is X", "should we", "assess") are never commands to write code.
+- Never edit more than what was explicitly named in the request.
+- If fixing X reveals problem Y, report Y — do not fix it.
 - Keep responses under 50 words unless the user asks for detail.
-- Do not dump large code or long explanations unless explicitly asked.
 - Before long-running operations, warn the user and ask permission.
-- During approved long operations, provide brief status updates about every minute.
-- The human user is the owner and responsible for all actions in this code. Explain tradeoffs clearly, then follow decisions.
+- The human user is the owner. Explain tradeoffs clearly, then follow decisions.
+ 
 
 ## 3. Editing Rules
 
@@ -153,7 +170,8 @@ flowcept --init-settings --full --dask --mlflow -y
 
 **TDD is mandatory for both Python and UI/frontend.** Write the test first, watch it fail, then implement until it passes.
 
-- **Python**: write a real integration test in `tests/` before the implementation. Guard service-dependent tests with `Flowcept.services_alive()` / `MONGO_ENABLED` skips. No mocks.
+- **Python**: real integration tests are in `tests/`. Before the implementation, check if what you are about to implement is already covered in both unit and the integration tests. If not, they must be. Guard service-dependent tests with skips that use `Flowcept.services_alive()` / *_ENABLED flags available in configs.py.
+- Test the real thing! No mocks. No fakes. Prefer generating new data than relying on synthetic/
 - **UI/Frontend**: write a vitest test in `ui/tests/` before adding new pure logic (store mutations, utility functions, graph algorithms). Use real data fixtures — no mocks, no DOM for pure-function and store tests. Component render tests are discouraged (fragile, high mock cost); test logic at the function/store level instead. Run with `make ui-test`.
 
 Use the `flowcept` conda environment.
@@ -201,7 +219,9 @@ Do not run tests from scratch/sandbox directories. Target `tests/` explicitly.
 - Prefer real tests over mocks. Use real services, real data, and real LLMs when feasible.
 - Avoid mock-heavy tests unless there is no practical alternative.
 - When a test fails, the correct fix is almost always to fix the implementation code, not the test; the test itself is very rarely the culprit. Always resolve warnings at their source rather than silencing them.
+- **NEVER lower test thresholds or broaden expected responses just to make a failing test pass.** Doing so hides real bugs and degrades the test suite over time. If a test fails, fix the underlying behavior.
 - **Periodically recommend running the full integration test suites** (`make tests` and `E2E_LIVE=1 make ui-e2e`) — especially after merges, significant backend or UI changes, or when the user has been iterating quickly on a feature. Mocked tests alone are not sufficient to catch regressions against real services.
+- **Tests must verify meaningful system behavior**, not code structure (file paths, imports, `hasattr` checks).
 
 
 ## 11. CI And Dependency Drift
@@ -214,7 +234,7 @@ Important CI surfaces:
 - `run-tests.yml`: broad Redis and Kafka path on push/schedule.
 - `run-tests-simple.yml`: Redis without Mongo.
 - `run-tests-offline.yml`: full offline profile.
-- `run-tests-kafka.yml`: Kafka + Mongo.
+- `run-tests-kafka-and-rabbit-mq.yml`: Kafka + RabbitMQ + Mongo.
 - `run-tests-all-dbs.yml`: Mongo and LMDB coverage.
 - `run-tests-in-container.yml`: Docker image tests.
 - `run-tests-py313.yml`: Python 3.13 subset.
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index e70ad1ca..dfe7c789 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -50,7 +50,7 @@ Several GitHub Actions cover different runtime environments:
 * [run-tests.yml](.github/workflows/run-tests.yml) runs the main test matrix, including Redis and Kafka paths.
 * [run-tests-simple.yml](.github/workflows/run-tests-simple.yml) runs tests without MongoDB.
 * [run-tests-offline.yml](.github/workflows/run-tests-offline.yml) runs the full-offline profile.
-* [run-tests-kafka.yml](.github/workflows/run-tests-kafka.yml) runs Mongo-backed tests with Kafka MQ.
+* [run-tests-kafka-and-rabbit-mq.yml](.github/workflows/run-tests-kafka-and-rabbit-mq.yml) runs Mongo-backed tests with Kafka and RabbitMQ.
 * [run-tests-all-dbs.yml](.github/workflows/run-tests-all-dbs.yml) runs Mongo and non-Mongo database paths.
 * [run-tests-in-container.yml](.github/workflows/run-tests-in-container.yml) runs tests inside the Flowcept container.
 * [run-tests-py313.yml](.github/workflows/run-tests-py313.yml) runs the Python 3.13-compatible subset.
diff --git a/Makefile b/Makefile
index 211f1cf9..4e921ab6 100644
--- a/Makefile
+++ b/Makefile
@@ -12,11 +12,14 @@ help:
 	@printf "\033[32mservices-stop-kafka\033[0m       stop Kafka services and remove attached volumes\n"
 	@printf "\033[32mservices-mofka\033[0m            run services with Mofka using Docker\n"
 	@printf "\033[32mservices-stop-mofka\033[0m       stop Mofka services and remove attached volumes\n"
+	@printf "\033[32mservices-rabbitmq\033[0m         run services with RabbitMQ using Docker\n"
+	@printf "\033[32mservices-stop-rabbitmq\033[0m    stop RabbitMQ services and remove attached volumes\n"
 	@printf "\033[32mtests\033[0m                     run unit tests with pytest\n"
 	@printf "\033[32mtests-offline\033[0m             run offline-safe tests with pytest\n"
 	@printf "\033[32mtests-in-container\033[0m        run unit tests with pytest inside Flowcept's container\n"
 	@printf "\033[32mtests-in-container-mongo\033[0m  run unit tests inside container with MongoDB\n"
-	@printf "\033[32mtests-in-container-kafka\033[0m  run unit tests inside container with Kafka and MongoDB\n"
+	@printf "\033[32mtests-in-container-kafka\033[0m     run unit tests inside container with Kafka and MongoDB\n"
+	@printf "\033[32mtests-in-container-rabbitmq\033[0m  run unit tests inside container with RabbitMQ and MongoDB\n"
 	@printf "\033[32mtests-notebooks\033[0m           test the notebooks using pytest\n"
 	@printf "\033[32mclean\033[0m                     remove cache directories and Sphinx build output\n"
 	@printf "\033[32mdocs\033[0m                      build HTML documentation using Sphinx\n"
@@ -154,6 +157,17 @@ services-mofka:
 services-stop-mofka:
 	docker compose --file deployment/compose-mofka.yml down --volumes
 
+# Run services with RabbitMQ using Docker
+services-rabbitmq:
+	docker compose --file deployment/compose-rabbitmq.yml up --detach
+
+# Stop RabbitMQ services and remove attached volumes
+services-stop-rabbitmq:
+	docker compose --file deployment/compose-rabbitmq.yml down --volumes
+
+tests-in-container-rabbitmq:
+	docker run --rm -v $(shell pwd):/flowcept -e KVDB_HOST=flowcept_redis -e MQ_HOST=flowcept_rabbitmq -e MQ_PORT=5672 -e MQ_TYPE=rabbitmq -e MONGO_HOST=flowcept_mongo -e MONGO_ENABLED=true -e LMDB_ENABLED=false --network flowcept_default flowcept /bin/bash -lc '/opt/conda/envs/flowcept/bin/flowcept --init-settings --full -y && /opt/conda/envs/flowcept/bin/flowcept --config-profile full-online -y && /opt/conda/envs/flowcept/bin/pytest tests --timeout=600 --ignore=tests/adapters/test_tensorboard.py --ignore=tests/instrumentation_tests/ml_tests --ignore=tests/misc_tests/telemetry_test.py -k "not test_decorated_function_timed"'
+
 # Run unit tests using pytest
 .PHONY: tests
 tests:
diff --git a/README.md b/README.md
index 47e32683..6b5e79e3 100644
--- a/README.md
+++ b/README.md
@@ -1,570 +1,291 @@
 <p align="center">
   <picture>
-    <!-- Dark theme -->
     <source srcset="./docs/img/flowcept-logo-dark.png" media="(prefers-color-scheme: dark)" />
-    <!-- Light theme -->
     <source srcset="./docs/img/flowcept-logo.png" media="(prefers-color-scheme: light)" />
-    <!-- Fallback -->
     <img src="./docs/img/flowcept-logo.png" alt="Flowcept Logo" width="200"/>
   </picture>
 </p>
 
-<h3 align="center">Lightweight Distributed Workflow Provenance</h3>
+<h3 align="center">Runtime provenance for distributed scientific and AI workflows</h3>
 
+<p align="center">
+Capture, stream, query, visualize, and reason over workflow lineage across ML, agentic, edge, cloud, and HPC systems.
+</p>
 
----
-
-Flowcept captures and queries workflow provenance at runtime with minimal code changes and low overhead. It unifies data from diverse tools and workflows across the Edge–Cloud–HPC continuum and provides ML-aware capture, MCP agents provenance, telemetry, extensible adapters, and flexible storage.
-
----
-
+<p align="center">
+  <a href="https://flowcept.org">Website</a> ·
+  <a href="https://flowcept.readthedocs.io/">Documentation</a> ·
+  <a href="./examples">Examples</a> ·
+  <a href="./notebooks">Notebooks</a> ·
+  <a href="https://flowcept.readthedocs.io/en/latest/publications.html">Publications</a>
+</p>
 
 [![Documentation](https://img.shields.io/badge/docs-readthedocs.io-green.svg)](https://flowcept.readthedocs.io/)
-[![Slack](https://img.shields.io/badge/Slack-%23flowcept%40Workflows%20Community-4A154B?logo=slack)](https://workflowscommunity.slack.com/archives/C06L5GYJKQS)
-[![Build](https://github.com/ORNL/flowcept/actions/workflows/create-release-n-publish.yml/badge.svg)](https://github.com/ORNL/flowcept/actions/workflows/create-release-n-publish.yml)
 [![PyPI](https://badge.fury.io/py/flowcept.svg)](https://pypi.org/project/flowcept)
 [![Tests](https://github.com/ORNL/flowcept/actions/workflows/run-tests.yml/badge.svg)](https://github.com/ORNL/flowcept/actions/workflows/run-tests.yml)
-[![Code Formatting](https://github.com/ORNL/flowcept/actions/workflows/checks.yml/badge.svg?branch=dev)](https://github.com/ORNL/flowcept/actions/workflows/checks.yml)
+[![Checks](https://github.com/ORNL/flowcept/actions/workflows/checks.yml/badge.svg)](https://github.com/ORNL/flowcept/actions/workflows/checks.yml)
 [![License: MIT](https://img.shields.io/github/license/ORNL/flowcept)](LICENSE)
 
+---
 
+## What Is Flowcept?
 
+Flowcept is a lightweight runtime provenance data management and data observability system for AI, scientific, and agentic workflows.
+It records what ran, what data were used and generated, where it ran, how long it took,
+which resources it consumed, and how workflow artifacts relate to each other, with rich context and detailed metadata.
 
-<h4 align="center">
-  <a href="https://flowcept.org">Website</a> &#8226;
-  <a href="https://flowcept.readthedocs.io/">Documentation</a> &#8226; 
-  <a href="./docs/publications">Publications</a>
-</h4>
+It is designed for workflows that are distributed, heterogeneous, and hard to inspect after the fact:
+ML training, agentic workflows, HPC jobs, edge-to-cloud-to-HPC pipelines, Workflow Management System tasks, and multi-workflow campaigns.
 
+Flowcept records can start as simple JSONL files for small local demos, move to LMDB for
+pure file-based runs, and scale to MongoDB for cloud deployments, production-style querying, dashboards, and UI use.
+For distributed runs, provenance records can also stream through a message queue while the
+workflow is still executing. The Flowcept Agent adds LLM-based interaction on top of captured
+provenance, so users can ask questions, inspect lineage, and drive visual exploration naturally, both to the in-motion data in the MQ systems or the data persisted in the database. 
 
----
+## See It In Action
+
+The Flowcept UI turns captured provenance into browsable workflow structure, data lineage,
+dashboards, workflow cards, and natural-language provenance exploration.
+
+> Place Gif here
 
-# Quickstart
+<!--
+![Flowcept UI: GridSearch provenance graph](docs/img/ui-gridsearch-dataflow.png)
+![Flowcept UI: GridSearch workflow card](docs/img/ui-gridsearch-workflow-card.png)
+-->
 
-The easiest way to capture provenance from plain Python functions, with no external services needed:
+## Why Flowcept?
 
-1) Install and initialize settings
+- **Distributed by design**: MQ-based provenance streaming with [Redis](https://redis.io) (default), [RabbitMQ](https://www.rabbitmq.com), [Kafka](https://kafka.apache.org), and [Mofka](https://mofka.readthedocs.io), plus database-backed storage for online querying.
+- **Low-overhead HPC capture**: buffer and stream provenance with low interference in large-scale jobs.
+- **Plugin-friendly capture**: instrument native code or use adapters, including PyTorch, Dask, MLflow, TensorBoard, and more.
+- **AI/ML-ready semantics**: preserve workflow, task, parameter, metric, model, tensor, artifact, telemetry, and resource-usage context.
+- **Agentic workflow lineage**: capture agent/tool execution, LLM usage, prompts, responses, and runtime provenance.
+- **Flowcept Agent**: chat naturally with captured provenance, inspect workflow data, generate workflow cards, and drive interactive visualizations.
+- **Standards-aware provenance**: Flowcept follows the [W3C PROV](https://www.w3.org/TR/prov-overview/) model and extends it for workflow, ML, and agentic execution contexts.
 
-```shell
-# Make sure you activate your Python environment (e.g., conda, venv) first
+## Quickstart (get it up in 1 minute): Capture Provenance Offline
+
+This minimal example needs no database, broker, or external service.
+
+```bash
 pip install flowcept
-flowcept --init-settings
 ```
-This generates a minimal settings file in `~/.flowcept/settings.yaml`.
-
-2) Run the minimal example
 
-Save the following script as `quickstart.py` and run `python quickstart.py.`
+Create `quickstart.py`:
 
 ```python
-"""
-A minimal example of Flowcept's instrumentation using @decorators.
-This example needs no DB, broker, or external service.
-"""
 from flowcept import Flowcept, flowcept_task
 from flowcept.instrumentation.flowcept_decorator import flowcept
 
 
-@flowcept_task(output_names="o1")
-def sum_one(i1):
-    return i1 + 1
+@flowcept_task(output_names="y")
+def add_one(x):
+    return x + 1
 
 
-@flowcept_task(output_names="o2")
-def mult_two(o1):
-    return o1 * 2
+@flowcept_task(output_names="z")
+def double(y):
+    return y * 2
 
 
 @flowcept
 def main():
-    n = 3
-    o1 = sum_one(n)
-    o2 = mult_two(o1)
-    print("Final output", o2)
+    y = add_one(3)
+    z = double(y)
+    print("result:", z)
 
 
 if __name__ == "__main__":
     main()
-
-    prov_messages = Flowcept.read_buffer_file()
-    assert len(prov_messages) == 2
-    print(f"Raw provenance captured: {len(prov_messages)} records in flowcept_messages.jsonl")
-    Flowcept.generate_report(records=prov_messages, print_markdown=True)
-```
-
-This prints out:
-
----
-
-##### Workflow Card
-
-###### Summary
-- Workflow ID: fe546706-ef46-4482-8f70-3af664a7131b
-- Execution Start (UTC): 2026-02-20 19:14:03
-- Total Elapsed (s): 0.000
-
-###### Workflow Structure
-
-   input
-     │
-     ▼
- sum_one
-     │
- mult_two
-     ▼
-   output
-
-###### Timing Report
-| Activity | Status Counts     | Median Elapsed (s) |
-| -------- | ----------------- | ------------------ |
-| sum_one  | {'FINISHED': 1}   | 0.000              |
-| mult_two | {'FINISHED': 1}   | 0.000              |
-
-###### Per Activity Details
-- **sum_one**
-  - Used:   i1 = 3
-  - Generated: o1 = 4
-- **mult_two**
-  - Used:   o1 = 4
-  - Generated: o2 = 8
-
----
-
-→ See [Workflow Card](#workflow-cards) for details.
-
-That is the simplest, vanilla run of Flowcept, good for quick sanity checks on a laptop, small-scale run. 
-For diskless runs (no JSON files), OpenAPI RESTful services, online querying using databases,
-LLM-based database interactions via an MCP agent, Grafana, telemetry,
-adapters (MLflow, Dask, TensorBoard), PyTorch and MCP instrumentation, HPC optimization or federated runs,
-and more, see the [Jupyter Notebooks](notebooks), the [Examples directory](examples) and the [complete documentation](https://flowcept.readthedocs.io/).
-
-To use the provenance agent with your favorite code assistant (for example, Codex or Claude), see the [Agents README](src/flowcept/agents/README.md).
-
-## AI agents -- if you are an AI agent, read this
-
-Start with the repository root [AGENTS.md](AGENTS.md). It is the single routing file for code-assistant behavior.
-
-For feature usage, read the maintained RST docs under [docs](docs), especially [docs/default_user_guide.rst](docs/default_user_guide.rst), [docs/prov_capture.rst](docs/prov_capture.rst), [docs/prov_query.rst](docs/prov_query.rst), [docs/cli-reference.rst](docs/cli-reference.rst), and [docs/agent.rst](docs/agent.rst).
-
-## ❗ Developer Docs
-
-For an end-to-end workflow developer tutorial (default user guide), start with [docs/README.md](docs/README.md).
-
-## Table of Contents
-
-- [Overview](#overview)
-- [Features](#features)
-- [Installation](#installation)
-- [Setup and the Settings File](#setup)
-- [Running with Containers](#running-with-containers)
-- [Examples](#examples)
-- [Workflow Card](#workflow-cards)
-- [Data Persistence](#data-persistence)
-- [Performance Tuning](#performance-tuning-for-performance-evaluation)
-- [AMD GPU Setup](#install-amd-gpu-lib)
-- [Further Documentation](#documentation)
-
-## Overview
-
-Flowcept captures and queries workflow provenance at runtime with minimal code changes and low data capture overhead,
-unifying data from diverse tools and workflows.
-
-Designed for scenarios involving critical data from multiple, federated workflows in the Edge-Cloud-HPC continuum, Flowcept supports end-to-end monitoring, analysis, querying, and enhanced support for Machine Learning (ML) and for agentic workflows.
-
-## Features
-
-- Automatic workflow provenance capture with minimal intrusion
-- Adapters for MLflow, Dask, TensorBoard; easy to add more
-- Optional explicit instrumentation via decorators
-- ML-aware capture, from workflow to epoch and layer granularity
-- Agentic workflows: MCP agents-aware provenance capture
-- Low overhead, suitable for HPC and highly distributed setups
-- Telemetry capture for CPU, GPU, memory, linked to dataflow
-- Pluggable MQ and storage backends (Redis, Kafka, MongoDB, LMDB)
-- Web UI: provenance browser, dashboards, live updates, and an embedded LLM chat agent
-- [W3C PROV](https://www.w3.org/TR/prov-overview/) adherence 
-
-Explore [Jupyter Notebooks](notebooks) and [Examples](examples) for usage.
-
-## Installation
-
-Flowcept can be installed in multiple ways, depending on your needs.
-
-### 1. Default Installation
-To install Flowcept with its basic dependencies from [PyPI](https://pypi.org/project/flowcept/), run:
-
-```shell
-pip install flowcept
-```
-
-This installs the minimal Flowcept package, **not** including MongoDB, Redis, MCP, or any adapter-specific dependencies.
-
-### 2. Installing Specific Adapters and Additional Dependencies
-
-Flowcept integrates with several tools and services, but you should **only install what you actually need**.  
-Good practice is to cherry-pick the extras relevant to your workflow instead of installing them all.
-
-```shell
-pip install flowcept[mongo]         # MongoDB support
-pip install flowcept[mlflow]        # MLflow adapter
-pip install flowcept[dask]          # Dask adapter
-pip install flowcept[tensorboard]   # TensorBoard adapter
-pip install flowcept[kafka]         # Kafka message queue
-pip install flowcept[nvidia]        # NVIDIA GPU runtime capture
-pip install flowcept[amd]           # AMD GPU runtime capture (see "Install AMD GPU Lib" for version/LD_LIBRARY_PATH notes)
-pip install flowcept[telemetry]     # CPU/GPU/memory telemetry capture
-pip install flowcept[lmdb]          # LMDB lightweight database
-pip install flowcept[mqtt]          # MQTT support
-pip install flowcept[llm_agent]     # MCP agent, LangChain, Streamlit integration: needed either for MCP capture or for the Flowcept Agent.
-pip install flowcept[llm_google]    # Google GenAI + Flowcept agent support
-pip install flowcept[dev]           # Developer dependencies (docs, tests, lint, etc.)
-```
-
-### 3. Installing with Common Runtime Bundle
-
-```shell
-pip install flowcept[extras]
+    # print(Flowcept.read_buffer_file())  # inspect raw JSONL records if needed
+    Flowcept.generate_report(print_markdown=True)
 ```
 
-The `extras` group is a convenience shortcut that bundles the most common runtime dependencies.  
-It is intended for users who want a fairly complete, but not maximal, Flowcept environment.
-
-You might choose `flowcept[extras]` if:
-
-- You want Flowcept to run out-of-the-box with Redis, telemetry, and MongoDB.  
-- You prefer not to install each extra one by one
-
-⚠️ If you only need one of these features, install it individually instead of `extras`.
-
-### 4. Install All Optional Dependencies at Once
-
-Flowcept provides a combined all extra, but installing everything into a single environment is not recommended for users.
-Many of these dependencies are unrelated and should not be mixed in the same runtime. This option is only intended for Flowcept developers who need to test across all adapters and integrations.
-
-```
-pip install flowcept[all]
-```
+Run it:
 
-### 5. Installing from Source
-To install Flowcept from the source repository:
-
-```
-git clone https://github.com/ORNL/flowcept.git
-cd flowcept
-pip install .
-```
-
-You can then install specific dependencies similarly as above:
-
-```
-pip install .[optional_dependency_name]
+```bash
+python quickstart.py
 ```
 
-This follows the same pattern as step 2, allowing for a customized installation from source.
-
-## Setup
+Flowcept captures task inputs, outputs, timing, workflow structure, and writes a local JSONL buffer.
+The final line reads the default buffer file and prints a workflow card.
 
-The [Quickstart](#quickstart) example works with just `pip install flowcept`, no extra setup is required.
+For the maintained tutorial, read the [Quick Start](https://flowcept.readthedocs.io/en/latest/quick_start.html).
 
-For online queries or distributed capture, Flowcept relies on two optional components:
+## Use The Web UI
 
-- **Message Queue (MQ)** — message broker / pub-sub / data stream  
-- **Database (DB)** — persistent storage for historical queries  
-
----
-
-#### Message Queue (MQ)
-
-- Required for anything beyond Quickstart  
-- Flowcept publishes provenance data to the MQ during workflow runs  
-- Developers can subscribe with custom consumers (see [this example](examples/consumers/simple_consumer.py).  
-- You can monitor or print messages in motion using `flowcept --stream-messages --print`.  
-
-Supported MQs:
-- [Redis](https://redis.io) → **default**, lightweight, works on Linux, macOS, Windows, and HPC (tested on [Frontier](link) and [Summit](link))  
-- [Kafka](https://kafka.apache.org) → for distributed environments or if Kafka is already in your stack  
-- [Mofka](https://mofka.readthedocs.io) → optimized for HPC runs  
-
----
-
-#### Database (DB)
-
-- **Optional**, but required for:
-  - Persisting provenance beyond MQ memory/disk buffers  
-  - Running complex analytical queries on historical data  
-
-Supported DBs:
-- [MongoDB](https://www.mongodb.com) → default, efficient bulk writes + rich query support  
-- [LMDB](https://lmdb.readthedocs.io) → lightweight, no external service, basic query capabilities  
-
----
-
-### Notes
-
-- Without a DB:
-  - Provenance remains in the MQ only (persistence not guaranteed)  
-  - Complex historical queries are unavailable  
-- Flowcept’s architecture is modular: other MQs and DBs (graph, relational, etc.) can be added in the future  
-- Deployment examples for MQ and DB are provided in the [deployment](deployment) directory  
- 
-
-### Downloading and Starting External Services (MQ or DB)
-
-Flowcept uses external services for message queues (MQ) and databases (DB). You can start them with Docker Compose, plain containers, or directly on your host.
-
----
-
-#### Using Docker Compose (recommended)
-
-We provide a [Makefile](deployment/Makefile) with shortcuts:
-
-1. **Redis only (no DB)**: `make services`   (LMDB can be used in this setup as a lightweight DB)
-2. **Redis + MongoDB**: `make services-mongo`
-3. **Kafka + MongoDB**: `make services-kafka`
-4. **Mofka only (no DB)**: `make services-mofka`
-
-To customize, edit the YAML files in [deployment](deployment/) and run `docker compose -f deployment/<compose-file>.yml up -d`
-
----
-
-#### Using Docker (without Compose)
-
-See the [deployment/](deployment/) compose files for expected images and configurations. You can adapt them to your environment and use standard `docker pull / run / exec` commands.
-
----
-
-#### Running on the Host (no containers)
-
-1. Install binaries for the service you need:  
-   - **macOS** users can install with [Homebrew](https://brew.sh).  
-     Example for Redis:
-     ```bash
-     brew install redis
-     brew services start redis
-     ```
-
-   - On Linux, use your distro package manager (e.g. `apt`, `dnf`, `yum`) 
-   - If non-root (typically the case if you want to deploy these services locally in an HPC system), search for the installed binaries for your OS/hardware architecture, download them in a directory that you have r+w permission, and run them.
-   - On Windows, utilize [WSL](https://learn.microsoft.com/en-us/windows/wsl/install) to use a Linux distro.
-
-2. Start services normally (`redis-server`, `mongod`, `kafka-server-start.sh`, etc.).
-
-## Flowcept Settings File
-
-Flowcept uses a settings file for configuration.
-
-- To create a minimal settings file, run: `flowcept --init-settings` → creates `~/.flowcept/settings.yaml`
-
-- To copy the full sample settings file, run: `flowcept --init-settings --full` → creates `~/.flowcept/settings.yaml`
-
-- To switch runtime mode, apply a profile after creating the file:
+For interactive and live provenance exploration, run Flowcept with MongoDB and the webservice.
+The UI shows captured workflows, so run one or more workflows after the service is up to populate the database.
 
 ```bash
+pip install "flowcept[webservice,mongo]"
+make services-mongo
 flowcept --init-settings --full -y
 flowcept --config-profile full-online -y
+flowcept --start-ui
 ```
 
-Meaning:
+Open `http://localhost:8008`.
 
-- `--init-settings` = minimal file with default settings.
-- `--init-settings --full` = copy `resources/sample_settings.yaml`
-- `--config-profile ...` = overlay a runtime mode on top of the existing file
-
----
-
-#### What You Can Configure
-
-- Message queue and database routes, ports, and paths  
-- MCP agent ports and LLM API keys  
-- Buffer sizes and flush settings  
-- Telemetry capture settings  
-- Instrumentation and PyTorch details  
-- Log levels  
-- Data observability adapters  
-- And more (see [example file](resources/sample_settings.yaml))  
-
----
-
-#### Custom Settings File
-
-Flowcept looks for its settings in the following order:
-
-1. Environment variable `FLOWCEPT_SETTINGS_PATH` — if set, Flowcept will use this path
-2. `~/.flowcept/settings.yaml` — created by running `flowcept --init-settings`  
-3. [Default sample file](resources/sample_settings.yaml) — used if neither of the above is found
-
-Important:
-
-- environment variables can override settings values
-- use profiles for mode switches such as `full-online`, `full-offline`, `mq-only`, `mq-only-no-flush`, `full-telemetry`
-- adapter flags are additive:
+In another terminal, run a workflow with the same online settings, for example:
 
 ```bash
-flowcept --init-settings --dask -y
-flowcept --init-settings --mlflow -y
-flowcept --init-settings --tensorboard -y
+python examples/start_here.py
 ```
 
-They add `adapters.<name>` to the current settings file instead of replacing the whole file.
+The UI provides:
 
-# Examples
+- **Workflow and campaign browser** for runs, tasks, artifacts, and agents.
+- **Dataflow graph** for W3C PROV-style task/data lineage.
+- **Task and data inspectors** for metadata, inputs, outputs, timing, and artifact details.
+- **Dashboards** for runtime summaries and workflow metrics.
+- **Workflow cards** downloadable as Markdown or PDF.
+- **Chat agent** for natural-language questions and interactive provenance visualization.
 
-### Adapters and Notebooks
+See the [Web UI docs](https://flowcept.readthedocs.io/en/latest/web_ui.html) and [ui/README.md](ui/README.md).
 
- See the [Jupyter Notebooks](notebooks) and [Examples directory](examples) for utilization examples.
+## Flowcept Agent
 
-## Workflow Cards
+The Flowcept Agent lets users ask natural language questions over captured provenance instead of hand-writing queries.
+It supports two complementary modes:
 
-The [Quickstart](#quickstart) example (`python quickstart.py`) shows a workflow card.
+- **Web chat**: built into the Flowcept UI. The chat webservice route calls Flowcept's LangChain tool orchestrator and keeps answers scoped to the workflow or campaign being viewed.
+- **MCP server**: exposes the same provenance tool surface to external assistants such as Codex, Claude Code, or other MCP clients.
 
-Flowcept introduces the Workflow Card concept: a structured markdown summary of a workflow execution covering:
+The tool surface covers two analysis paths:
 
-- **Summary** — workflow name, IDs, execution window, elapsed time, host, git info
-- **Workflow-level Summary** — activity count, status counts, top slowest activities
-- **Workflow Structure** — ASCII diagram of the activity DAG
-- **Timing Report** — per-activity start, end, and median elapsed times with insights
-- **Per Activity Details** — aggregated inputs (`used`) and outputs (`generated`) per activity
-- **Per-activity Resource Usage** — CPU, memory, disk I/O, network, and GPU deltas (when telemetry is captured)
-- **Object Artifacts Summary** — versioned artifacts produced or consumed by the workflow
+- **Streaming provenance tools** query records directly from the runtime stream. These are best for monitoring and runtime analysis while a workflow is still running.
+- **Persisted provenance tools** query MongoDB or LMDB. These are best for postmortem analysis, dashboards, workflow cards, and live analysis with a small flush delay.
 
-Cards also support **campaign-level reporting** for multi-workflow runs (replicated experiments or multi-stage pipelines):
+The Flowcept Agent itself also uses these tools through its LangChain orchestration layer.
 
-```python
-# From a JSONL buffer file (no DB needed)
-Flowcept.generate_report(input_jsonl_path="flowcept_messages.jsonl")
+Example questions:
 
-# From a live DB query
-Flowcept.generate_report(workflow_id="<id>")
-Flowcept.generate_report(campaign_id="<id>")
+- “Which activity took the longest?”
+- “Show the lineage of the selected model.”
+- “Which input files were larger than 100 MB?”
+- “Generate a workflow card for this campaign.”
+- “Highlight all tasks related to the best model.”
 
-# As PDF
-Flowcept.generate_report(workflow_id="<id>", report_type="provenance_report", format="pdf")
-```
+See the [Flowcept Agent docs](https://flowcept.readthedocs.io/en/latest/agent.html) and [src/flowcept/agents/README.md](src/flowcept/agents/README.md).
 
-See [`docs/reporting.rst`](docs/reporting.rst) and [`src/flowcept/report/README.md`](src/flowcept/report/README.md) for the full reporting reference.
+## Capture Options
 
-## Web UI
+Flowcept supports several capture styles. Use the least invasive one that answers your provenance questions.
 
-Flowcept ships a built-in web interface for browsing and analyzing provenance data. Start it with:
+| Need | Use |
+|---|---|
+| Minimal function-level capture | `@flowcept_task` |
+| Whole workflow context | `with Flowcept():` or `@flowcept` |
+| Custom metadata and manual events | `FlowceptTask` |
+| Loop capture | `FlowceptLoop` |
+| ML model and tensor semantics | PyTorch instrumentation |
+| Tool/framework observability | Dask, MLflow, TensorBoard, MCP, and other adapters |
+| Distributed runtime stream | [Redis](https://redis.io), [RabbitMQ](https://www.rabbitmq.com), [Kafka](https://kafka.apache.org), or [Mofka](https://mofka.readthedocs.io) message queues |
+| Queryable persistent store | MongoDB or LMDB |
 
-```bash
-pip install flowcept[webservice]
-flowcept --start-ui        # starts the webservice + dev server; open http://localhost:8008
-```
-
-Key features:
-- **Provenance browser** — campaigns, workflows, tasks, and artifacts with drill-down views
-- **Live updates** — SSE-based streaming so the task table updates while a workflow runs
-- **Dashboards** — per-workflow and per-campaign chart dashboards (configurable, stored in MongoDB)
-- **Dataflow graph** — W3C PROV-style graph of task inputs/outputs; click any node to inspect its provenance
-- **LLM chat agent** — ask natural-language questions about your provenance data; charts render inline; queries are automatically scoped to the current workflow or campaign
-- **Lineage highlighting** — ask the chat agent to highlight the full provenance lineage (ancestors + descendants) of any task directly in the Dataflow graph
-
-The chat agent queries the **persisted store** (MongoDB) and the **live stream** (via near-real-time DB flushes from the MQ). For sub-second in-flight queries, use the MCP agent instead.
+Read [Provenance Capture Methods](https://flowcept.readthedocs.io/en/latest/prov_capture.html) for examples.
 
-See [`docs/web_ui.rst`](docs/web_ui.rst) and [`ui/README.md`](ui/README.md) for the full reference.
+## Storage And Querying
 
-# Summary: Observability, Instrumentation, MQs, DBs, and Querying
+Flowcept can run fully offline or as an online distributed system.
 
-| Category                           | Supported Options                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                       |
-|------------------------------------|-------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
-| **Data Observability Adapters**    | [MLflow](https://github.com/ORNL/flowcept/blob/main/examples/mlflow_example.py), [Dask](https://github.com/ORNL/flowcept/blob/main/examples/dask_example.py), [TensorBoard](https://github.com/ORNL/flowcept/blob/main/examples/tensorboard_example.py)                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                 |
-| **Instrumentation and Decorators** | - [@flowcept](https://github.com/ORNL/flowcept/blob/main/examples/start_here.py): encapsulate a function (e.g., a main function) as a workflow. <br> - [@flowcept_task](https://github.com/ORNL/flowcept/blob/main/examples/instrumented_simple_example.py): encapsulate a function as a task. <br> - `@telemetry_flowcept_task`: same as `@flowcept_task`, but optimized for telemetry capture. <br> - `@lightweight_flowcept_task`: same as `@flowcept_task`, but very lightweight, optimized for HPC workloads <br> - [Loop](https://github.com/ORNL/flowcept/blob/main/examples/instrumented_loop_example.py) <br> - [PyTorch Model](https://github.com/ORNL/flowcept/blob/main/examples/llm_complex/llm_model.py) <br> - [MCP Agent](https://github.com/ORNL/flowcept/blob/main/examples/agents/aec_agent_mock.py) |
-| **Context Manager**                | `with Flowcept():` <br/> &nbsp;&nbsp;&nbsp;`# Workflow code` <br/><br/>Similar to the `@flowcept` decorator, but more flexible for instrumenting code blocks that aren’t encapsulated in a single function and for workflows with scattered code across multiple files.                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                 |
-| **Custom Task Creation**           | `FlowceptTask(activity_id=<id>, used=<inputs>, generated=<outputs>, ...)` <br/><br/>Use for fully customizable task instrumentation. Publishes directly to the MQ either via context management (`with FlowceptTask(...)`) or by calling `send()`. It needs to have a `Flowcept().start()` first (or within a `with Flowcept()` context). See [example](examples/consumers/ping_pong_example.py).                                                                                                                                                                                                                                                                                                                                                                                                                       |
-| **Message Queues (MQ)**            | - **Disabled** (offline mode: provenance events stay in an in-memory buffer, not accessible to external processes) <br> - [Redis](https://redis.io) → default, lightweight, easy to run anywhere <br> - [Kafka](https://kafka.apache.org) → for distributed, production setups <br> - [Mofka](https://mofka.readthedocs.io) → optimized for HPC runs <br><br> _Setup example:_ [docker compose](https://github.com/ORNL/flowcept/blob/main/deployment/compose.yml)                                                                                                                                                                                                                                                                                                                                                      |
-| **Databases**                      | - **Disabled** → Flowcept runs in ephemeral mode (data only in MQ, no persistence) <br> - **[MongoDB](https://www.mongodb.com)** → default, rich queries and efficient bulk writes <br> - **[LMDB](https://lmdb.readthedocs.io)** → lightweight, file-based, no external service, basic query support                                                                                                                                                                                                                                                                                                                                                     |
-| **Querying and Monitoring**        | - **[Web UI](docs/web_ui.rst)** → browser-based provenance browser with dashboards, live updates, and an embedded LLM chat agent that queries the persisted store and highlights provenance lineage in the Dataflow graph <br> - **[Grafana](deployment/compose-grafana.yml)** → dashboarding via MongoDB connector <br> - **MCP Flowcept Agent** → LLM-based querying of the live MQ stream (Redis/Kafka/Mofka) via external assistants (Claude Code, Codex, etc.) or offline JSONL buffer                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                            | 
-| **Custom Consumer**                | You can implement your own consumer to monitor or query the provenance stream in real time. Useful for custom analytics, monitoring, debugging, or to persist the data in a different data model (e.g., graph) . See [example](examples/consumers/simple_consumer.py).                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                  |
+| Mode | What happens |
+|---|---|
+| Offline JSONL | Provenance is captured locally and can be loaded later. |
+| MQ stream | Runtime records are streamed through [Redis](https://redis.io), [RabbitMQ](https://www.rabbitmq.com), [Kafka](https://kafka.apache.org), or [Mofka](https://mofka.readthedocs.io). |
+| MongoDB | Rich online queries, web UI, dashboards, workflow cards, and agent chat. |
+| LMDB | Lightweight local persistence without an external database service. |
 
+Query surfaces:
 
-## Performance Tuning for Performance Evaluation
+- Python API: `Flowcept.db`
+- CLI: `flowcept --query ...`
+- REST API: `flowcept --start-webservice`
+- Web UI: browser-based exploration and dashboards
+- Flowcept Agent: natural-language provenance querying and reasoning
 
-In the settings.yaml file, many variables may impact interception efficiency. 
-Please be mindful of the following parameters:
+Read [Provenance Querying](https://flowcept.readthedocs.io/en/latest/prov_query.html), [Provenance Storage](https://flowcept.readthedocs.io/en/latest/prov_storage.html), and the [REST API docs](https://flowcept.readthedocs.io/en/latest/rest_api.html).
 
-* `mq`
-    - `buffer_size` and `insertion_buffer_time_secs`. -- `buffer_size: 1` is really bad for performance, but it will give the most up-to-date info possible to the MQ.
-    
-* `log`
-    - set both stream and files to disable
-
-* `telemetry_capture` 
-  The more things you enable, the more overhead you'll get. For GPU, you can turn on/off specific metrics.
+## Workflow Cards
 
-* `instrumentation`
-  This will configure whether every single granular step in the model training process will be captured. Disable very granular model inspection and try to use more lightweight methods. There are commented instructions in the settings.yaml sample file.
+Flowcept generates workflow cards: structured run summaries for reproducibility, review, and communication.
+Cards include workflow metadata, execution status, activity summaries, resource usage, artifacts, and lineage structure.
 
-Other thing to consider:
+```python
+from flowcept import Flowcept
 
-```
-project:
-  replace_non_json_serializable: false # Here it will assume that all captured data are JSON serializable
-  db_flush_mode: offline               # This disables the feature of runtime analysis in the database.
-mq:
-  chunk_size: -1                       # This disables chunking the messages to be sent to the MQ. Use this only if the main memory of the compute notes is large enough.
+Flowcept.generate_report(workflow_id="<workflow-id>")
+Flowcept.generate_report(campaign_id="<campaign-id>")
+Flowcept.generate_report(workflow_id="<workflow-id>", format="pdf")
 ```
 
-Other variables depending on the adapter may impact too. For instance, in Dask, timestamp creation by workers add interception overhead. As we evolve the software, other variables that impact overhead appear and we might not stated them in this README file yet. If you are doing extensive performance evaluation experiments using this software, please reach out to us (e.g., create an issue in the repository) for hints on how to reduce the overhead of our software.
+The Markdown workflow cards follow the upstream
+[Workflow Provenance Card template](https://github.com/data-cards/workflow-provenance-card).
 
-## Install AMD GPU Lib
+Read the [Reporting docs](https://flowcept.readthedocs.io/en/latest/reporting.html).
 
-Only needed for AMD GPU telemetry capture. NVIDIA users use `flowcept[nvidia]` instead.
+## Installation
+
+Install only what you need.
 
-**Quick install:**
 ```bash
-pip install flowcept[amd]
+pip install flowcept                  # minimal package
+pip install "flowcept[mongo]"         # MongoDB support
+pip install "flowcept[webservice]"    # REST API and web UI
+pip install "flowcept[dask]"          # Dask adapter
+pip install "flowcept[mlflow]"        # MLflow adapter
+pip install "flowcept[rabbitmq]"      # RabbitMQ MQ
+pip install "flowcept[kafka]"         # Kafka MQ
+pip install "flowcept[telemetry]"     # CPU/memory telemetry
+pip install "flowcept[lmdb]"          # LMDB storage
+pip install "flowcept[llm_agent]"     # Flowcept Agent / MCP / chat dependencies
 ```
 
-This installs the latest `amdsmi` from PyPI. The `amdsmi` Python package is a thin wrapper around the system's `libamd_smi.so`, so the PyPI version must match your ROCm installation. If you get a runtime error like `undefined symbol` or `libamd_smi.so not found`, follow the steps below.
+`flowcept[all]` exists for development and broad testing, but it is usually better to install targeted extras.
 
-**Matching the version to your ROCm:**
+Read [Setup and Installation](https://flowcept.readthedocs.io/en/latest/setup.html).
 
-1. Find your ROCm version:
-   ```bash
-   ls /opt/rocm-*   # e.g. /opt/rocm-6.2.4
-   # or: rocm-smi --version
-   ```
+## Settings
 
-2. Find the matching `amdsmi` PyPI version — the major/minor version tracks ROCm (e.g. ROCm 6.2.x → `amdsmi==6.2.*`, ROCm 7.0.x → `amdsmi==7.0.*`):
-   ```bash
-   pip index versions amdsmi   # lists all available versions
-   pip install amdsmi==<X.Y.Z>
-   ```
+Flowcept is configured through `settings.yaml`, with environment variables taking precedence.
 
-3. Set `LD_LIBRARY_PATH` so Python finds the correct shared library:
-   ```bash
-   export LD_LIBRARY_PATH=/opt/rocm-<X.Y.Z>/lib:$LD_LIBRARY_PATH
-   ```
-   Add this to your job script or shell profile so it persists.
-
-**Verify:**
 ```bash
-python -c "from amdsmi import amdsmi_init, amdsmi_get_processor_handles; amdsmi_init(); print(len(amdsmi_get_processor_handles()), 'GPU(s) found')"
+flowcept --init-settings -y              # minimal settings
+flowcept --init-settings --full -y       # full template
+flowcept --config-profile full-online -y # online MQ + DB profile
 ```
 
-## Torch Dependencies
+Configuration precedence:
 
-Some unit tests utilize `torch==2.2.2`, `torchtext=0.17.2`, and `torchvision==0.17.2`. They are only really needed to run some tests and will be installed if you run `pip install flowcept[ml_dev]` or `pip install flowcept[all]`. If you want to use Flowcept with Torch, please adapt torch dependencies according to your project's dependencies.
+1. Environment variables.
+2. `FLOWCEPT_SETTINGS_PATH`.
+3. `~/.flowcept/settings.yaml`.
+4. Built-in defaults.
 
-## Documentation
+Read the [CLI Reference](https://flowcept.readthedocs.io/en/latest/cli-reference.html).
 
-Full documentation is available on [Read the Docs](https://flowcept.readthedocs.io/).
+## Examples And Notebooks
 
-## Cite us
+- [examples](examples): runnable scripts for decorators, Dask, MLflow, TensorBoard, PyTorch, agents, consumers, and object storage.
+- [notebooks](notebooks): exploratory examples and tutorials.
+- [Default User Guide](https://flowcept.readthedocs.io/en/latest/default_user_guide.html): recommended end-to-end guide.
 
-If you used Flowcept in your research, consider citing our paper.
+## For Code Assistants
 
-```
-Towards Lightweight Data Integration using Multi-workflow Provenance and Data Observability
-R. Souza, T. Skluzacek, S. Wilkinson, M. Ziatdinov, and R. da Silva
-19th IEEE International Conference on e-Science, 2023.
-```
+Code assistants should read [AGENTS.md](AGENTS.md) first.
+It is the single source of truth for repository-specific engineering rules.
+
+For Flowcept feature usage, read the maintained RST docs under [docs](docs) instead of inventing behavior from source snippets.
 
-**Bibtex:**
+## Cite Flowcept
 
-```latex
-@inproceedings{souza2023towards,  
+If you use Flowcept in research, please cite:
+
+```bibtex
+@inproceedings{souza2023towards,
   author = {Souza, Renan and Skluzacek, Tyler J and Wilkinson, Sean R and Ziatdinov, Maxim and da Silva, Rafael Ferreira},
   booktitle = {IEEE International Conference on e-Science},
   doi = {10.1109/e-Science58273.2023.10254822},
@@ -575,13 +296,19 @@ R. Souza, T. Skluzacek, S. Wilkinson, M. Ziatdinov, and R. da Silva
 }
 ```
 
-## Disclaimer & Get in Touch
+More publications are listed in the [Flowcept publications page](https://flowcept.readthedocs.io/en/latest/publications.html).
+
+## Community And Contributing
 
-Refer to [Contributing](CONTRIBUTING.md) for adding new adapters or contributing with the codebase.
+Flowcept is research software developed for distributed scientific workflows.
+Issues, discussions, examples, adapters, and documentation improvements are welcome.
 
-Please note that this a research software. We encourage you to give it a try and use it with your own stack.
-We are continuously working on improving documentation and adding more examples and notebooks, but we are continuously improving documentation and examples. If you are interested in working with Flowcept in your own scientific project, we can give you a jump start if you reach out to us. Feel free to [create an issue](https://github.com/ORNL/flowcept/issues/new), [create a new discussion thread](https://github.com/ORNL/flowcept/discussions/new/choose) or drop us an email (we trust you'll find a way to reach out to us :wink:).
+- [Contributing guide](CONTRIBUTING.md)
+- [GitHub issues](https://github.com/ORNL/flowcept/issues/new)
+- [GitHub discussions](https://github.com/ORNL/flowcept/discussions/new/choose)
+- [Slack channel](https://workflowscommunity.slack.com/archives/C06L5GYJKQS)
 
 ## Acknowledgement
 
-This research uses resources of the Oak Ridge Leadership Computing Facility at the Oak Ridge National Laboratory, which is supported by the Office of Science of the U.S. Department of Energy under Contract No. DE-AC05-00OR22725.
+This research uses resources of the Oak Ridge Leadership Computing Facility at Oak Ridge National Laboratory,
+which is supported by the Office of Science of the U.S. Department of Energy under Contract No. DE-AC05-00OR22725.
diff --git a/deployment/compose-rabbitmq.yml b/deployment/compose-rabbitmq.yml
new file mode 100644
index 00000000..b8478366
--- /dev/null
+++ b/deployment/compose-rabbitmq.yml
@@ -0,0 +1,33 @@
+name: flowcept
+services:
+  flowcept_redis:
+    container_name: flowcept_redis
+    image: redis
+    ports:
+      - 6379:6379
+
+  flowcept_mongo:
+    container_name: flowcept_mongo
+    image: mongo:latest
+    ports:
+      - 27017:27017
+    volumes:
+      - mongo_data:/data/db
+
+  # RabbitMQ broker; reachable on 5672 (AMQP) and 15672 (management UI)
+  flowcept_rabbitmq:
+    container_name: flowcept_rabbitmq
+    image: rabbitmq:3-management
+    ports:
+      - "5672:5672"
+      - "15672:15672"
+    environment:
+      RABBITMQ_DEFAULT_USER: guest
+      RABBITMQ_DEFAULT_PASS: guest
+
+networks:
+  flowcept:
+    driver: bridge
+
+volumes:
+  mongo_data:
diff --git a/docs/README.md b/docs/README.md
index 2134916c..40b99e08 100644
--- a/docs/README.md
+++ b/docs/README.md
@@ -445,7 +445,7 @@ agent:
 
 #### Internal-LLM mode
 
-Flowcept builds the model using `build_llm_model()` (`src/flowcept/agents/agents_utils.py`).
+Flowcept builds the model using `build_llm_model()` (`src/flowcept/agents/llm/builders.py`).
 
 Providers in code:
 
diff --git a/docs/agent.rst b/docs/agent.rst
index 6d211566..cd6bb894 100644
--- a/docs/agent.rst
+++ b/docs/agent.rst
@@ -27,35 +27,22 @@ Flowcept exposes provenance data to LLM-based agents through two complementary s
    workflow is still executing. It also supports offline JSONL buffer files.
 
 The two surfaces share the same underlying provenance tool core
-(``src/flowcept/agents/tools/prov_tools.py``) so queries stay consistent across both.
+(``src/flowcept/agents/data_query_tools/db_query_tools.py``) so queries stay consistent across both.
 
-The MCP agent has one backend and two orchestration paths:
-
-- **Internal LLM mode**: Flowcept builds the configured LLM and routes free-text messages through ``prompt_handler``.
-- **External LLM mode**: your outside assistant, such as Codex, Claude, LibreChat, Cursor, or another MCP client,
-  owns routing and reasoning, while Flowcept provides the same MCP prompts, tools, and in-memory context.
-
-The modes are intended to expose the same functionality. The difference is only who orchestrates the tools.
+The MCP agent exposes explicit tools only. The outside assistant, such as Codex,
+Claude, LibreChat, Cursor, or another MCP client, owns routing and reasoning,
+while Flowcept provides the MCP prompts, tools, and in-memory context.
 
 Configuring LLM orchestration
 -----------------------------
 
-Internal mode:
-
-.. code-block:: yaml
-
-   agent:
-     external_llm: false
-
-External mode:
-
 .. code-block:: yaml
 
    agent:
      external_llm: true
 
-In external mode, arbitrary free-text messages sent to ``prompt_handler`` are not internally routed. Use explicit
-commands, prompt-builder calls, and execution-tool calls from the outside assistant.
+When ``agent.external_llm`` is enabled, use explicit commands, prompt-builder
+calls, and execution-tool calls from the outside assistant.
 
 Shared commands and prefixes
 ----------------------------
@@ -101,16 +88,16 @@ The agent resolves the matching task(s) via a Mongo-style filter, then the Dataf
 tab dims all unrelated nodes and edges, tracing only the ancestor/descendant chain.
 Click any node or empty space to reset the highlight manually.
 
-Internal prompt-handler example
--------------------------------
+Explicit MCP tool example
+-------------------------
 
 .. code-block:: python
 
-   from flowcept.agents.agent_client import run_tool
+   from flowcept.agents.mcp.mcp_client import run_tool
 
    result = run_tool(
-       "prompt_handler",
-       kwargs={"message": "What are the top 5 slowest activities?"},
+       "run_workflow_query",
+       kwargs={"query": "What is the workflow name?"},
    )
 
 External prompt plus execution example
@@ -118,7 +105,7 @@ External prompt plus execution example
 
 .. code-block:: python
 
-   from flowcept.agents.agent_client import run_prompt, run_tool
+   from flowcept.agents.mcp.mcp_client import run_prompt, run_tool
 
    prompt = run_prompt(
        "build_df_query_prompt",
@@ -143,7 +130,7 @@ External workflow-message query example
 
 .. code-block:: python
 
-   from flowcept.agents.agent_client import run_prompt, run_tool
+   from flowcept.agents.mcp.mcp_client import run_prompt, run_tool
 
    prompt = run_prompt(
        "build_workflow_query_prompt",
@@ -170,7 +157,8 @@ This is a minimal offline example:
 
    import json
    from flowcept import Flowcept, flowcept_task
-   from flowcept.agents.flowcept_agent import FlowceptAgent
+   from flowcept.agents.mcp.mcp_client import run_tool
+   from flowcept.agents.mcp.mcp_server import FlowceptMCPServer
 
    @flowcept_task
    def sum_one(x):
@@ -182,10 +170,10 @@ This is a minimal offline example:
        f.dump_buffer("flowcept_buffer.jsonl")
 
    # Start the agent from the buffer file and query it
-   agent = FlowceptAgent(buffer_path="flowcept_buffer.jsonl")
+   agent = FlowceptMCPServer(buffer_path="flowcept_buffer.jsonl")
    # Or load a list of messages directly
-   # agent = FlowceptAgent(buffer_messages=msgs)
+   # agent = FlowceptMCPServer(buffer_messages=msgs)
    agent.start()
-   resp = agent.query("how many tasks?")
+   resp = run_tool("run_df_query", kwargs={"query": "how many tasks?"})[0]
    print(json.loads(resp))
    agent.stop()
diff --git a/docs/architecture.rst b/docs/architecture.rst
index b2a2341f..3e273db4 100644
--- a/docs/architecture.rst
+++ b/docs/architecture.rst
@@ -40,8 +40,9 @@ To minimize interference with HPC applications, provenance messages are buffered
 and streamed asynchronously to a **publish–subscribe hub**.  
 Flowcept supports configurable flushing strategies and multiple broker backends:
 
-- **Redis** → low-latency messaging, minimal setup, default for most use cases.  
-- **Kafka** → high throughput for data-intensive workflows.  
+- **Redis** → low-latency messaging, minimal setup, default for most use cases.
+- **RabbitMQ** → AMQP-based broker, suitable for cloud and enterprise environments.
+- **Kafka** → high throughput for data-intensive workflows.
 - **Mofka** → RDMA-optimized transport, ideal for tightly coupled HPC networks.
 
 Regardless of the broker, all provenance messages follow a **common schema**.
diff --git a/docs/index.rst b/docs/index.rst
index b3029887..b0ec9be0 100644
--- a/docs/index.rst
+++ b/docs/index.rst
@@ -77,3 +77,4 @@ Flowcept
    contributing
    cli-reference
    api-reference
+   publications
diff --git a/docs/openapi/flowcept-openapi.json b/docs/openapi/flowcept-openapi.json
index f164a8db..c665e52c 100644
--- a/docs/openapi/flowcept-openapi.json
+++ b/docs/openapi/flowcept-openapi.json
@@ -12,7 +12,7 @@
           "health"
         ],
         "summary": "Live",
-        "description": "Liveness check.",
+        "description": "Liveness check \u2014 process is running.",
         "operationId": "live_api_v1_health_live_get",
         "responses": {
           "200": {
@@ -36,18 +36,14 @@
           "health"
         ],
         "summary": "Ready",
-        "description": "Readiness check.",
+        "description": "Readiness check \u2014 verifies all enabled services via ``Flowcept.services_alive()``.\n\nWhich services are checked is driven by settings.yaml (MQ, KVDB, MongoDB, LMDB, LLM).\nReturns HTTP 200 when all enabled services are reachable, HTTP 503 otherwise.\nThe response body includes per-service status so callers can identify which\nservice is down without reading server logs.",
         "operationId": "ready_api_v1_health_ready_get",
         "responses": {
           "200": {
             "description": "Successful Response",
             "content": {
               "application/json": {
-                "schema": {
-                  "additionalProperties": true,
-                  "type": "object",
-                  "title": "Response Ready Api V1 Health Ready Get"
-                }
+                "schema": {}
               }
             }
           }
@@ -656,6 +652,117 @@
         }
       }
     },
+    "/api/v1/workflows/{workflow_id}/node_positions": {
+      "get": {
+        "tags": [
+          "workflows"
+        ],
+        "summary": "Get Node Positions",
+        "description": "Get node positions for a workflow graph type.",
+        "operationId": "get_node_positions_api_v1_workflows__workflow_id__node_positions_get",
+        "parameters": [
+          {
+            "name": "workflow_id",
+            "in": "path",
+            "required": true,
+            "schema": {
+              "type": "string",
+              "title": "Workflow Id"
+            }
+          },
+          {
+            "name": "graph_type",
+            "in": "query",
+            "required": true,
+            "schema": {
+              "type": "string",
+              "description": "Graph type: 'dataflow', 'task', or 'activity'",
+              "title": "Graph Type"
+            },
+            "description": "Graph type: 'dataflow', 'task', or 'activity'"
+          }
+        ],
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": {
+              "application/json": {
+                "schema": {
+                  "type": "object",
+                  "additionalProperties": true,
+                  "title": "Response Get Node Positions Api V1 Workflows  Workflow Id  Node Positions Get"
+                }
+              }
+            }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            }
+          }
+        }
+      },
+      "post": {
+        "tags": [
+          "workflows"
+        ],
+        "summary": "Save Node Positions",
+        "description": "Save node positions for a workflow graph type.",
+        "operationId": "save_node_positions_api_v1_workflows__workflow_id__node_positions_post",
+        "parameters": [
+          {
+            "name": "workflow_id",
+            "in": "path",
+            "required": true,
+            "schema": {
+              "type": "string",
+              "title": "Workflow Id"
+            }
+          }
+        ],
+        "requestBody": {
+          "required": true,
+          "content": {
+            "application/json": {
+              "schema": {
+                "type": "object",
+                "additionalProperties": true,
+                "title": "Payload"
+              }
+            }
+          }
+        },
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": {
+              "application/json": {
+                "schema": {
+                  "type": "object",
+                  "additionalProperties": true,
+                  "title": "Response Save Node Positions Api V1 Workflows  Workflow Id  Node Positions Post"
+                }
+              }
+            }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            }
+          }
+        }
+      }
+    },
     "/api/v1/tasks": {
       "get": {
         "tags": [
@@ -1129,6 +1236,49 @@
             }
           }
         }
+      },
+      "delete": {
+        "tags": [
+          "objects"
+        ],
+        "summary": "Delete Object",
+        "description": "Delete an object and all its versions by object_id.",
+        "operationId": "delete_object_api_v1_objects__object_id__delete",
+        "parameters": [
+          {
+            "name": "object_id",
+            "in": "path",
+            "required": true,
+            "schema": {
+              "type": "string",
+              "title": "Object Id"
+            }
+          }
+        ],
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": {
+              "application/json": {
+                "schema": {
+                  "type": "object",
+                  "additionalProperties": true,
+                  "title": "Response Delete Object Api V1 Objects  Object Id  Delete"
+                }
+              }
+            }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            }
+          }
+        }
       }
     },
     "/api/v1/objects/{object_id}/versions/{version}": {
@@ -2253,6 +2403,30 @@
         }
       }
     },
+    "/api/v1/agents/cleanup/empty": {
+      "delete": {
+        "tags": [
+          "agents"
+        ],
+        "summary": "Delete Empty Agents",
+        "description": "Delete all agents from the database that don't have associated task_id.",
+        "operationId": "delete_empty_agents_api_v1_agents_cleanup_empty_delete",
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": {
+              "application/json": {
+                "schema": {
+                  "additionalProperties": true,
+                  "type": "object",
+                  "title": "Response Delete Empty Agents Api V1 Agents Cleanup Empty Delete"
+                }
+              }
+            }
+          }
+        }
+      }
+    },
     "/api/v1/stats/tasks/summary": {
       "get": {
         "tags": [
@@ -3065,7 +3239,8 @@
             "enum": [
               "tasks",
               "workflows",
-              "objects"
+              "objects",
+              "collection_sizes"
             ],
             "title": "Source",
             "default": "tasks"
@@ -3129,7 +3304,7 @@
             "anyOf": [
               {
                 "items": {
-                  "$ref": "#/components/schemas/SortSpec"
+                  "$ref": "#/components/schemas/flowcept__webservice__schemas__dashboards__SortSpec"
                 },
                 "type": "array"
               },
@@ -3226,6 +3401,17 @@
             "type": "boolean",
             "title": "Allow Dashboard Edit",
             "default": false
+          },
+          "thread_id": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Thread Id"
           }
         },
         "type": "object",
@@ -3542,7 +3728,7 @@
             "anyOf": [
               {
                 "items": {
-                  "$ref": "#/components/schemas/SortSpec"
+                  "$ref": "#/components/schemas/flowcept__webservice__schemas__common__SortSpec"
                 },
                 "type": "array"
               },
@@ -3613,7 +3799,7 @@
             "anyOf": [
               {
                 "items": {
-                  "$ref": "#/components/schemas/SortSpec"
+                  "$ref": "#/components/schemas/flowcept__webservice__schemas__common__SortSpec"
                 },
                 "type": "array"
               },
@@ -3647,30 +3833,6 @@
         "title": "QueryRequest",
         "description": "Read-only query payload."
       },
-      "SortSpec": {
-        "properties": {
-          "field": {
-            "type": "string",
-            "minLength": 1,
-            "title": "Field"
-          },
-          "order": {
-            "type": "integer",
-            "enum": [
-              1,
-              -1
-            ],
-            "title": "Order",
-            "default": 1
-          }
-        },
-        "type": "object",
-        "required": [
-          "field"
-        ],
-        "title": "SortSpec",
-        "description": "Sort field/order pair."
-      },
       "TimeseriesRequest": {
         "properties": {
           "filter": {
@@ -3762,6 +3924,53 @@
         "type": "object",
         "title": "VizSpec",
         "description": "How a chart renders its rows."
+      },
+      "flowcept__webservice__schemas__common__SortSpec": {
+        "properties": {
+          "field": {
+            "type": "string",
+            "minLength": 1,
+            "title": "Field"
+          },
+          "order": {
+            "type": "integer",
+            "enum": [
+              1,
+              -1
+            ],
+            "title": "Order",
+            "default": 1
+          }
+        },
+        "type": "object",
+        "required": [
+          "field"
+        ],
+        "title": "SortSpec",
+        "description": "Sort field/order pair."
+      },
+      "flowcept__webservice__schemas__dashboards__SortSpec": {
+        "properties": {
+          "field": {
+            "type": "string",
+            "title": "Field"
+          },
+          "order": {
+            "type": "integer",
+            "enum": [
+              1,
+              -1
+            ],
+            "title": "Order",
+            "default": 1
+          }
+        },
+        "type": "object",
+        "required": [
+          "field"
+        ],
+        "title": "SortSpec",
+        "description": "Sort field/order pair for chart data queries."
       }
     }
   }
diff --git a/docs/openapi/flowcept-openapi.yaml b/docs/openapi/flowcept-openapi.yaml
index 5b7c83af..07c0d552 100644
--- a/docs/openapi/flowcept-openapi.yaml
+++ b/docs/openapi/flowcept-openapi.yaml
@@ -10,7 +10,7 @@ paths:
       tags:
       - health
       summary: Live
-      description: Liveness check.
+      description: "Liveness check \u2014 process is running."
       operationId: live_api_v1_health_live_get
       responses:
         '200':
@@ -26,17 +26,18 @@ paths:
       tags:
       - health
       summary: Ready
-      description: Readiness check.
+      description: "Readiness check \u2014 verifies all enabled services via ``Flowcept.services_alive()``.\n\
+        \nWhich services are checked is driven by settings.yaml (MQ, KVDB, MongoDB,\
+        \ LMDB, LLM).\nReturns HTTP 200 when all enabled services are reachable, HTTP\
+        \ 503 otherwise.\nThe response body includes per-service status so callers\
+        \ can identify which\nservice is down without reading server logs."
       operationId: ready_api_v1_health_ready_get
       responses:
         '200':
           description: Successful Response
           content:
             application/json:
-              schema:
-                additionalProperties: true
-                type: object
-                title: Response Ready Api V1 Health Ready Get
+              schema: {}
   /api/v1/info:
     get:
       tags:
@@ -417,6 +418,81 @@ paths:
             application/json:
               schema:
                 $ref: '#/components/schemas/HTTPValidationError'
+  /api/v1/workflows/{workflow_id}/node_positions:
+    get:
+      tags:
+      - workflows
+      summary: Get Node Positions
+      description: Get node positions for a workflow graph type.
+      operationId: get_node_positions_api_v1_workflows__workflow_id__node_positions_get
+      parameters:
+      - name: workflow_id
+        in: path
+        required: true
+        schema:
+          type: string
+          title: Workflow Id
+      - name: graph_type
+        in: query
+        required: true
+        schema:
+          type: string
+          description: 'Graph type: ''dataflow'', ''task'', or ''activity'''
+          title: Graph Type
+        description: 'Graph type: ''dataflow'', ''task'', or ''activity'''
+      responses:
+        '200':
+          description: Successful Response
+          content:
+            application/json:
+              schema:
+                type: object
+                additionalProperties: true
+                title: Response Get Node Positions Api V1 Workflows  Workflow Id  Node
+                  Positions Get
+        '422':
+          description: Validation Error
+          content:
+            application/json:
+              schema:
+                $ref: '#/components/schemas/HTTPValidationError'
+    post:
+      tags:
+      - workflows
+      summary: Save Node Positions
+      description: Save node positions for a workflow graph type.
+      operationId: save_node_positions_api_v1_workflows__workflow_id__node_positions_post
+      parameters:
+      - name: workflow_id
+        in: path
+        required: true
+        schema:
+          type: string
+          title: Workflow Id
+      requestBody:
+        required: true
+        content:
+          application/json:
+            schema:
+              type: object
+              additionalProperties: true
+              title: Payload
+      responses:
+        '200':
+          description: Successful Response
+          content:
+            application/json:
+              schema:
+                type: object
+                additionalProperties: true
+                title: Response Save Node Positions Api V1 Workflows  Workflow Id  Node
+                  Positions Post
+        '422':
+          description: Validation Error
+          content:
+            application/json:
+              schema:
+                $ref: '#/components/schemas/HTTPValidationError'
   /api/v1/tasks:
     get:
       tags:
@@ -699,6 +775,34 @@ paths:
             application/json:
               schema:
                 $ref: '#/components/schemas/HTTPValidationError'
+    delete:
+      tags:
+      - objects
+      summary: Delete Object
+      description: Delete an object and all its versions by object_id.
+      operationId: delete_object_api_v1_objects__object_id__delete
+      parameters:
+      - name: object_id
+        in: path
+        required: true
+        schema:
+          type: string
+          title: Object Id
+      responses:
+        '200':
+          description: Successful Response
+          content:
+            application/json:
+              schema:
+                type: object
+                additionalProperties: true
+                title: Response Delete Object Api V1 Objects  Object Id  Delete
+        '422':
+          description: Validation Error
+          content:
+            application/json:
+              schema:
+                $ref: '#/components/schemas/HTTPValidationError'
   /api/v1/objects/{object_id}/versions/{version}:
     get:
       tags:
@@ -1394,6 +1498,23 @@ paths:
             application/json:
               schema:
                 $ref: '#/components/schemas/HTTPValidationError'
+  /api/v1/agents/cleanup/empty:
+    delete:
+      tags:
+      - agents
+      summary: Delete Empty Agents
+      description: Delete all agents from the database that don't have associated
+        task_id.
+      operationId: delete_empty_agents_api_v1_agents_cleanup_empty_delete
+      responses:
+        '200':
+          description: Successful Response
+          content:
+            application/json:
+              schema:
+                additionalProperties: true
+                type: object
+                title: Response Delete Empty Agents Api V1 Agents Cleanup Empty Delete
   /api/v1/stats/tasks/summary:
     get:
       tags:
@@ -1915,6 +2036,7 @@ components:
           - tasks
           - workflows
           - objects
+          - collection_sizes
           title: Source
           default: tasks
         filter:
@@ -1948,7 +2070,7 @@ components:
         sort:
           anyOf:
           - items:
-              $ref: '#/components/schemas/SortSpec'
+              $ref: '#/components/schemas/flowcept__webservice__schemas__dashboards__SortSpec'
             type: array
           - type: 'null'
           title: Sort
@@ -2013,6 +2135,11 @@ components:
           type: boolean
           title: Allow Dashboard Edit
           default: false
+        thread_id:
+          anyOf:
+          - type: string
+          - type: 'null'
+          title: Thread Id
       type: object
       required:
       - messages
@@ -2227,7 +2354,7 @@ components:
         sort:
           anyOf:
           - items:
-              $ref: '#/components/schemas/SortSpec'
+              $ref: '#/components/schemas/flowcept__webservice__schemas__common__SortSpec'
             type: array
           - type: 'null'
           title: Sort
@@ -2271,7 +2398,7 @@ components:
         sort:
           anyOf:
           - items:
-              $ref: '#/components/schemas/SortSpec'
+              $ref: '#/components/schemas/flowcept__webservice__schemas__common__SortSpec'
             type: array
           - type: 'null'
           title: Sort
@@ -2289,24 +2416,6 @@ components:
       type: object
       title: QueryRequest
       description: Read-only query payload.
-    SortSpec:
-      properties:
-        field:
-          type: string
-          minLength: 1
-          title: Field
-        order:
-          type: integer
-          enum:
-          - 1
-          - -1
-          title: Order
-          default: 1
-      type: object
-      required:
-      - field
-      title: SortSpec
-      description: Sort field/order pair.
     TimeseriesRequest:
       properties:
         filter:
@@ -2374,3 +2483,38 @@ components:
       type: object
       title: VizSpec
       description: How a chart renders its rows.
+    flowcept__webservice__schemas__common__SortSpec:
+      properties:
+        field:
+          type: string
+          minLength: 1
+          title: Field
+        order:
+          type: integer
+          enum:
+          - 1
+          - -1
+          title: Order
+          default: 1
+      type: object
+      required:
+      - field
+      title: SortSpec
+      description: Sort field/order pair.
+    flowcept__webservice__schemas__dashboards__SortSpec:
+      properties:
+        field:
+          type: string
+          title: Field
+        order:
+          type: integer
+          enum:
+          - 1
+          - -1
+          title: Order
+          default: 1
+      type: object
+      required:
+      - field
+      title: SortSpec
+      description: Sort field/order pair for chart data queries.
diff --git a/docs/publications.rst b/docs/publications.rst
new file mode 100644
index 00000000..60f6c81e
--- /dev/null
+++ b/docs/publications.rst
@@ -0,0 +1,155 @@
+Publications
+============
+
+Flowcept Papers
+---------------
+
+**Towards Lightweight Data Integration using Multi-workflow Provenance and Data Observability**
+
+R. Souza, T. J. Skluzacek, S. R. Wilkinson, M. Ziatdinov, and R. Ferreira da Silva.
+*IEEE International Conference on e-Science*, Limassol, Cyprus, 2023.
+
+Introduces Flowcept's lightweight runtime provenance and data observability architecture and
+shows minimal-intrusion capture across heterogeneous workflows.
+
+Links:
+`doi <https://doi.org/10.1109/e-Science58273.2023.10254822>`__ |
+`pdf <https://arxiv.org/pdf/2308.09004.pdf>`__
+
+
+**PROV-AGENT: Unified Provenance for Tracking AI Agent Interactions in Agentic Workflows**
+
+R. Souza, A. Gueroudji, S. DeWitt, D. Rosendo, T. Ghosal, R. Ross,
+P. Balaprakash, and R. Ferreira da Silva.
+*IEEE International Conference on e-Science*, Chicago, USA, 2025.
+
+Defines agentic provenance and a unified provenance model and tooling to capture,
+link, and query AI-agent interactions within agentic workflows.
+
+Links:
+`doi <https://doi.org/10.1109/eScience65000.2025.00093>`__ |
+`pdf <https://arxiv.org/pdf/2508.02866>`__ |
+`html <https://arxiv.org/html/2508.02866v3>`__
+
+
+**Workflow Provenance in the Computing Continuum for Responsible, Trustworthy, and Energy-Efficient AI**
+
+R. Souza, S. Caino-Lores, M. Coletti, T. J. Skluzacek, A. Costan,
+F. Suter, M. Mattoso, and R. Ferreira da Silva.
+*IEEE International Conference on e-Science*, Osaka, Japan, 2024.
+
+Explains how end-to-end provenance across edge, cloud, and HPC supports responsible,
+trustworthy, and energy-aware AI workflows.
+
+Links:
+`doi <https://doi.org/10.1109/e-Science62913.2024.10678731>`__ |
+`pdf <https://hal.science/hal-04902079v1/document>`__
+
+
+**LLM Agents for Interactive Workflow Provenance: Reference Architecture and Evaluation Methodology**
+
+R. Souza, T. Poteet, B. Etz, D. Rosendo, A. Gueroudji, W. Shin,
+P. Balaprakash, and R. Ferreira da Silva.
+*Workflows in Support of Large-Scale Science (WORKS), co-located with SC*,
+St. Louis, USA, 2025.
+
+Presents a reference architecture and evaluation method for LLM agents that query
+and act on large-scale provenance databases.
+
+Links:
+`doi <https://doi.org/10.1145/3731599.3767582>`__ |
+`pdf <https://arxiv.org/pdf/2509.13978>`__ |
+`html <https://arxiv.org/html/2509.13978>`__
+
+
+Papers That Used Flowcept
+-------------------------
+
+**Toward a Persistent Event-Streaming System for High-Performance Computing Applications**
+
+M. Dorier, A. Gueroudji, V. Hayot-Sasson, H. Nguyen, S. Ockerman,
+R. Souza, T. Bicer, H. Pan, P. Carns, K. Chard, and others.
+*Frontiers in High Performance Computing*, 2025.
+
+Demonstrates Flowcept generating high-volume provenance that is persistently
+streamed with Mofka for HPC applications.
+
+Links:
+`doi <https://doi.org/10.3389/fhpcp.2025.1638203>`__ |
+`pdf <https://web.cels.anl.gov/~woz/papers/Mofka_2025.pdf>`__ |
+`html <https://www.frontiersin.org/journals/high-performance-computing/articles/10.3389/fhpcp.2025.1638203/full>`__
+
+
+**AI Agents for Enabling Autonomous Experiments at ORNL's HPC and Manufacturing User Facilities**
+
+D. Rosendo, S. DeWitt, R. Souza, P. Austria, T. Ghosal, M. McDonnell,
+R. Miller, T. Skluzacek, J. Haley, B. Turcksin, and others.
+*Extreme-Scale Experiment-in-the-Loop Computing (XLOOP), co-located with SC*,
+2025.
+
+Leverages Flowcept's agentic provenance to coordinate multi-agent experiments
+and connect agents with HPC simulations through a shared provenance stream.
+
+Links:
+`doi <https://doi.org/10.1145/3731599.3767592>`__ |
+`pdf <https://rafaelsilva.com/files/publications/rosendo2025xloop.pdf>`__ |
+`html <https://camps.aptaracorp.com/ACM_PMS/PMS/ACM/SCWORKSHOPS25/253/0b09762d-8e84-11f0-957d-16ffd757ba29/OUT/scworkshops25-253.html>`__
+
+
+BibTeX
+------
+
+.. code-block:: bibtex
+
+   @inproceedings{souza2023towards,
+     title={Towards Lightweight Data Integration using Multi-workflow Provenance and Data Observability},
+     author={Souza, Renan and Skluzacek, Tyler J and Wilkinson, Sean R and Ziatdinov, Maxim and da Silva, Rafael Ferreira},
+     booktitle={IEEE International Conference on e-Science},
+     doi={10.1109/e-Science58273.2023.10254822},
+     url={https://doi.org/10.1109/e-Science58273.2023.10254822},
+     pdf={https://arxiv.org/pdf/2308.09004.pdf},
+     year={2023}
+   }
+
+   @inproceedings{souza_prov_agent_2025,
+     author={Renan Souza and Amal Gueroudji and Stephen DeWitt and Daniel Rosendo and Tirthankar Ghosal and Robert Ross and Prasanna Balaprakash and Rafael Ferreira da Silva},
+     title={PROV-AGENT: Unified Provenance for Tracking {AI} Agent Interactions in Agentic Workflows},
+     booktitle={IEEE International Conference on e-Science},
+     year={2025},
+     doi={10.1109/eScience65000.2025.00093},
+     pdf={https://arxiv.org/pdf/2508.02866}
+   }
+
+   @inproceedings{souza_rtai_2024,
+     author={Renan Souza and Silvina Caino-Lores and Mark Coletti and Tyler J. Skluzacek and Alexandru Costan and Frederic Suter and Marta Mattoso and Rafael Ferreira da Silva},
+     title={Workflow Provenance in the Computing Continuum for Responsible, Trustworthy, and Energy-Efficient {AI}},
+     booktitle={IEEE International Conference on e-Science},
+     year={2024},
+     doi={10.1109/e-Science62913.2024.10678731},
+     pdf={https://hal.science/hal-04902079v1/document}
+   }
+
+   @inproceedings{souza_llm_agents_works_sc25,
+     title={{LLM} Agents for Interactive Workflow Provenance: Reference Architecture and Evaluation Methodology},
+     author={Souza, Renan and Poteet, Timothy and Etz, Brian and Rosendo, Daniel and Gueroudji, Amal and others},
+     booktitle={Workflows in Support of Large-Scale Science ({WORKS}) co-located with the {ACM}/{IEEE} International Conference for High Performance Computing, Networking, Storage, and Analysis ({SC})},
+     year={2025},
+     doi={10.1145/3731599.3767582}
+   }
+
+   @article{dorier2025toward,
+     author={Dorier, Matthieu and Gueroudji, Amal and Hayot-Sasson, Valerie and Nguyen, Hai and Ockerman, Seth and Souza, Renan and Bicer, Tekin and Pan, Haochen and Carns, Philip and Chard, Kyle and others},
+     doi={10.3389/fhpcp.2025.1638203},
+     journal={Frontiers in High Performance Computing},
+     title={Toward a Persistent Event-Streaming System for High-Performance Computing Applications},
+     volume={3},
+     year={2025}
+   }
+
+   @inproceedings{rosendo2025ai,
+     author={Rosendo, Daniel and DeWitt, Stephen and Souza, Renan and Austria, Phillipe and Ghosal, Tirthankar and McDonnell, Marshall and Miller, Ross and Skluzacek, Tyler J and Haley, James and Turcksin, Bruno and others},
+     booktitle={Extreme-Scale Experiment-in-the-Loop Computing ({XLOOP}) co-located with the {ACM}/{IEEE} International Conference for High Performance Computing, Networking, Storage, and Analysis ({SC})},
+     title={AI Agents for Enabling Autonomous Experiments at ORNL's HPC and Manufacturing User Facilities},
+     year={2025},
+     doi={10.1145/3731599.3767592}
+   }
diff --git a/docs/quick_start.rst b/docs/quick_start.rst
index 6ef231c8..167b3722 100644
--- a/docs/quick_start.rst
+++ b/docs/quick_start.rst
@@ -8,22 +8,19 @@ Quick Start
 
 The easiest way to capture provenance from plain Python functions—no external services required.
 
-Install and Initialize
-----------------------
+Install
+-------
 
-First, install Flowcept and initialize a settings file:
+First, install Flowcept:
 
 .. code-block:: bash
 
    # Make sure you activate your Python environment (conda, venv, etc.)
    pip install flowcept
-   flowcept --init-settings
 
-This creates a minimal settings file at ``~/.flowcept/settings.yaml``.
-
-Use this for the simplest offline path.
-
-If you need the full config structure instead, use:
+The simplest offline path does not require a settings file. If you need the
+full config structure for online services, adapters, telemetry, or deployment
+profiles, use:
 
 .. code-block:: bash
 
@@ -40,8 +37,6 @@ Save the following script as ``quickstart.py`` and run ``python quickstart.py``:
    Minimal example of Flowcept's instrumentation using decorators.
    No DB, broker, or external service required.
    """
-   import json
-
    from flowcept import Flowcept, flowcept_task
    from flowcept.instrumentation.flowcept_decorator import flowcept
 
@@ -67,9 +62,8 @@ Save the following script as ``quickstart.py`` and run ``python quickstart.py``:
    if __name__ == "__main__":
        main()
 
-       prov_buffer = Flowcept.read_buffer_file()
-       assert len(prov_buffer) == 2
-       print(json.dumps(prov_buffer, indent=2))
+       # print(Flowcept.read_buffer_file())  # inspect raw JSONL records if needed
+       Flowcept.generate_report(print_markdown=True)
 
 Inspecting the Output
 ---------------------
diff --git a/docs/schemas.rst b/docs/schemas.rst
index 4b2feee9..55ae2e59 100644
--- a/docs/schemas.rst
+++ b/docs/schemas.rst
@@ -14,10 +14,14 @@ Data Schemas for Flowcept data.
 PROV-AGENT and Flowcept
 =======================
 
-PROV-AGENT is a lightweight extension of `W3C PROV <https://www.w3.org/TR/prov-dm/>`_ for agentic workflows. It names the
-main building blocks you see in modern AI systems:
+PROV-AGENT is a `W3C PROV <https://www.w3.org/TR/prov-dm/>`_ extension for capturing provenance of agentic AI workflows.
+It is described in:
 
-- **Activities** such as Campaign, Workflow, and Task
+  R. Souza et al., *PROV-AGENT: Unified Provenance for Tracking AI Agent Interactions in Agentic Workflows*, IEEE International Conference on e-Science, Chicago, IL, USA, 2025. https://arxiv.org/abs/2508.02866
+
+PROV-AGENT names the main building blocks you see in modern AI systems:
+
+- **Activities** such as Campaign, Workflow, Task, AIModelInvocation, and AgentTool
 - **Agents** such as an AI agent or a human user
 - **Data Objects** such as domain data, prompts, responses, scheduling info, and telemetry
 - **Relations** such as *used*, *wasGeneratedBy*, *wasAssociatedWith*, *wasAttributedTo*, and *wasInformedBy*
@@ -42,6 +46,41 @@ At a high level:
 - **Relations** are preserved with IDs and standard fields (for example, workflow IDs, parent or dependency links),
   so the graph remains connected and queryable.
 
+PROV-AGENT task subtypes
+------------------------
+The ``subtype`` field on a Task record narrows it to a specific PROV-AGENT activity class.
+Use the :class:`~flowcept.commons.vocabulary.PROV_AGENT` enum to set these values:
+
+.. list-table::
+   :header-rows: 1
+   :widths: 30 25 45
+
+   * - Enum value
+     - Stored string
+     - Description
+   * - ``PROV_AGENT.AI_MODEL_INVOCATION``
+     - ``ai_model_invocation``
+     - A single LLM prompt→response call (*AIModelInvocation* in PROV-AGENT).
+       Captured automatically by :class:`~flowcept.instrumentation.flowcept_agent_task.FlowceptLLM`.
+       ``used.prompt`` stores the input; ``generated.response`` stores the output;
+       ``custom_metadata.llm_usage`` stores token counts.
+   * - ``PROV_AGENT.AGENT_TOOL``
+     - ``agent_tool``
+     - A tool execution by an AI agent (*AgentTool* in PROV-AGENT).
+       Captured automatically by the
+       :func:`~flowcept.instrumentation.flowcept_agent_task.agent_flowcept_task` decorator
+       applied to MCP tools and LangGraph tool nodes.
+       ``used`` stores tool arguments; ``generated`` stores the return value.
+
+The ``wasInformedBy`` relation — an ``AgentTool`` activity informing an ``AIModelInvocation`` — is
+the key link for root-cause analysis and downstream impact tracing in PROV-AGENT.  In Flowcept this
+is expressed through the ``agent_id`` field: every task with the same ``agent_id`` belongs to the
+same AI agent and can be queried together to reconstruct the full agent provenance graph.
+
+The UI uses ``subtype`` to visually distinguish AI agent activities from regular workflow tasks.
+Filter for ``subtype == "ai_model_invocation"`` or ``subtype == "agent_tool"`` to isolate agent
+interactions from the provenance database.
+
 Figure
 ------
 .. only:: html
diff --git a/docs/setup.rst b/docs/setup.rst
index 3fd9b0c9..042e85b7 100644
--- a/docs/setup.rst
+++ b/docs/setup.rst
@@ -31,6 +31,7 @@ Good practice is to cherry-pick the extras relevant to your workflow instead of
    pip install flowcept[mlflow]          # MLflow adapter
    pip install flowcept[dask]            # Dask adapter
    pip install flowcept[tensorboard]     # TensorBoard adapter
+   pip install flowcept[rabbitmq]        # RabbitMQ message queue
    pip install flowcept[kafka]           # Kafka message queue
    pip install flowcept[nvidia]          # NVIDIA GPU runtime capture
    pip install flowcept[telemetry]       # CPU/GPU/memory telemetry capture
@@ -114,9 +115,10 @@ Message Queue (MQ)
 
 Supported MQs:
 
-- `Redis <https://redis.io>`_ → **default**, lightweight, works on Linux, macOS, Windows, and HPC (tested on Frontier and Summit)  
-- `Kafka <https://kafka.apache.org>`_ → for distributed environments or if Kafka is already in your stack  
-- `Mofka <https://mofka.readthedocs.io>`_ → optimized for HPC runs  
+- `Redis <https://redis.io>`_ → **default**, lightweight, works on Linux, macOS, Windows, and HPC (tested on Frontier and Summit)
+- `RabbitMQ <https://www.rabbitmq.com>`_ → AMQP-based broker, suitable for cloud and enterprise environments
+- `Kafka <https://kafka.apache.org>`_ → for distributed environments or if Kafka is already in your stack
+- `Mofka <https://mofka.readthedocs.io>`_ → optimized for HPC runs
 
 Database (DB)
 --------------
@@ -149,10 +151,11 @@ Using Docker Compose (recommended)
 
 We provide a `Makefile <https://github.com/ORNL/flowcept/blob/main/deployment/Makefile>`_ with shortcuts:
 
-1. **Redis only (no DB)**: ``make services``   (LMDB can be used in this setup as a lightweight DB)  
-2. **Redis + MongoDB**: ``make services-mongo``  
-3. **Kafka + MongoDB**: ``make services-kafka``  
-4. **Mofka only (no DB)**: ``make services-mofka``  
+1. **Redis only (no DB)**: ``make services``   (LMDB can be used in this setup as a lightweight DB)
+2. **Redis + MongoDB**: ``make services-mongo``
+3. **RabbitMQ + MongoDB**: ``make services-rabbitmq``
+4. **Kafka + MongoDB**: ``make services-kafka``
+5. **Mofka only (no DB)**: ``make services-mofka``
 
 To customize, edit the YAML files in `deployment <https://github.com/ORNL/flowcept/tree/main/deployment>`_ and run:
 
diff --git a/examples/agents/aec_agent_context_manager.py b/examples/agents/aec_agent_context_manager.py
index 168c2b78..aa2f9350 100644
--- a/examples/agents/aec_agent_context_manager.py
+++ b/examples/agents/aec_agent_context_manager.py
@@ -3,7 +3,7 @@
 import json
 
 from flowcept.flowceptor.consumers.agent.base_agent_context_manager import BaseAgentContextManager
-from flowcept.agents.agent_client import run_tool
+from flowcept.agents.mcp.mcp_client import run_tool
 
 
 @dataclass
diff --git a/examples/agents/aec_agent_mock.py b/examples/agents/aec_agent_mock.py
index c3c9f1c1..351c36e5 100644
--- a/examples/agents/aec_agent_mock.py
+++ b/examples/agents/aec_agent_mock.py
@@ -7,7 +7,7 @@
 from mcp.server.fastmcp import FastMCP
 
 from flowcept.configs import AGENT
-from flowcept.agents.agents_utils import build_llm_model
+from flowcept.agents.llm.builders import build_llm_model
 
 from examples.agents.aec_agent_context_manager import AdamantineAeCContextManager
 from examples.agents.aec_prompts import choose_option_prompt, generate_options_set_prompt
diff --git a/examples/agents/opt_driver_mock.py b/examples/agents/opt_driver_mock.py
index bbd3b339..c966dce0 100644
--- a/examples/agents/opt_driver_mock.py
+++ b/examples/agents/opt_driver_mock.py
@@ -4,7 +4,7 @@
 from typing import Dict, List
 
 from flowcept.flowcept_api.flowcept_controller import Flowcept
-from flowcept.agents.agent_client import run_tool
+from flowcept.agents.mcp.mcp_client import run_tool
 from flowcept.flowceptor.consumers.base_consumer import BaseConsumer
 from flowcept.instrumentation.flowcept_task import flowcept_task
 from flowcept.instrumentation.task_capture import FlowceptTask
diff --git a/examples/llm_complex/llm_model.py b/examples/llm_complex/llm_model.py
index 80a718dc..b7532c65 100644
--- a/examples/llm_complex/llm_model.py
+++ b/examples/llm_complex/llm_model.py
@@ -229,7 +229,7 @@ def model_train(
         if val_loss < best_val_loss:
             best_val_loss = val_loss
             if with_persistence:
-                best_obj_id = Flowcept.db.save_or_update_torch_model(
+                best_obj_id = Flowcept.insert_or_update_torch_model(
                     model,
                     object_id=best_obj_id,
                     task_id=epochs_loop.get_current_iteration_id(),
diff --git a/examples/llm_tutorial/llm_model.py b/examples/llm_tutorial/llm_model.py
index ac8cfdfa..e52db3f5 100644
--- a/examples/llm_tutorial/llm_model.py
+++ b/examples/llm_tutorial/llm_model.py
@@ -231,7 +231,7 @@ def model_train(
         if val_loss < best_val_loss:
             best_val_loss = val_loss
             if with_persistence:
-                best_obj_id = Flowcept.db.save_or_update_torch_model(
+                best_obj_id = Flowcept.insert_or_update_torch_model(
                     model,
                     object_id=best_obj_id,
                     task_id=epochs_loop.get_current_iteration_id(),
diff --git a/examples/start_here.py b/examples/start_here.py
index b17e7f4f..7e856e5c 100644
--- a/examples/start_here.py
+++ b/examples/start_here.py
@@ -2,11 +2,10 @@
 This is a very simple script to show the basic instrumentation capabilities of Flowcept, using its most straightforward
 way of capturing workflow provenance from functions: using @decorators. It is meant to be executed in offline model.
 
-Flowcept will flush its internal buffer to a simple JSONL file in the end, if a `dump_buffer_path` is defined in
- the settings file (typically under ~/.flowcept/settings.yaml).
+Flowcept will flush its internal buffer to a simple JSONL file at the end of the run.
 
 This very simple scenario does not need any database, streaming service, message queue or any other external service.
-It should run fine after installing Flowcept via `pip install flowcept` and running `$> flowcept --init-settings`.
+It should run fine after installing Flowcept via `pip install flowcept`.
 
 For more complex features, such as online provenance analysis, HPC requirements, federated/highly distributed execution,
  data observability from existing adapters, PyTorch models, telemetry capture optimization, query requirements, or
@@ -45,11 +44,8 @@ def main():
     main()
 
     # Reporting and verifications:
-    prov_buffer = Flowcept.read_buffer_file()
-    assert len(prov_buffer) == 2
+    raw_records = Flowcept.read_buffer_file()
+    assert len(raw_records) == 2
     workflow_card_path = "WORKFLOW_CARD.md"
-    report_stats = Flowcept.generate_report(
-        records=prov_buffer,
-        output_path=workflow_card_path,
-    )
+    Flowcept.generate_report(output_path=workflow_card_path)
     print(f"{workflow_card_path} generated!")
diff --git a/examples/unmanaged/simple_task2.py b/examples/unmanaged/simple_task2.py
index a834a9d2..926e3423 100644
--- a/examples/unmanaged/simple_task2.py
+++ b/examples/unmanaged/simple_task2.py
@@ -41,4 +41,4 @@ def super_func4(alpha):
     flowcept.stop()
 
     flowcept_messages = Flowcept.read_buffer_file()
-    assert len(flowcept_messages) == 5
+    assert len(flowcept_messages) == 6
diff --git a/pyproject.toml b/pyproject.toml
index 326ef45b..f763ce57 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -47,14 +47,15 @@ dependencies = [
     "omegaconf",
     "numpy",
     "msgpack",
-    "orjson"
+    "orjson",
+    "rich",
 ]
 
 [project.optional-dependencies]
 redis = ["redis<8"]
 lmdb = ["lmdb"]
 telemetry = ["psutil>=6.1.1", "py-cpuinfo"]
-extras = ["flowcept[redis]", "flowcept[telemetry]", "flowcept[mongo]", "GitPython", "pandas", "pyarrow", "requests", "rich"]
+extras = ["flowcept[redis]", "flowcept[telemetry]", "flowcept[mongo]", "GitPython", "pandas", "pyarrow", "requests"]
 webservice = ["fastapi", "uvicorn", "pyyaml", "sse-starlette"]
 
 report_pdf = ["matplotlib", "reportlab", "networkx"]
@@ -62,12 +63,13 @@ mongo = ["pymongo", "pyarrow"]
 dask = ["tomli", "dask[distributed]<=2024.10.0"]
 docs = ["sphinx", "furo"]
 kafka = ["confluent-kafka<=2.8.0"]  # As of today, 2/28/2025, version 2.8.1 is stale. When this gets fixed, let's remove the version constraint. https://pypi.org/project/confluent-kafka/#history
+rabbitmq = ["pika"]
 mlflow = ["mlflow-skinny", "SQLAlchemy", "alembic", "watchdog", "cryptography"]
 nvidia = ["nvidia-ml-py"]
 amd = ["amdsmi"]
 mqtt = ["paho-mqtt"]
 tensorboard = ["tensorboard", "tensorflow", "tbparse"]
-llm_agent = ["mcp[cli]", "langchain_community", "langchain_openai", "streamlit", "PyMuPDF", "matplotlib", "tabulate"]
+llm_agent = ["mcp[cli]", "langchain_community", "langchain_openai", "langgraph", "streamlit", "PyMuPDF", "matplotlib", "tabulate"]
 llm_google = ["flowcept[llm_agent]", "google-genai"]
 llm_agent_audio = ["flowcept[llm_agent]", "streamlit-mic-recorder", "SpeechRecognition", "pydub", "gTTS"]
 # System dependency (required for pydub)
@@ -78,9 +80,9 @@ llm_agent_audio = ["flowcept[llm_agent]", "streamlit-mic-recorder", "SpeechRecog
 
 dev = [
     "flowcept[docs]",
+    "flowcept[rabbitmq]",
     "jupyterlab",
     "nbmake",
-    "pika",
     "pytest",
     "pytest-timeout",
     "ruff",
@@ -105,6 +107,7 @@ all = [
     "flowcept[mongo]",
     "flowcept[dask]",
     "flowcept[kafka]",
+    "flowcept[rabbitmq]",
     "flowcept[mlflow]",
     "flowcept[mqtt]",
     "flowcept[tensorboard]",
@@ -136,6 +139,9 @@ artifacts = ["src/flowcept/webservice/ui_build/**"]
 "resources/sample_settings.yaml" = "resources/sample_settings.yaml"
 
 [tool.pytest.ini_options]
+markers = [
+    "llm: tests that require a real LLM (run locally with env set; excluded from CI except run-llm-tests.yml)",
+]
 filterwarnings = [
     "ignore:websockets\\.legacy is deprecated:DeprecationWarning",
     "ignore:websockets\\.server\\.WebSocketServerProtocol is deprecated:DeprecationWarning",
diff --git a/resources/sample_settings.yaml b/resources/sample_settings.yaml
index 94963b1e..52fd22ae 100644
--- a/resources/sample_settings.yaml
+++ b/resources/sample_settings.yaml
@@ -44,13 +44,15 @@ experiment:
 
 mq:
   enabled: false
-  type: redis  # or kafka or mofka; Please adjust the port (kafka's default is 9092; redis is 6379). If mofka, adjust the group_file.
+  type: redis  # or kafka, mofka, rabbitmq; adjust port accordingly (redis: 6379, kafka: 9092, rabbitmq: 5672). If mofka, also set group_file.
   host: localhost
   # uri: ?
   # instances: ["localhost:6379"] # We can have multiple MQ instances being accessed by the consumers but each interceptor will currently access one single MQ..
   port: 6379
   # group_id: auto  # Kafka-only consumer group id. Use "auto" to generate a unique group per run.
   # group_file: mofka.json
+  # username: guest  # RabbitMQ only (AMQP); default is "guest"
+  # vhost: /         # RabbitMQ only; default is "/"
   channel: interception
   buffer_size: 50
   insertion_buffer_time_secs: 5
@@ -107,6 +109,7 @@ agent:
   chat_enabled: true # Enable the /api/v1/chat endpoint (requires the llm_agent extra and LLM settings above).
   chat_max_tool_iterations: 5 # Max LLM tool-calling iterations per chat message.
   chat_max_query_limit: 1000 # Hard cap for records returned by chat LLM query tools.
+  agent_mode: disabled # How the MCP agent is deployed: disabled | separate | colocated
 
 databases:
 
diff --git a/src/flowcept/README.md b/src/flowcept/README.md
index 5317e89b..7f4f3dfa 100644
--- a/src/flowcept/README.md
+++ b/src/flowcept/README.md
@@ -19,6 +19,20 @@ This directory contains the runtime package. Use this README as a code-orientati
 - `report/`: workflow card and PDF report generation.
 - `webservice/`: FastAPI read-only REST API.
 
+## Separation of Concerns
+
+Keep each module focused on one layer. Do not mix HTTP, orchestration, and persistence
+logic in the same place.
+
+- UI / Dashboard / user client → HTTP route → small service layer → `DBAPI` → DAO
+  (`MongoDBDAO` or `LMDBDAO`) → MongoDB / LMDB.
+- UI / Dashboard / chat route → LangChain / LangGraph orchestrator → MCP tool calls
+  → `DBAPI` or in-memory runtime objects.
+
+The webservice package should stay thin. The agents package should own orchestration
+and tool logic. Persistence stays in DAO files. Runtime queries can read the active
+DataFrame or workflow object in memory when that is the right source of truth.
+
 ## Code Rules
 
 - Keep config defaults and env-var reads in `configs.py`; do not hardcode runtime config elsewhere.
diff --git a/src/flowcept/agents/README.md b/src/flowcept/agents/README.md
index 4fb78c8e..633faa5d 100644
--- a/src/flowcept/agents/README.md
+++ b/src/flowcept/agents/README.md
@@ -1,168 +1,181 @@
 # Flowcept Agent
 
-This package contains the Flowcept MCP server, client helpers, tools, prompts,
-context manager, and optional UI pieces.
+This package contains the Flowcept MCP server, client helpers, data-query tools,
+MCP-wrapper tools, prompts, context manager, and LLM infrastructure.
+
+For code-assistant behavior, use the repository root `AGENTS.md`. Runtime usage
+docs live in `docs/agent.rst`.
+
+## What Lives Here
+
+- `chat_orchestration/`: LangChain / LangGraph orchestration for the web chat.
+  This is where the chat runtime, tool routing, and turn-level orchestration live.
+  It should stay separate from HTTP route handlers.
+- `mcp/`: the standalone MCP server surface. Keep these wrappers thin. They should
+  load context, call tools, and return `ToolResult`, but not own business logic.
+- `mcp/mcp_tools/`: MCP wrappers around shared tool cores. These are the public MCP
+  entry points that external assistants call.
+- `data_query_tools/`: shared query logic. This is where task, workflow, object, and
+  DataFrame query behavior lives. These modules can call `DBAPI` for persisted data
+  or read the in-memory DataFrame / workflow object for runtime questions.
+- `prompts/`: prompt-builder functions and prompt registrations. Keep them as plain
+  Python builders that return strings, not Jinja templates.
+- `provenance_schema_manager/`: schema introspection and documentation context used by
+  prompt builders.
+- `llm/`: model construction and normalization helpers. Centralize LLM creation here.
+- `gui/`: legacy UI helpers. Do not extend this unless the old GUI is being revived.
+
+## Directory Layout
 
-For code-assistant behavior, use the repository root `AGENTS.md`. Do not
-duplicate agent rules here. Runtime usage docs live in `docs/agent.rst`.
-
-## One Agent, Two Orchestrators
-
-Flowcept Agent has one shared backend and two orchestration paths.
-
-Both paths use the same MCP server, in-memory context, tools, prompts, and
-execution functions. The only intended difference is who does routing and LLM
-reasoning:
-
-- **Internal LLM mode:** Flowcept builds the configured LLM and orchestrates.
-- **External LLM mode:** Codex, Claude, LibreChat, Cursor, or another assistant
-  orchestrates and calls Flowcept MCP prompts/tools.
-
-## Shared Backend
-
-- `flowcept_agent.py` starts the MCP server.
-- `flowcept_ctx_manager.py` owns the live task/object/workflow context.
-- `tools/general_tools.py` exposes `prompt_handler` and shared commands.
-- `tools/in_memory_queries/` queries task/object DataFrames.
-- `tools/workflow_query_tools.py` queries the active workflow message object.
-- `prompts/` builds prompts for internal and external LLM generation.
-- `agents_utils.py` builds the configured internal LLM when Flowcept owns
-  orchestration.
-
-## Internal LLM Mode
-
-Use this when Flowcept should route free-text messages itself.
-
-```yaml
-agent:
-  external_llm: false
+```
+agents/
+  context_manager.py         # FlowceptAgentContextManager, mcp_flowcept, get_df_context
+  tool_result.py             # ToolResult Pydantic model (2xx/3xx/4xx/5xx conventions)
+
+  llm/
+    builders.py              # build_llm_model(), normalize_message()
+    providers/
+      claude_gcp.py          # ClaudeOnGCPLLM (Vertex AI)
+      gemini25.py            # Gemini25LLM
+
+  chat_orchestration/
+    chat_orchestrator_service.py  # LangGraph + MemorySaver chat turn orchestration
+
+  provenance_schema_manager/
+    static_schema_builder.py # SCHEMA_CONTEXT, build_schema_context, assert_schema_documented
+    dynamic_schema_tracker.py # Tracks evolving task/object schemas from live messages
+
+  data_query_tools/          # Plain-Python tool cores — NO MCP imports
+    db_query_tools.py        # query_tasks, query_workflows, get_task_summary, …
+    in_memory_task_query_tools.py   # run_df_query, generate_result_df, …
+    in_memory_workflow_query_tools.py  # execute_generated_workflow_query, run_workflow_query
+    pandas_utils.py          # safe_execute, normalize_output, format_result_df, …
+
+  mcp/
+    mcp_server.py            # MCP server entry point (start with `flowcept --start-agent`)
+    mcp_client.py            # Client helpers: run_tool(), run_prompt()
+    mcp_tools/               # Thin MCP wrappers over data_query_tools/
+      db_query_mcp_tools.py
+      in_memory_task_query_mcp_tools.py
+      in_memory_workflow_query_mcp_tools.py
+      session_tools.py       # check_liveness, check_llm, record_guidance, reset_context, …
+      report_tools.py        # generate_workflow_card
+
+  prompts/
+    README.md                # Prompt authoring rules
+    base_prompts.py          # BASE_ROLE, build_single_task_prompt, build_multitask_prompt
+    db_query_prompts.py      # build_db_filter_prompt
+    in_memory_task_query_prompts.py   # Pandas code / plot prompt builders
+    in_memory_workflow_query_prompts.py  # Workflow message query prompt builders
+    chat_prompts.py          # build_chat_system_prompt() for the webservice chat
+    mcp_prompts.py           # @mcp_flowcept.prompt() registrations
 ```
 
-Typical path:
+## One Agent, Two Orchestrators
 
-1. A client calls `prompt_handler(message)`.
-2. Flowcept builds the configured model with `build_llm_model()`.
-3. Flowcept classifies the message with the routing prompt.
-4. Flowcept calls the same MCP tools used by the external path.
-5. Tool results are returned to the client.
+The MCP agent exposes explicit tools. Claude Code, Codex, LibreChat, or another
+assistant can call MCP prompt-builders and execution tools directly.
 
-This mode supports natural-language routing through `prompt_handler`, including
-task/object DataFrame questions, plots, small talk, records, context reset, and
-direct DataFrame code execution.
+The webservice chat path is the sister module that owns the HTTP-facing chat UI.
+Its route layer stays thin and delegates to the chat orchestrator in
+`src/flowcept/webservice/services/`. That orchestrator calls into the same shared
+tool cores used by the MCP surface.
 
-## External LLM Mode
+## Schema Context
 
-Use this when an outside assistant should own reasoning and planning.
+`SCHEMA_CONTEXT` (module-level dict in `provenance_schema_manager/static_schema_builder.py`) is populated at
+MCP server startup via `build_schema_context()`. It maps:
 
-```yaml
-agent:
-  external_llm: true
+```python
+{
+  "task_fields": [...],            # TaskObject attribute docs
+  "workflow_fields": [...],        # WorkflowObject attribute docs
+  "telemetry_summary_fields": [...],  # TelemetrySummary + subclass docs
+  ...
+}
 ```
 
-Typical path:
-
-1. The outside assistant calls a Flowcept MCP prompt builder.
-2. The outside assistant sends that prompt to its own LLM.
-3. The outside assistant calls the matching Flowcept execution tool.
-4. Flowcept executes against the same live in-memory context.
-
-In this mode, arbitrary free-text messages sent to `prompt_handler` are not
-internally routed. This prevents Flowcept from silently becoming the planner
-when the outside assistant is supposed to plan.
+All prompt builders in `prompts/` use `SCHEMA_CONTEXT` for field tables instead
+of hardcoded strings. The MCP server refuses to start if any non-private field
+is undocumented (`SchemaDocumentationError`).
 
 ## Equivalent Tool Paths
 
-| Capability | Internal orchestration | External orchestration |
+| Capability | Internal | External |
 |---|---|---|
-| Task DataFrame question | `prompt_handler("...")` -> `run_df_query(...)` | `build_df_query_prompt(...)` -> external LLM -> `execute_generated_df_code(...)` |
-| Object DataFrame question | `prompt_handler("o: ...")` -> `run_df_query(context_kind="objects")` | `build_df_query_prompt(context_kind="objects")` -> external LLM -> `execute_generated_df_code(context_kind="objects")` |
-| Workflow metadata question | `prompt_handler("w: ...")` -> `run_workflow_query(...)` | `build_workflow_query_prompt(...)` -> external LLM -> `execute_generated_workflow_query(...)` |
-| Direct DataFrame code | `prompt_handler("result = df ...")` | `execute_generated_df_code("result = df ...")` |
-| Context reset and records | `prompt_handler("reset context")`, `@record`, `@show records`, `@reset records` | Same tools/commands |
-| Provenance reports | Flowcept report tools | Same report tools called explicitly |
-
-## Prefix Shortcuts
+| Task DF question | `run_df_query` | `build_df_query_prompt` → LLM → `execute_generated_df_code` |
+| Object DF question | `run_df_query(context_kind="objects")` | same, `context_kind="objects"` |
+| Workflow question | `run_workflow_query` | `build_workflow_query_prompt` → LLM → `execute_generated_workflow_query` |
+| DB provenance | `query_tasks` / `query_workflows` | same tools |
+| Reports | `generate_workflow_card` | same tool |
 
-These shortcuts are accepted by `prompt_handler` in both modes:
+## PROV-AGENT Instrumentation
 
-- `t: <question>` queries the task DataFrame.
-- `o: <question>` queries the object DataFrame.
-- `w: <question>` queries the workflow message object.
-- `result = df ...` executes explicit pandas code.
-- `save` saves the current DataFrame context.
-- `reset context`, `@record`, `@show records`, and `@reset records` manage
-  context and guidance.
+Flowcept tracks AI agent provenance following the **PROV-AGENT** model
+(arXiv:2508.02866), a W3C PROV extension for agentic workflows.
+Two `subtype` values from `flowcept.commons.vocabulary.PROV_AGENT` identify
+agent-specific activities in the task database:
 
-Important nuance: prefix shortcuts are convenience paths. If a shortcut needs
-LLM generation, the current implementation may build Flowcept's configured LLM.
-For strict external orchestration, use prompt-builder tools plus execution tools.
-
-## Start The MCP Server
+| Enum | Stored string | What it captures |
+|---|---|---|
+| `PROV_AGENT.AI_MODEL_INVOCATION` | `"ai_model_invocation"` | One LLM prompt → response call |
+| `PROV_AGENT.AGENT_TOOL` | `"agent_tool"` | One tool execution by an AI agent |
 
-Prefer the CLI:
+### Automatic capture
 
-```bash
-flowcept --start-agent
-```
+**MCP tools** — every `@mcp_flowcept.tool()` function in `mcp_tools/` is also
+decorated with `@agent_flowcept_task(subtype=PROV_AGENT.AGENT_TOOL)`.  No extra
+code needed; tool calls are stored automatically when the interceptor is running.
 
-Equivalent module form:
+**LLM calls** — wrap any LangChain model with `FlowceptLLM` to record every
+`.invoke()` as `PROV_AGENT.AI_MODEL_INVOCATION`:
 
-```bash
-python -m flowcept.agents.flowcept_agent
+```python
+from flowcept.instrumentation.flowcept_agent_task import FlowceptLLM
+wrapped = FlowceptLLM(llm, agent_id=my_agent_id)
+response = wrapped.invoke("How many tasks failed?")
 ```
 
-Run from a Python environment where Flowcept is installed.
+**LangGraph chat** — `run_chat` in `chat_orchestration/chat_orchestrator_service.py`
+wraps each graph execution in a `Flowcept` context (`workflow_name="Flowcept LangGraph Chat"`,
+`start_persistence=True`).  This gives every chat turn its own `workflow_id`.
+Within the graph, `call_model` uses `FlowceptLLM` and `call_tools` uses
+`FlowceptTask(subtype=PROV_AGENT.AGENT_TOOL)` — both inherit
+`Flowcept.current_workflow_id` automatically.
 
-## Internal Prompt Handler Example
+### Querying agent provenance
 
 ```python
-from flowcept.agents.agent_client import run_tool
+# All LLM calls by a specific agent
+Flowcept.db.task_query(filter={"subtype": "ai_model_invocation", "agent_id": my_agent_id})
 
-result = run_tool(
-    "prompt_handler",
-    kwargs={"message": "What are the top 5 slowest activities?"},
-)
+# All tool executions in a chat session (workflow)
+Flowcept.db.task_query(filter={"subtype": "agent_tool", "workflow_id": thread_id})
 ```
 
-## External DataFrame Query Example
-
-```python
-from flowcept.agents.agent_client import run_prompt, run_tool
+The UI uses `subtype` to display AI agent workflows differently from regular
+scientific workflow tasks.
 
-prompt = run_prompt(
-    "build_df_query_prompt",
-    args={"query": "What are the top 5 slowest activities?", "context_kind": "tasks"},
-)
+See `docs/schemas.rst` → *PROV-AGENT and Flowcept* for the full data model and
+paper reference.
 
-# The external assistant sends `prompt` to its own LLM and gets pandas code.
-generated_code = (
-    "result = df.assign(duration=(df['ended_at'] - df['started_at']))"
-    ".groupby('activity_id', dropna=False)['duration']"
-    ".mean().sort_values(ascending=False).head(5)"
-    ".reset_index(name='avg_duration')"
-)
+## Starting the MCP Server
 
-result = run_tool(
-    "execute_generated_df_code",
-    kwargs={"user_code": generated_code, "context_kind": "tasks"},
-)
+```bash
+flowcept --start-agent
 ```
 
-## External Workflow Query Example
+## Client Usage
 
 ```python
-from flowcept.agents.agent_client import run_prompt, run_tool
+from flowcept.agents.mcp.mcp_client import run_tool, run_prompt
 
-prompt = run_prompt(
-    "build_workflow_query_prompt",
-    args={"query": "What settings path was used?"},
-)
+# Call a tool
+result = run_tool("run_df_query", kwargs={"query": "top 5 slowest activities", "context_kind": "tasks"})
 
-# The external assistant sends `prompt` to its own LLM and gets a JSON spec.
-query_spec = {"field_paths": ["conf.settings_path"], "missing": [], "answer_style": "short"}
-
-result = run_tool(
-    "execute_generated_workflow_query",
-    kwargs={"query_spec": query_spec},
+# Use a prompt builder (external LLM mode)
+prompt = run_prompt(
+  "build_df_query_prompt",
+  args={"query": "top 5 slowest activities", "context_kind": "tasks"},
 )
 ```
diff --git a/src/flowcept/agents/__init__.py b/src/flowcept/agents/__init__.py
index f24686ac..b248dd24 100644
--- a/src/flowcept/agents/__init__.py
+++ b/src/flowcept/agents/__init__.py
@@ -1,7 +1,7 @@
 # flake8: noqa: F403
 """Agents subpackage."""
 
-from flowcept.agents.tools.general_tools import *
-from flowcept.agents.tools.in_memory_queries.in_memory_queries_tools import *
-from flowcept.agents.tools.db_prov_tools import *
-from flowcept.agents.tools.workflow_query_tools import *
+from flowcept.agents.tool_result import ToolResult  # noqa: F401
+from flowcept.agents.mcp.mcp_tools import *
+from flowcept.agents.mcp.mcp_tools.df_query_mcp_tools import *
+from flowcept.agents.mcp.mcp_tools.db_query_mcp_tools import *
diff --git a/src/flowcept/agents/agents_utils.py b/src/flowcept/agents/agents_utils.py
deleted file mode 100644
index ae6c3e7f..00000000
--- a/src/flowcept/agents/agents_utils.py
+++ /dev/null
@@ -1,232 +0,0 @@
-import os
-import re
-import unicodedata
-from typing import Union, Dict
-
-from flowcept.flowceptor.consumers.agent.base_agent_context_manager import BaseAgentContextManager
-from flowcept.instrumentation.flowcept_agent_task import FlowceptLLM, get_current_context_task
-
-from flowcept.configs import AGENT
-from pydantic import BaseModel
-
-
-class ToolResult(BaseModel):
-    """
-    ToolResult is a standardized wrapper for tool outputs, encapsulating
-    status codes, results, and optional metadata.
-
-    This class provides conventions for interpreting the output of tools
-    (e.g., LLM calls, DataFrame operations, plotting functions) and ensures
-    consistent handling of both successes and errors.
-
-    Conventions
-    -----------
-    - **2xx: Success (string result)**
-      - Result is the expected output as a string.
-      - Example: ``201`` → operation completed successfully.
-
-    - **3xx: Success (dict result)**
-      - Result is the expected output as a dictionary.
-      - Example: ``301`` → operation completed successfully.
-
-    - **4xx: Error (string message)**
-      - System or agent internal error, returned as a string message.
-      - ``400``: LLM call problem (e.g., server connection or token issues).
-      - ``404``: Empty or ``None`` result.
-      - ``405``: LLM responded, but format was wrong.
-      - ``406``: Error executing Python code.
-      - ``499``: Other uncategorized error.
-
-    - **5xx: Error (dict result)**
-      - System or agent internal error, returned as a structured dictionary.
-
-    - **None**
-      - Result not yet set or tool did not return anything.
-
-    Attributes
-    ----------
-    code : int or None
-        Status code indicating success or error category.
-    result : str or dict, optional
-        The main output of the tool (string, dict, or error message).
-    extra : dict or str or None
-        Additional metadata or debugging information.
-    tool_name : str or None
-        Name of the tool that produced this result.
-
-    Methods
-    -------
-    result_is_str() -> bool
-        Return True if the result should be interpreted as a string.
-    is_success() -> bool
-        Return True if the result represents any type of success.
-    is_success_string() -> bool
-        Return True if the result is a success with a string output (2xx).
-    is_error_string() -> bool
-        Return True if the result is an error with a string message (4xx).
-    is_success_dict() -> bool
-        Return True if the result is a success with a dict output (3xx).
-
-    Examples
-    --------
-    >>> ToolResult(code=201, result="Operation successful")
-    ToolResult(code=201, result='Operation successful')
-
-    >>> ToolResult(code=301, result={"data": [1, 2, 3]})
-    ToolResult(code=301, result={'data': [1, 2, 3]})
-
-    >>> ToolResult(code=405, result="Invalid format from LLM")
-    ToolResult(code=405, result='Invalid format from LLM')
-    """
-
-    code: int | None = None
-    result: Union[str, Dict] = None
-    extra: Dict | str | None = None
-    tool_name: str | None = None
-
-    def result_is_str(self) -> bool:
-        """Returns True if the result is a string."""
-        return (200 <= self.code < 300) or (400 <= self.code < 500)
-
-    def is_success(self):
-        """Returns True if the result is a success."""
-        return self.is_success_string() or self.is_success_dict()
-
-    def is_success_string(self):
-        """Returns True if the result is a success string."""
-        return 200 <= self.code < 300
-
-    def is_error_string(self):
-        """Returns True if the result is an error string."""
-        return 400 <= self.code < 500
-
-    def is_success_dict(self) -> bool:
-        """Returns True if the result is a success dictionary."""
-        return 300 <= self.code < 400
-
-
-def build_llm_model(
-    model_name=None,
-    model_kwargs=None,
-    service_provider=None,
-    agent_id=BaseAgentContextManager.agent_id,
-    track_tools=True,
-    return_response_object=False,
-) -> FlowceptLLM:
-    """
-    Build and return an LLM instance using agent configuration.
-
-    This function retrieves the model name and keyword arguments from the AGENT configuration,
-    constructs a SambaStudio LLM instance, and returns it.
-
-    Returns
-    -------
-    LLM
-        An initialized LLM object configured using the `AGENT` settings.
-    """
-    _model_kwargs = (AGENT.get("model_kwargs") or {}).copy()
-    if model_kwargs is not None:
-        for k in model_kwargs:
-            _model_kwargs[k] = model_kwargs[k]
-
-    if "model" not in _model_kwargs:
-        _model_kwargs["model"] = AGENT.get("model", model_name)
-
-    if service_provider:
-        _service_provider = service_provider
-    else:
-        _service_provider = AGENT.get("service_provider")
-
-    if _service_provider == "sambanova":
-        from langchain_community.llms.sambanova import SambaStudio
-
-        os.environ["SAMBASTUDIO_URL"] = os.environ.get("SAMBASTUDIO_URL", AGENT.get("llm_server_url"))
-        os.environ["SAMBASTUDIO_API_KEY"] = os.environ.get("SAMBASTUDIO_API_KEY", AGENT.get("api_key"))
-
-        llm = SambaStudio(model_kwargs=_model_kwargs)
-    elif _service_provider == "azure":
-        from langchain_openai.chat_models.azure import AzureChatOpenAI
-
-        api_key = os.environ.get("AZURE_OPENAI_API_KEY", AGENT.get("api_key", None))
-        service_url = os.environ.get("AZURE_OPENAI_API_ENDPOINT", AGENT.get("llm_server_url", None))
-        llm = AzureChatOpenAI(
-            azure_deployment=_model_kwargs.get("model"), azure_endpoint=service_url, api_key=api_key, **_model_kwargs
-        )
-    elif _service_provider == "openai":
-        from langchain_openai import ChatOpenAI
-
-        api_key = os.environ.get("OPENAI_API_KEY", AGENT.get("api_key", None))
-        base_url = os.environ.get("OPENAI_BASE_URL", AGENT.get("llm_server_url") or None)
-        org = os.environ.get("OPENAI_ORG_ID", AGENT.get("organization", None))
-
-        init_kwargs = {"api_key": api_key}
-        if base_url:
-            init_kwargs["base_url"] = base_url
-        if org:
-            init_kwargs["organization"] = org
-
-        llm = ChatOpenAI(**init_kwargs, **_model_kwargs)
-    elif _service_provider == "google":
-        if "claude" in _model_kwargs["model"]:
-            api_key = os.environ.get("GOOGLE_API_KEY", AGENT.get("api_key", None))
-            _model_kwargs["model_id"] = _model_kwargs.pop("model")
-            _model_kwargs["google_token_auth"] = api_key
-            from flowcept.agents.llms.claude_gcp import ClaudeOnGCPLLM
-
-            llm = ClaudeOnGCPLLM(**_model_kwargs)
-        elif "gemini" in _model_kwargs["model"]:
-            from flowcept.agents.llms.gemini25 import Gemini25LLM
-
-            llm = Gemini25LLM(**_model_kwargs)
-    else:
-        raise Exception("Currently supported providers are sambanova, openai, azure, and google.")
-    if track_tools:
-        llm = FlowceptLLM(llm, return_response_object=return_response_object)
-        if agent_id is None:
-            agent_id = BaseAgentContextManager.agent_id
-        llm.agent_id = agent_id
-        if track_tools:
-            tool_task = get_current_context_task()
-            if tool_task:
-                llm.parent_task_id = tool_task.task_id
-    return llm
-
-
-def normalize_message(user_msg: str) -> str:
-    """
-    Normalize a user message into a canonical, comparison-friendly form.
-
-    The function standardizes text by trimming whitespace, applying Unicode
-    normalization, normalizing dash characters, collapsing repeated whitespace,
-    removing trailing punctuation that does not affect semantics, and converting
-    the result to lowercase.
-
-    Parameters
-    ----------
-    user_msg : str
-        Raw user input message.
-
-    Returns
-    -------
-    str
-        Normalized message suitable for matching, comparison, or hashing.
-    """
-    # 1) Strip leading/trailing whitespace
-    user_msg = user_msg.strip()
-
-    # 2) Unicode normalize to avoid weird characters (like fancy quotes, dashes)
-    user_msg = unicodedata.normalize("NFKC", user_msg)
-
-    # 3) Normalize dashes commonly used in chemistry (C–H, C—H, etc.)
-    user_msg = user_msg.replace("–", "-").replace("—", "-")
-
-    # 4) Collapse multiple spaces / newlines into a single space
-    user_msg = re.sub(r"\s+", " ", user_msg)
-
-    # 5) Remove trailing punctuation that doesn't change semantics
-    #    e.g., "?", "!", "." at the VERY end
-    user_msg = re.sub(r"[?!.\s]+$", "", user_msg)
-
-    user_msg = user_msg.lower()
-
-    return user_msg
diff --git a/src/flowcept/agents/chat_orchestration/__init__.py b/src/flowcept/agents/chat_orchestration/__init__.py
new file mode 100644
index 00000000..e3c007b6
--- /dev/null
+++ b/src/flowcept/agents/chat_orchestration/__init__.py
@@ -0,0 +1 @@
+"""LangChain/LangGraph orchestration for Flowcept agent chat."""
diff --git a/src/flowcept/agents/chat_orchestration/chat_orchestrator_service.py b/src/flowcept/agents/chat_orchestration/chat_orchestrator_service.py
new file mode 100644
index 00000000..2ed02aa0
--- /dev/null
+++ b/src/flowcept/agents/chat_orchestration/chat_orchestrator_service.py
@@ -0,0 +1,683 @@
+"""LLM chat orchestration for the webservice: LangGraph + MemorySaver tool-calling loop."""
+
+from __future__ import annotations
+
+import json
+import uuid
+from typing import Any, Dict, Generator, List, Optional
+
+from langchain_core.messages import AIMessage, HumanMessage, SystemMessage, ToolMessage
+from langgraph.checkpoint.memory import MemorySaver
+from langgraph.graph import END, MessagesState, StateGraph
+
+from langgraph.errors import GraphRecursionError
+
+from flowcept.agents.prompts.chat_prompts import build_chat_system_prompt
+from flowcept.agents.mcp.mcp_client import run_tool
+from flowcept.commons.flowcept_logger import FlowceptLogger
+from flowcept.commons.utils import sanitize_json_like
+from flowcept.commons.vocabulary import PROV_AGENT
+from flowcept.configs import AGENT_CHAT_MAX_TOOL_ITERATIONS, AGENT_CHAT_MAX_TOOL_RESULT_CHARS, INSTRUMENTATION_ENABLED
+
+MAX_TOOL_ITERATIONS = AGENT_CHAT_MAX_TOOL_ITERATIONS
+# Cap individual tool result strings fed into LangGraph state to prevent context overflow.
+_MAX_TOOL_RESULT_CHARS = AGENT_CHAT_MAX_TOOL_RESULT_CHARS
+CHAT_WORKFLOW_NAME = "Flowcept LangGraph Chat"
+
+# Module-level saver — persists across requests keyed by thread_id.
+_memory = MemorySaver()
+
+
+def _format_error(exc: BaseException, _depth: int = 0) -> str:
+    """Return a user-facing error string, unwrapping ExceptionGroup to its real cause."""
+    if _depth > 5:
+        return str(exc) or type(exc).__name__
+    if hasattr(exc, "exceptions"):  # ExceptionGroup / BaseExceptionGroup (Python 3.11+)
+        inner = "; ".join(_format_error(sub, _depth + 1) for sub in exc.exceptions)
+        return (
+            f"A tool call failed ({inner}). "
+            "This may be a transient service error — try rephrasing your question "
+            "or narrowing the scope (e.g. add a workflow_id or campaign_id)."
+        )
+    if exc.__cause__ is not None:
+        return _format_error(exc.__cause__, _depth + 1)
+    return str(exc) or type(exc).__name__
+
+
+def _build_langchain_tools(context: Optional[Dict[str, Any]], allow_dashboard_edit: bool):
+    """Wrap MCP tools as LangChain tools."""
+    from langchain_core.tools import tool
+
+    def _run_mcp(tool_name: str, **kwargs) -> str:
+        return run_tool(tool_name, kwargs=kwargs)[0]
+
+    def _coerce_projection(p: Any) -> Optional[List[str]]:
+        """Accept a list of field names or a Mongo projection dict {field: 1}."""
+        if p is None:
+            return None
+        if isinstance(p, dict):
+            return [k for k, v in p.items() if v]
+        return list(p)
+
+    def _coerce_sort(s: Any) -> Optional[List[Dict[str, Any]]]:
+        """Accept [{field, order}] or a Mongo sort dict {field: -1}."""
+        if s is None:
+            return None
+        if isinstance(s, dict):
+            return [{"field": k, "order": v} for k, v in s.items()]
+        return list(s)
+
+    def _scoped_filter(filter: Optional[Dict[str, Any]]) -> Dict[str, Any]:
+        """Apply workflow/campaign scope from the HTTP context."""
+        scoped = dict(filter or {})
+        for key in ("workflow_id", "campaign_id"):
+            if (context or {}).get(key):
+                scoped[key] = context[key]
+        return scoped
+
+    @tool
+    def query_tasks(
+        filter: Optional[Dict[str, Any]] = None,
+        projection: Optional[Any] = None,
+        limit: int = 100,
+        sort: Optional[Any] = None,
+    ) -> str:
+        """Query task provenance records with a Mongo-style filter.
+
+        projection: list of field names, or a Mongo projection dict {"field": 1}.
+        sort: list of {"field": "...", "order": 1|-1}, or a Mongo sort dict {"field": -1}.
+        """
+        return _run_mcp(
+            "query_tasks",
+            filter=_scoped_filter(filter),
+            projection=_coerce_projection(projection),
+            limit=limit,
+            sort=_coerce_sort(sort),
+        )
+
+    @tool
+    def query_workflows(filter: Optional[Dict[str, Any]] = None, limit: int = 100) -> str:
+        """Query workflow provenance records with a Mongo-style filter."""
+        return _run_mcp("query_workflows", filter=_scoped_filter(filter), limit=limit)
+
+    @tool
+    def get_task_summary(filter: Optional[Dict[str, Any]] = None) -> str:
+        """Summarize tasks: status counts, per-activity durations, and time range."""
+        return _run_mcp("get_task_summary", filter=_scoped_filter(filter))
+
+    @tool
+    def list_campaigns(campaign_id: Optional[str] = None) -> str:
+        """List derived campaign summaries (campaigns group workflows and tasks).
+
+        campaign_id: when provided, returns only that campaign's summary.
+        Always pass the campaign_id from the user context to scope the result.
+        """
+        effective_id = campaign_id or (context or {}).get("campaign_id")
+        return _run_mcp("list_campaigns", campaign_id=effective_id)
+
+    @tool
+    def list_agents() -> str:
+        """List derived agent summaries (agents observed in task provenance).
+
+        Automatically scoped to the current workflow when workflow_id is in context.
+        """
+        workflow_id = (context or {}).get("workflow_id")
+        effective_filter = {"workflow_id": workflow_id} if workflow_id else None
+        return _run_mcp("list_agents", filter=effective_filter)
+
+    @tool
+    def make_chart(card_spec: Dict[str, Any]) -> str:
+        """Build a chart from a declarative dashboard card spec; the UI renders the result."""
+        scoped_spec = dict(card_spec)
+        data_spec = dict(scoped_spec.get("data") or {})
+        data_spec["filter"] = _scoped_filter(data_spec.get("filter"))
+        scoped_spec["data"] = data_spec
+        return _run_mcp("make_chart", card_spec=scoped_spec, context=None)
+
+    @tool
+    def highlight_lineage(
+        task_ids: Optional[Any] = None,
+        filter: Optional[Dict[str, Any]] = None,
+    ) -> str:
+        """Highlight the full provenance lineage (ancestors + descendants) of tasks in the Dataflow graph.
+
+        Pass `task_ids` as a list of task ID strings, or a single task ID string.
+        Or use `filter` to find the seed tasks first.
+        The UI will dim all other nodes and visually trace the lineage chain.
+        Always pass a workflow_id in the filter when on a workflow page.
+        """
+        wf_id = (context or {}).get("workflow_id")
+        ids: Optional[List[str]] = None
+        if task_ids is not None:
+            ids = [task_ids] if isinstance(task_ids, str) else list(task_ids)
+        return _run_mcp("highlight_lineage", task_ids=ids, filter=filter, workflow_id=wf_id)
+
+    def _query_text(query: Any) -> str:
+        if isinstance(query, str):
+            return query
+        return json.dumps(query, default=str)
+
+    @tool("generate_result_df")
+    def generate_result_df(query: Any) -> str:
+        """Answer questions about task execution using the in-memory tasks DataFrame.
+
+        Use for questions about WHAT HAPPENED during the workflow: activities, task inputs/outputs,
+        timing, telemetry, agent actions, configuration parameters passed as task inputs, task counts,
+        lineage, and execution order. Each DataFrame row is a task record.
+
+        Do NOT use for questions about the inherent properties of stored data artifacts (models,
+        datasets, files) — use generate_objects_df for those.
+        """
+        return _run_mcp("run_df_query", query=_query_text(query), plot=False, context_kind="tasks")
+
+    @tool("generate_plot_code")
+    def generate_plot_code(query: Any = None, card_spec: Optional[Dict[str, Any]] = None) -> str:
+        """Generate plotting output using the MCP server's in-memory task DataFrame."""
+        query_payload = query if query is not None else card_spec
+        return _run_mcp("run_df_query", query=_query_text(query_payload), plot=True, context_kind="tasks")
+
+    @tool
+    def extract_or_fix_python_code(raw_text: str, runtime_error: Optional[str] = None) -> str:
+        """Extract or repair pandas code using the MCP server's in-memory task DataFrame columns."""
+        return _run_mcp(
+            "extract_or_fix_python_code",
+            raw_text=raw_text,
+            runtime_error=runtime_error,
+            context_kind="tasks",
+        )
+
+    @tool
+    def get_workflow_context() -> str:
+        """Return the workflow record loaded in the agent's in-memory context (DF path counterpart to query_workflows).
+
+        Use this tool ONLY when the question is specifically about workflow-level metadata: workflow name,
+        campaign, start/end timestamps, owner/user, description, hardware, or workflow structure.
+        Do NOT call this tool for questions about tasks, activities, agents, data artifacts, or model parameters —
+        use generate_result_df or generate_objects_df for those instead.
+        """
+        return _run_mcp("get_workflow_context")
+
+    @tool
+    def query_objects(
+        filter: Optional[Dict[str, Any]] = None,
+        projection: Optional[Any] = None,
+        limit: int = 100,
+    ) -> str:
+        """Query stored data-object records (ML models, datasets, blobs) by their inherent properties.
+
+        Use when the question asks about WHAT AN ARTIFACT IS — e.g. model training technique,
+        optimizer, number of parameters or weights, purpose or designed uses, science domain, loss,
+        dataset sample count or split ratio, object type, file size, or any custom_metadata field.
+        Filter by ``workflow_id`` or ``object_type`` (``"ml_model"``, ``"dataset"``).
+        ``custom_metadata`` sub-fields use dot-notation, e.g. ``custom_metadata.model_profile.params``.
+
+        Do NOT use for questions about task execution — use query_tasks for those.
+        """
+        # Objects have no campaign_id field; scope by workflow_id only.
+        obj_filter = dict(filter or {})
+        if (context or {}).get("workflow_id"):
+            obj_filter["workflow_id"] = context["workflow_id"]
+        return _run_mcp(
+            "query_objects",
+            filter=obj_filter,
+            projection=_coerce_projection(projection),
+            limit=limit,
+        )
+
+    @tool("generate_objects_df")
+    def generate_objects_df(query: Any) -> str:
+        """Answer questions about the inherent properties of stored data artifacts using the objects DataFrame.
+
+        Use when the question asks about WHAT AN ARTIFACT IS or WHAT IT CONTAINS — not what task
+        processed it. Examples: model training technique (custom_metadata.finetuning_technique),
+        parameter count (custom_metadata.n_params or custom_metadata.model_profile.params),
+        purpose or designed uses (custom_metadata.task_type), science domain
+        (custom_metadata.science_domain), loss, dataset sample count or split ratio, object type,
+        file size, or any field stored in custom_metadata. Each DataFrame row is an object record
+        with fields like object_type, custom_metadata.*, file_path, and workflow_id.
+
+        Do NOT use for questions about task execution (who ran tasks, timing, agent actions, task
+        inputs) — use generate_result_df for those.
+        """
+        return _run_mcp("run_df_query", query=_query_text(query), plot=False, context_kind="objects")
+
+    db_tools = [
+        query_tasks,
+        query_workflows,
+        get_task_summary,
+        list_campaigns,
+        list_agents,
+        make_chart,
+        highlight_lineage,
+        query_objects,
+    ]
+    df_tools = [
+        generate_result_df,
+        generate_plot_code,
+        extract_or_fix_python_code,
+        get_workflow_context,
+        list_agents,
+        generate_objects_df,
+    ]
+    tool_context = (context or {}).get("tool_context", "db")
+    if tool_context == "df":
+        tools = df_tools
+    else:
+        tools = db_tools
+
+    if allow_dashboard_edit:
+
+        @tool
+        def get_dashboard(dashboard_id: str) -> str:
+            """Get a stored dashboard spec by id."""
+            return _run_mcp("get_dashboard", dashboard_id=dashboard_id)
+
+        @tool
+        def update_dashboard(dashboard_id: str, spec: Dict[str, Any]) -> str:
+            """Replace a stored dashboard spec with a complete revised spec."""
+            return _run_mcp("update_dashboard", dashboard_id=dashboard_id, spec=spec)
+
+        tools += [get_dashboard, update_dashboard]
+    return tools
+
+
+def _with_workflow_schema_context(context: Optional[Dict[str, Any]]) -> Optional[Dict[str, Any]]:
+    """Attach MCP-owned workflow schema context to chat context when available."""
+    if not context or not context.get("workflow_id"):
+        return context
+    enriched = dict(context)
+    try:
+        payload = json.loads(run_tool("get_workflow_schema_context", kwargs={"workflow_id": context["workflow_id"]})[0])
+        if payload.get("code", 500) < 400 and isinstance(payload.get("result"), dict):
+            enriched["workflow_schema_context"] = payload["result"].get("prompt_context")
+    except Exception:
+        return enriched
+    return enriched
+
+
+def _build_graph(llm, tools, agent_id: Optional[str] = None, require_first_tool: bool = False):
+    """Build a LangGraph agent + tools graph compiled with the module-level MemorySaver."""
+    bound = llm.bind_tools(tools)
+    first_bound = llm.bind_tools(tools, tool_choice="required") if require_first_tool else bound
+    tools_by_name = {t.name: t for t in tools}
+
+    def _needs_first_tool(state: MessagesState) -> bool:
+        return require_first_tool and not any(isinstance(message, ToolMessage) for message in state["messages"])
+
+    def _latest_user_text(state: MessagesState) -> str:
+        for message in reversed(state["messages"]):
+            if isinstance(message, HumanMessage):
+                return str(message.content)
+        return ""
+
+    def _tool_calls_for_text(text: str) -> List[Dict[str, Any]]:
+        lower = text.lower()
+        names = set(tools_by_name)
+        has_specific_value = any(marker in lower for marker in ("task_id", "object_id", "workflow_id"))
+        if "generate_result_df" in names and any(
+            word in lower for word in ("submit", "submitted", "producer", "produced")
+        ):
+            # Pattern B: general attribution — query starts with "which/what" (no specific lookup
+            # value) and asks about the agent. list_agents alone is sufficient.
+            if (
+                "list_agents" in names
+                and "agent" in lower
+                and not has_specific_value
+                and lower.strip().startswith(("which ", "what "))
+            ):
+                return [{"name": "list_agents", "args": {}, "id": str(uuid.uuid4())}]
+            query = (
+                text + "\nInterpret submission/producer questions through provenance dataflow: "
+                "find upstream task rows whose generated.* values match used.* values consumed by the target activity, "
+                "then return the upstream activity_id and agent_id. "
+                "For work-item submission, prefer producer tasks with generated list/dict descriptors that map to "
+                "target used identifiers or parameters; do not treat dataset/file/artifact producers as submitters "
+                "unless the user explicitly asks about data artifacts. "
+                "If the named value appears inside a list of dictionaries in a generated.* field, "
+                "extract the full matching dictionary and include its key-value fields."
+            )
+            tool_calls = [{"name": "generate_result_df", "args": {"query": query}, "id": str(uuid.uuid4())}]
+            if "list_agents" in names:
+                tool_calls.append({"name": "list_agents", "args": {}, "id": str(uuid.uuid4())})
+            return tool_calls
+        if "list_agents" in names and "agent" in lower and not has_specific_value:
+            return [{"name": "list_agents", "args": {}, "id": str(uuid.uuid4())}]
+        if "get_task_summary" in names and any(
+            phrase in lower
+            for phrase in (
+                "lineage",
+                "data flow",
+                "execution order",
+                "how many",
+                "count",
+                "summary",
+                "duration",
+            )
+        ):
+            return [{"name": "get_task_summary", "args": {}, "id": str(uuid.uuid4())}]
+        if "make_chart" in names and any(word in lower for word in ("plot", "chart", "graph")):
+            return [
+                {
+                    "name": "make_chart",
+                    "args": {
+                        "card_spec": {
+                            "chart_id": "chat-chart",
+                            "type": "chart",
+                            "title": text,
+                            "data": {
+                                "source": "tasks",
+                                "group_by": "activity_id",
+                                "metrics": [{"agg": "count"}],
+                            },
+                            "viz": {"kind": "bar"},
+                        }
+                    },
+                    "id": str(uuid.uuid4()),
+                }
+            ]
+        if "query_objects" in names and any(
+            phrase in lower for phrase in ("object type", "blob object", "artifact type", "object_type")
+        ):
+            return [{"name": "query_objects", "args": {}, "id": str(uuid.uuid4())}]
+        if "generate_objects_df" in names and any(
+            phrase in lower for phrase in ("object type", "blob object", "artifact type", "object_type")
+        ):
+            return [{"name": "generate_objects_df", "args": {"query": text}, "id": str(uuid.uuid4())}]
+        if "extract_or_fix_python_code" in names and ("fix" in lower or "python code" in lower or "dataframe" in lower):
+            return [{"name": "extract_or_fix_python_code", "args": {"raw_text": text}, "id": str(uuid.uuid4())}]
+        if "generate_plot_code" in names and any(word in lower for word in ("plot", "chart", "graph")):
+            return [{"name": "generate_plot_code", "args": {"query": text}, "id": str(uuid.uuid4())}]
+        if "generate_result_df" in names and any(word in lower for word in ("lineage", "execution order", "data flow")):
+            query = (
+                text
+                + "\nThe user is asking for workflow lineage/order. Return the ordered distinct activity_id values "
+                "from the workflow, using task timestamps or row order when timestamps are unavailable. "
+                "Include upstream, target, and downstream activities; do not answer only with metric-matching rows."
+            )
+            return [{"name": "generate_result_df", "args": {"query": query}, "id": str(uuid.uuid4())}]
+        if "generate_result_df" in names and "how many" in lower and any(w in lower for w in ("task", "tasks")):
+            query = (
+                text + "\nReturn a self-descriptive DataFrame, e.g. result = pd.DataFrame({'task_count': [len(df)]})"
+                " so the count is clearly labeled."
+            )
+            return [{"name": "generate_result_df", "args": {"query": query}, "id": str(uuid.uuid4())}]
+        if "generate_result_df" in names and any(
+            word in lower
+            for word in (
+                "activity",
+                "agent",
+                "count",
+                "how many",
+                "lineage",
+                "task",
+            )
+        ):
+            return [{"name": "generate_result_df", "args": {"query": text}, "id": str(uuid.uuid4())}]
+        if "query_workflows" in names and "workflow" in lower:
+            return [{"name": "query_workflows", "args": {}, "id": str(uuid.uuid4())}]
+        if "get_workflow_context" in names and any(word in lower for word in ("workflow", "workflows")):
+            # DF path: workflow records live in the MCP context object, not the tasks DataFrame.
+            # get_workflow_context is the DF-path counterpart to query_workflows.
+            return [{"name": "get_workflow_context", "args": {}, "id": str(uuid.uuid4())}]
+        if "generate_result_df" in names:
+            return [{"name": "generate_result_df", "args": {"query": text}, "id": str(uuid.uuid4())}]
+        return [{"name": next(iter(tools_by_name)), "args": {}, "id": str(uuid.uuid4())}]
+
+    def _enforce_first_tool(response: AIMessage, state: MessagesState) -> AIMessage:
+        if not _needs_first_tool(state):
+            return response
+        return AIMessage(content="", tool_calls=_tool_calls_for_text(_latest_user_text(state)))
+
+    if INSTRUMENTATION_ENABLED and agent_id is not None:
+        from flowcept.instrumentation.flowcept_agent_task import FlowceptLLM
+        from flowcept.instrumentation.task_capture import FlowceptTask
+
+        # workflow_id is resolved automatically from Flowcept.current_workflow_id
+        # which is set by the Flowcept context in run_chat.
+        instrumented_llm = FlowceptLLM(bound, agent_id=agent_id, return_response_object=True)
+
+        def call_model(state: MessagesState):
+            """Agent node: invoke the LLM with current messages (instrumented)."""
+            active_llm = (
+                FlowceptLLM(first_bound, agent_id=agent_id, return_response_object=True)
+                if _needs_first_tool(state)
+                else instrumented_llm
+            )
+            return {"messages": [_enforce_first_tool(active_llm.invoke(state["messages"]), state)]}
+
+        def call_tools(state: MessagesState):
+            """Tools node: execute all pending tool calls with provenance capture."""
+            last = state["messages"][-1]
+            tool_msgs = []
+            for tc in getattr(last, "tool_calls", []):
+                name = tc["name"]
+                args = tc.get("args") or {}
+                call_id = tc.get("id") or name
+                tool_fn = tools_by_name.get(name)
+                with FlowceptTask(
+                    activity_id=name,
+                    subtype=PROV_AGENT.AGENT_TOOL,
+                    used=sanitize_json_like(args, mongo_safe_keys=True),
+                    agent_id=agent_id,
+                ) as task:
+                    output = (
+                        tool_fn.invoke(args) if tool_fn is not None else json.dumps({"error": f"Unknown tool {name}"})
+                    )
+                    task.end(generated={"output": output[:500] if isinstance(output, str) else output})
+                if isinstance(output, str) and len(output) > _MAX_TOOL_RESULT_CHARS:
+                    output = output[:_MAX_TOOL_RESULT_CHARS] + f"... [truncated, {len(output)} chars total]"
+                tool_msgs.append(ToolMessage(content=output, tool_call_id=call_id, name=name))
+            return {"messages": tool_msgs}
+
+    else:
+
+        def call_model(state: MessagesState):
+            """Agent node: invoke the LLM with current messages."""
+            response = (first_bound if _needs_first_tool(state) else bound).invoke(state["messages"])
+            return {"messages": [_enforce_first_tool(response, state)]}
+
+        def call_tools(state: MessagesState):
+            """Tools node: execute all pending tool calls and return ToolMessages."""
+            last = state["messages"][-1]
+            tool_msgs = []
+            for tc in getattr(last, "tool_calls", []):
+                name = tc["name"]
+                args = tc.get("args") or {}
+                call_id = tc.get("id") or name
+                tool_fn = tools_by_name.get(name)
+                output = tool_fn.invoke(args) if tool_fn is not None else json.dumps({"error": f"Unknown tool {name}"})
+                if isinstance(output, str) and len(output) > _MAX_TOOL_RESULT_CHARS:
+                    output = output[:_MAX_TOOL_RESULT_CHARS] + f"... [truncated, {len(output)} chars total]"
+                tool_msgs.append(ToolMessage(content=output, tool_call_id=call_id, name=name))
+            return {"messages": tool_msgs}
+
+    def should_continue(state: MessagesState):
+        """Route to tools if the last AI message has tool calls; otherwise end."""
+        last = state["messages"][-1]
+        if isinstance(last, AIMessage) and getattr(last, "tool_calls", None):
+            return "tools"
+        return END
+
+    graph = StateGraph(MessagesState)
+    graph.add_node("agent", call_model)
+    graph.add_node("tools", call_tools)
+    graph.set_entry_point("agent")
+    graph.add_conditional_edges("agent", should_continue)
+    graph.add_edge("tools", "agent")
+    return graph.compile(checkpointer=_memory)
+
+
+def _prepare_input_messages(
+    messages: List[Dict[str, str]],
+    context: Optional[Dict[str, Any]],
+    thread_id: Optional[str],
+) -> List:
+    """Convert client messages to LangChain message objects.
+
+    When a stateful thread already has a checkpoint, only the new user messages
+    are returned (server owns history via MemorySaver).  For new threads and
+    stateless calls the full message list is returned with the system prompt
+    prepended.
+    """
+    config = {"configurable": {"thread_id": thread_id}} if thread_id else None
+    is_new_thread = config is None or _memory.get(config) is None
+
+    lc_messages = []
+    for m in messages:
+        role = m.get("role")
+        content = m.get("content", "")
+        lc_messages.append(AIMessage(content=content) if role == "assistant" else HumanMessage(content=content))
+
+    if is_new_thread:
+        lc_messages = [SystemMessage(content=build_chat_system_prompt(context))] + lc_messages
+
+    return lc_messages
+
+
+def run_chat(
+    llm,
+    messages: List[Dict[str, str]],
+    context: Optional[Dict[str, Any]] = None,
+    allow_dashboard_edit: bool = False,
+    thread_id: Optional[str] = None,
+) -> Generator[Dict[str, Any], None, None]:
+    """Run one chat turn as a generator of events backed by LangGraph + MemorySaver.
+
+    Yields dict events: ``{"event": "tool_call"|"tool_result"|"card"|"token"|"done"|"error", ...}``.
+
+    When *thread_id* is ``None`` the call is stateless (client manages full history in
+    *messages*).  When *thread_id* is provided the server owns history: pass only the
+    new message(s) in *messages* on follow-up turns.
+
+    Parameters
+    ----------
+    llm : Any
+        A langchain chat model (from ``build_llm_model``).
+    messages : list of dict
+        ``[{"role": "user"|"assistant", "content": "..."}]``.
+        Full history when *thread_id* is ``None``; only new messages otherwise.
+    context : dict, optional
+        UI context injected into the system prompt and chart tool.
+    allow_dashboard_edit : bool, optional
+        Whether dashboard-modifying tools are bound.
+    thread_id : str, optional
+        Stable ID that keys server-side conversation memory.
+    """
+    logger = FlowceptLogger()
+    context = _with_workflow_schema_context(context)
+    tools = _build_langchain_tools(context, allow_dashboard_edit)
+
+    effective_thread_id = thread_id if thread_id is not None else str(uuid.uuid4())
+
+    agent_id: Optional[str] = None
+    if INSTRUMENTATION_ENABLED:
+        from flowcept.flowceptor.consumers.agent.base_agent_context_manager import BaseAgentContextManager
+
+        agent_id = BaseAgentContextManager.agent_id or effective_thread_id
+
+    try:
+        llm.bind_tools(tools)
+    except (NotImplementedError, AttributeError):
+        logger.warning("Chat LLM does not support tool binding; answering without tools.")
+        from langchain_core.messages import SystemMessage as _SM
+
+        lc = [_SM(content=build_chat_system_prompt(context))] + [
+            AIMessage(content=m.get("content", ""))
+            if m.get("role") == "assistant"
+            else HumanMessage(content=m.get("content", ""))
+            for m in messages
+        ]
+        try:
+            response = llm.invoke(lc)
+            yield {"event": "token", "data": getattr(response, "content", str(response))}
+        except Exception as exc:
+            logger.exception(exc)
+            yield {"event": "error", "data": str(exc)}
+        yield {"event": "done"}
+        return
+
+    config = {
+        "configurable": {"thread_id": effective_thread_id},
+        "recursion_limit": MAX_TOOL_ITERATIONS * 2 + 2,
+    }
+
+    graph = _build_graph(
+        llm,
+        tools,
+        agent_id=agent_id,
+        require_first_tool=(context or {}).get("tool_context", "db") in {"db", "df"},
+    )
+    lc_messages = _prepare_input_messages(messages, context, thread_id)
+
+    # Each LangGraph execution gets its own Flowcept workflow so all AI model
+    # invocations and tool calls within this call share a single workflow_id.
+    # Chat owns its persistence lifecycle so HTTP requests, tests, and deployed
+    # webservice instances all record agent provenance without external state.
+    from flowcept.flowcept_api.flowcept_controller import Flowcept as _FC
+
+    with _FC(
+        workflow_name=CHAT_WORKFLOW_NAME,
+        start_persistence=True,
+        save_workflow=True,
+        agent_name="FlowceptAgent",
+    ):
+        accumulated_tool_results: List[str] = []
+        try:
+            for chunk in graph.stream({"messages": lc_messages}, config=config, stream_mode="updates"):
+                for node_name, node_output in chunk.items():
+                    msgs = node_output.get("messages", [])
+                    if node_name == "agent":
+                        last = msgs[-1] if msgs else None
+                        if last is None:
+                            continue
+                        tool_calls = getattr(last, "tool_calls", None) or []
+                        if tool_calls:
+                            for tc in tool_calls:
+                                yield {"event": "tool_call", "data": {"name": tc["name"], "args": tc.get("args", {})}}
+                        else:
+                            yield {"event": "token", "data": getattr(last, "content", "")}
+                            yield {"event": "done"}
+                    elif node_name == "tools":
+                        for tm in msgs:
+                            name = getattr(tm, "name", "")
+                            accumulated_tool_results.append(f"[{name}]: {tm.content[:2000]}")
+                            summary: Dict[str, Any] = {"name": name}
+                            try:
+                                parsed = json.loads(tm.content)
+                                summary["code"] = parsed.get("code")
+                                summary["tool_name"] = parsed.get("tool_name")
+                                if name == "make_chart" and isinstance(parsed.get("result"), dict):
+                                    yield {"event": "card", "data": parsed["result"]}
+                                if name == "highlight_lineage" and isinstance(parsed.get("result"), dict):
+                                    yield {"event": "ui:highlight", "data": parsed["result"]}
+                            except Exception:
+                                pass
+                            yield {"event": "tool_result", "data": summary}
+        except GraphRecursionError:
+            logger.warning(
+                f"LLM hit the tool-call recursion limit ({MAX_TOOL_ITERATIONS} iterations) "
+                "without producing a final answer. Synthesizing from accumulated tool results."
+            )
+            if accumulated_tool_results:
+                summary_prompt = (
+                    "The following tool results were retrieved. "
+                    "Write a concise final answer to the user's question based solely on this data. "
+                    "Do not call any tools.\n\n" + "\n\n".join(accumulated_tool_results)
+                )
+                try:
+                    response = llm.invoke([HumanMessage(content=summary_prompt)])
+                    content = getattr(response, "content", None) or str(response)
+                    if content:
+                        yield {"event": "token", "data": content}
+                    else:
+                        yield {"event": "token", "data": "\n\n".join(accumulated_tool_results[:3])}
+                except Exception as fallback_exc:
+                    logger.exception(fallback_exc)
+                    # Synthesis failed — surface raw tool results so the caller gets a 200
+                    yield {"event": "token", "data": "\n\n".join(accumulated_tool_results[:3])}
+            else:
+                yield {"event": "error", "data": "Reached tool call limit without retrieving any data."}
+            yield {"event": "done"}
+        except Exception as e:
+            logger.exception(e)
+            yield {"event": "error", "data": _format_error(e)}
diff --git a/src/flowcept/agents/data_query_tools/__init__.py b/src/flowcept/agents/data_query_tools/__init__.py
new file mode 100644
index 00000000..31e7bcf1
--- /dev/null
+++ b/src/flowcept/agents/data_query_tools/__init__.py
@@ -0,0 +1 @@
+"""Plain-Python tool cores — no framework (MCP/LangChain) imports."""
diff --git a/src/flowcept/agents/data_query_tools/dashboard_tools.py b/src/flowcept/agents/data_query_tools/dashboard_tools.py
new file mode 100644
index 00000000..c4ad9f72
--- /dev/null
+++ b/src/flowcept/agents/data_query_tools/dashboard_tools.py
@@ -0,0 +1,122 @@
+"""Dashboard agent tools: chart building and dashboard CRUD.
+
+Plain Python — no LangChain, no MCP, no webservice imports.
+These tools are used by the LangGraph chat agent and MCP server; framework
+wrappers live in their respective layers.
+"""
+
+from __future__ import annotations
+
+from datetime import datetime, timezone
+from typing import Any, Dict, List, Optional
+
+from flowcept.agents.tool_result import ToolResult
+from flowcept.commons.daos.docdb_dao.docdb_dao_utils import validate_filter as _validate_filter
+from flowcept.commons.flowcept_logger import FlowceptLogger
+from flowcept.commons.utils import normalize_docs
+from flowcept.flowcept_api.db_api import DBAPI
+
+
+def _guarded(tool_name: str):
+    """Decorator: validate filters, cap limits, and convert errors to ToolResult codes."""
+
+    def decorator(func):
+        def wrapper(*args, **kwargs):
+            try:
+                if "filter" in kwargs:
+                    _validate_filter(kwargs.get("filter"))
+                return func(*args, **kwargs)
+            except ValueError as e:
+                return ToolResult(code=400, result=str(e), tool_name=tool_name)
+            except Exception as e:
+                FlowceptLogger().exception(e)
+                return ToolResult(code=499, result=f"Error in {tool_name}: {e}", tool_name=tool_name)
+
+        wrapper.__name__ = func.__name__
+        wrapper.__doc__ = func.__doc__
+        return wrapper
+
+    return decorator
+
+
+def _normalize(docs: List[Dict]) -> List[Dict]:
+    return normalize_docs(docs)
+
+
+@_guarded("make_chart")
+def make_chart(card_spec: Dict[str, Any], context: Optional[Dict[str, Any]] = None) -> ToolResult:
+    """Build a chart card: resolve a declarative data binding into plottable rows.
+
+    Parameters
+    ----------
+    card_spec : dict
+        A dashboard chart spec with a ``data`` binding describing what to query.
+    context : dict, optional
+        Extra filter ANDed into the chart data filter (e.g., ``{"workflow_id": "..."}``).
+
+    Returns
+    -------
+    ToolResult
+        ``result`` holds ``{"chart": <spec>, "rows": [...], "count": int}``.
+    """
+    data_spec = card_spec.get("data")
+    if not data_spec:
+        return ToolResult(code=400, result="Chart spec must include a data binding.", tool_name="make_chart")
+    _validate_filter(data_spec.get("filter", {}))
+    if context:
+        _validate_filter(context)
+    resolved = DBAPI().resolve_chart_data(data_spec, context=context)
+    result = {"chart": card_spec, "rows": _normalize(resolved["rows"]), "count": resolved["count"]}
+    return ToolResult(code=301, result=result, tool_name="make_chart")
+
+
+@_guarded("get_dashboard")
+def get_dashboard(dashboard_id: str) -> ToolResult:
+    """Get a stored dashboard spec by id.
+
+    Parameters
+    ----------
+    dashboard_id : str
+        Dashboard identifier.
+
+    Returns
+    -------
+    ToolResult
+        ``result`` holds the dashboard spec dict, or a 404 message.
+    """
+    doc = DBAPI.get_dao_instance().get_dashboard(dashboard_id)
+    if doc is None:
+        return ToolResult(code=404, result=f"Dashboard not found: {dashboard_id}", tool_name="get_dashboard")
+    return ToolResult(code=301, result=doc, tool_name="get_dashboard")
+
+
+@_guarded("update_dashboard")
+def update_dashboard(dashboard_id: str, spec: Dict[str, Any]) -> ToolResult:
+    """Replace a stored dashboard spec, preserving id and creation time.
+
+    Parameters
+    ----------
+    dashboard_id : str
+        Dashboard identifier.
+    spec : dict
+        Full replacement dashboard spec.
+
+    Returns
+    -------
+    ToolResult
+        ``result`` holds the saved dashboard spec dict.
+    """
+    dao = DBAPI.get_dao_instance()
+    existing = dao.get_dashboard(dashboard_id)
+    if existing is None:
+        return ToolResult(code=404, result=f"Dashboard not found: {dashboard_id}", tool_name="update_dashboard")
+    _validate_filter(spec.get("context", {}))
+    for card in spec.get("charts", []):
+        if card.get("data"):
+            _validate_filter(card["data"].get("filter", {}))
+    spec["dashboard_id"] = dashboard_id
+    spec["created_at"] = existing.get("created_at")
+    spec["updated_at"] = datetime.now(timezone.utc).isoformat()
+    if not dao.save_dashboard(spec):
+        return ToolResult(code=500, result="Could not save dashboard.", tool_name="update_dashboard")
+    return ToolResult(code=301, result=spec, tool_name="update_dashboard")
diff --git a/src/flowcept/agents/tools/prov_tools.py b/src/flowcept/agents/data_query_tools/db_query_tools.py
similarity index 57%
rename from src/flowcept/agents/tools/prov_tools.py
rename to src/flowcept/agents/data_query_tools/db_query_tools.py
index 5105c0f1..f964359c 100644
--- a/src/flowcept/agents/tools/prov_tools.py
+++ b/src/flowcept/agents/data_query_tools/db_query_tools.py
@@ -10,16 +10,12 @@
 
 from typing import Any, Dict, List, Optional
 
-from datetime import datetime, timezone
-
-from flowcept.agents.agents_utils import ToolResult
+from flowcept.agents.tool_result import ToolResult
+from flowcept.agents.data_query_tools.tools_utils import query_runtime_retry
 from flowcept.commons.flowcept_logger import FlowceptLogger
 from flowcept.configs import AGENT_CHAT_MAX_QUERY_LIMIT
 from flowcept.flowcept_api.db_api import DBAPI
-from flowcept.webservice.schemas.dashboards import DashboardChart, DashboardSpec
-from flowcept.webservice.services import stats
-from flowcept.webservice.services.dashboard_store import get_dashboard_store
-from flowcept.webservice.services.serializers import normalize_docs
+from flowcept.commons.utils import normalize_docs
 
 ALLOWED_FILTER_OPERATORS = {
     "$and",
@@ -90,10 +86,51 @@ def wrapper(*args, **kwargs):
     return decorator
 
 
+_WORKFLOW_HEAVY_FIELDS = frozenset(
+    {
+        "machine_info",
+        "flowcept_settings",
+        "code_repository",
+        "conf",
+        "extra_metadata",
+        "environment_id",
+        "sys_name",
+        "interceptor_ids",
+        "adapter_id",
+        "flowcept_version",
+    }
+)
+
+
 def _normalize(docs: List[Dict]) -> List[Dict]:
     return normalize_docs(docs)
 
 
+def _normalize_workflows(docs: List[Dict]) -> List[Dict]:
+    """Normalize workflow docs, stripping heavy infrastructure-only fields for LLM responses."""
+    pruned = [{k: v for k, v in doc.items() if k not in _WORKFLOW_HEAVY_FIELDS} for doc in docs]
+    return normalize_docs(pruned)
+
+
+def _sanitize_projection(projection: Optional[List[str]]) -> Optional[List[str]]:
+    """Remove child paths whose parent field is already in *projection*.
+
+    MongoDB raises ``OperationFailure: Path collision`` when a projection
+    includes both ``"generated"`` and ``"generated.val_accuracy"``.  This
+    helper strips the redundant children so the parent field covers them.
+    """
+    if not projection:
+        return projection
+    result = []
+    for field in projection:
+        parts = field.split(".")
+        # keep this field only if none of its parent paths is already included
+        parent_already_included = any(".".join(parts[:i]) in projection for i in range(1, len(parts)))
+        if not parent_already_included:
+            result.append(field)
+    return result or None
+
+
 @_guarded("query_tasks")
 def query_tasks(
     filter: Optional[Dict[str, Any]] = None,
@@ -120,7 +157,27 @@ def query_tasks(
         ``result`` holds ``{"items": [...], "count": int}``.
     """
     sort_tuples = None if not sort else [(s["field"], s["order"]) for s in sort]
-    docs = DBAPI().task_query(filter=filter or {}, projection=projection, limit=limit, sort=sort_tuples) or []
+    proj_holder = [_sanitize_projection(projection)]
+
+    def _execute():
+        return (
+            DBAPI().task_query(
+                filter=filter or {},
+                projection=proj_holder[0],
+                limit=limit,
+                sort=sort_tuples,
+            )
+            or []
+        )
+
+    def _fix(exc, attempt):
+        # Only auto-fix MongoDB projection path-collision errors; let others propagate.
+        if "Path collision" not in str(exc):
+            raise exc
+        proj_holder[0] = _sanitize_projection(proj_holder[0])
+        return _execute
+
+    docs = query_runtime_retry(_execute, _fix, max_attempts=2)
     items = _normalize(docs)
     return ToolResult(code=301, result={"items": items, "count": len(items)}, tool_name="query_tasks")
 
@@ -142,7 +199,7 @@ def query_workflows(filter: Optional[Dict[str, Any]] = None, limit: int = 100) -
         ``result`` holds ``{"items": [...], "count": int}``.
     """
     docs = (DBAPI().workflow_query(filter=filter or {}) or [])[:limit]
-    items = _normalize(docs)
+    items = _normalize_workflows(docs)
     return ToolResult(code=301, result={"items": items, "count": len(items)}, tool_name="query_workflows")
 
 
@@ -160,61 +217,91 @@ def get_task_summary(filter: Optional[Dict[str, Any]] = None) -> ToolResult:
     ToolResult
         ``result`` holds the summary dict.
     """
-    summary = stats.task_summary(DBAPI(), filter or {})
+    summary = DBAPI().task_summary(filter or {})
+    activity_stats = summary.get("activity_stats") or []
+    summary["activity_ids"] = [row.get("activity_id") for row in activity_stats if row.get("activity_id")]
+    summary["activity_counts"] = {
+        row.get("activity_id"): row.get("count") for row in activity_stats if row.get("activity_id")
+    }
     return ToolResult(code=301, result=_normalize([summary])[0], tool_name="get_task_summary")
 
 
 @_guarded("list_campaigns")
-def list_campaigns() -> ToolResult:
+def list_campaigns(campaign_id: Optional[str] = None) -> ToolResult:
     """List derived campaign summaries (campaigns group workflows and tasks).
 
+    Parameters
+    ----------
+    campaign_id : str, optional
+        When provided, only the summary for that campaign is returned.
+        Pass the campaign_id from the user context to scope the result.
+
     Returns
     -------
     ToolResult
         ``result`` holds ``{"items": [...], "count": int}``.
     """
-    items = _normalize(stats.derive_campaigns(DBAPI()))
+    items = _normalize(DBAPI().derive_campaigns(campaign_id=campaign_id))
     return ToolResult(code=301, result={"items": items, "count": len(items)}, tool_name="list_campaigns")
 
 
 @_guarded("list_agents")
-def list_agents() -> ToolResult:
+def list_agents(filter: Dict = None) -> ToolResult:
     """List derived agent summaries (agents observed in task provenance).
 
+    Parameters
+    ----------
+    filter : dict, optional
+        Mongo-style filter to scope the agent derivation (e.g., ``{"workflow_id": "..."}``).
+
     Returns
     -------
     ToolResult
         ``result`` holds ``{"items": [...], "count": int}``.
     """
-    items = _normalize(stats.derive_agents(DBAPI()))
+    items = _normalize(DBAPI().derive_agents(filter))
     return ToolResult(code=301, result={"items": items, "count": len(items)}, tool_name="list_agents")
 
 
-@_guarded("make_chart")
-def make_chart(card_spec: Dict[str, Any], context: Optional[Dict[str, Any]] = None) -> ToolResult:
-    """Build a dashboard-style chart card: validate the spec and resolve its data rows.
+@_guarded("query_objects")
+def query_objects(
+    filter: Optional[Dict[str, Any]] = None,
+    projection: Optional[List[str]] = None,
+    limit: int = 100,
+) -> ToolResult:
+    """Query stored data-object provenance records with a Mongo-style filter.
+
+    Data objects include ML models (``object_type="ml_model"``), datasets
+    (``object_type="dataset"``), and generic blobs.  Their ``custom_metadata``
+    field carries artifact-specific information such as ``model_profile.params``,
+    ``n_input_neurons``, ``loss``, ``split_ratio``, and ``n_samples``.
+    Use this tool when the user asks about model parameters, dataset size, file
+    types, artifact sizes, or any stored artifact metadata.
 
     Parameters
     ----------
-    card_spec : dict
-        A dashboard ``DashboardChart`` spec (type chart/metric/table with a ``data`` binding).
-    context : dict, optional
-        Extra filter ANDed into the chart data filter (e.g., ``{"workflow_id": "..."}``).
+    filter : dict, optional
+        Mongo-style filter.  Common fields: ``object_type``, ``workflow_id``,
+        ``task_id``, ``tags``.  ``custom_metadata`` sub-fields use dot-notation,
+        e.g. ``{"custom_metadata.model_profile.params": {"$gt": 2}}``.
+    projection : list of str, optional
+        Fields to include (dot-notation accepted).
+    limit : int, optional
+        Maximum records (capped by settings).
 
     Returns
     -------
     ToolResult
-        ``result`` holds ``{"chart": <validated spec>, "rows": [...], "count": int}``.
+        ``result`` holds ``{"items": [...], "count": int}``.
     """
-    card = DashboardChart(**card_spec)
-    if card.data is None:
-        return ToolResult(code=400, result="Chart spec must include a data binding.", tool_name="make_chart")
-    validate_filter(card.data.filter)
-    if context:
-        validate_filter(context)
-    resolved = stats.resolve_chart_data(DBAPI(), card.data, context=context)
-    result = {"chart": card.model_dump(), "rows": _normalize(resolved["rows"]), "count": resolved["count"]}
-    return ToolResult(code=301, result=result, tool_name="make_chart")
+    capped = min(limit, MAX_QUERY_LIMIT)
+    docs = (DBAPI().blob_object_query(filter=filter or {}) or [])[:capped]
+    items = _normalize(docs)
+    if projection:
+        safe_proj = set(_sanitize_projection(projection) or [])
+        if safe_proj:
+            items = [{k: v for k, v in d.items() if k in safe_proj} for d in items]
+    return ToolResult(code=301, result={"items": items, "count": len(items)}, tool_name="query_objects")
 
 
 @_guarded("highlight_lineage")
@@ -257,64 +344,28 @@ def highlight_lineage(
     if not resolved_ids:
         return ToolResult(code=404, result="No tasks found for the given criteria.", tool_name="highlight_lineage")
 
-    # Return only the seed task IDs. The frontend BFS expands ancestors/descendants
+    # Fetch activity names for the resolved task IDs so the LLM can describe the lineage.
+    activity_map: Dict[str, str] = {}
+    try:
+        detail_docs = (
+            db.task_query(
+                filter={"task_id": {"$in": resolved_ids}},
+                projection=["task_id", "activity_id", "agent_id"],
+                limit=len(resolved_ids) + 10,
+            )
+            or []
+        )
+        for doc in detail_docs:
+            tid = doc.get("task_id", "")
+            if tid:
+                activity_map[tid] = doc.get("activity_id") or doc.get("agent_id") or ""
+    except Exception:
+        pass
+
+    # Return seed task IDs. The frontend BFS expands ancestors/descendants
     # from these seeds using the dataflow graph — a single source of truth for lineage.
     return ToolResult(
         code=301,
-        result={"task_ids": resolved_ids},
+        result={"task_ids": resolved_ids, "activities": activity_map},
         tool_name="highlight_lineage",
     )
-
-
-@_guarded("get_dashboard")
-def get_dashboard(dashboard_id: str) -> ToolResult:
-    """Get a stored dashboard spec by id.
-
-    Parameters
-    ----------
-    dashboard_id : str
-        Dashboard identifier.
-
-    Returns
-    -------
-    ToolResult
-        ``result`` holds the dashboard spec dict, or a 404 message.
-    """
-    doc = get_dashboard_store().get(dashboard_id)
-    if doc is None:
-        return ToolResult(code=404, result=f"Dashboard not found: {dashboard_id}", tool_name="get_dashboard")
-    return ToolResult(code=301, result=doc, tool_name="get_dashboard")
-
-
-@_guarded("update_dashboard")
-def update_dashboard(dashboard_id: str, spec: Dict[str, Any]) -> ToolResult:
-    """Replace a stored dashboard spec (validated), preserving id and creation time.
-
-    Parameters
-    ----------
-    dashboard_id : str
-        Dashboard identifier.
-    spec : dict
-        Full replacement ``DashboardSpec``.
-
-    Returns
-    -------
-    ToolResult
-        ``result`` holds the saved dashboard spec dict.
-    """
-    store = get_dashboard_store()
-    existing = store.get(dashboard_id)
-    if existing is None:
-        return ToolResult(code=404, result=f"Dashboard not found: {dashboard_id}", tool_name="update_dashboard")
-    validated = DashboardSpec(**spec)
-    validate_filter(validated.context)
-    for card in validated.cards:
-        if card.data is not None:
-            validate_filter(card.data.filter)
-    validated.dashboard_id = dashboard_id
-    validated.created_at = existing.get("created_at")
-    validated.updated_at = datetime.now(timezone.utc).isoformat()
-    doc = validated.model_dump()
-    if not store.save(doc):
-        return ToolResult(code=500, result="Could not save dashboard.", tool_name="update_dashboard")
-    return ToolResult(code=301, result=doc, tool_name="update_dashboard")
diff --git a/src/flowcept/agents/data_query_tools/df_query_tools.py b/src/flowcept/agents/data_query_tools/df_query_tools.py
new file mode 100644
index 00000000..963555f1
--- /dev/null
+++ b/src/flowcept/agents/data_query_tools/df_query_tools.py
@@ -0,0 +1,565 @@
+"""Plain-Python DF (DataFrame) query tools.
+
+Functions in this module operate on pandas DataFrames and do NOT import from the
+MCP framework (no ``@mcp_flowcept.tool()``). The MCP layer lives in
+``mcp_tools/df_query_mcp_tools.py``.
+"""
+
+import json
+from flowcept.agents.tool_result import ToolResult
+from flowcept.agents.llm.builders import build_llm_model
+from flowcept.agents.data_query_tools.tools_utils import query_runtime_retry
+from flowcept.commons.flowcept_logger import FlowceptLogger
+
+from flowcept.agents.data_query_tools.pandas_utils import (
+    load_saved_df,
+    safe_execute,
+    safe_json_parse,
+    normalize_output,
+    format_result_df,
+    summarize_df,
+)
+
+from flowcept.agents.prompts.df_query_prompts import (
+    build_plot_code_prompt,
+    extract_or_fix_json_code_prompt,
+    build_pandas_code_prompt,
+    build_dataframe_summarizer_prompt,
+    build_extract_or_fix_python_code_prompt,
+)
+
+EMPTY_DF_MESSAGE = "Current df is empty or null."
+
+
+def _call_llm(llm, prompt: str) -> str:
+    """Call an LLM with a string prompt and always return a plain string.
+
+    Handles both ``FlowceptLLM`` (whose ``invoke`` already returns ``str``)
+    and raw LangChain models (whose ``invoke`` returns an ``AIMessage``).
+    """
+    response = llm.invoke(prompt)
+    return response.content if hasattr(response, "content") else str(response)
+
+
+def run_df_query(
+    query: str,
+    df,
+    schema,
+    value_examples,
+    custom_user_guidance,
+    llm=None,
+    plot=False,
+    context_kind: str = "tasks",
+) -> ToolResult:
+    r"""Run a natural language query against a DataFrame.
+
+    Parameters
+    ----------
+    query : str
+        Natural language query or Python code snippet.
+    df : pandas.DataFrame
+        The DataFrame to query.
+    schema : dict
+        Schema of the DataFrame.
+    value_examples : dict
+        Example values for each field.
+    custom_user_guidance : list
+        Custom guidance strings from the user.
+    llm : callable, optional
+        LLM callable. Built from settings if None.
+    plot : bool, optional
+        If True, generate plotting code.
+    context_kind : str, optional
+        "tasks" or "objects".
+
+    Returns
+    -------
+    ToolResult
+    """
+    if df is None or not len(df):
+        return ToolResult(code=404, result=EMPTY_DF_MESSAGE)
+    if "save" in query:
+        return save_df(df, schema, value_examples)
+    if "result = df" in query:
+        return run_df_code(user_code=query, df=df)
+
+    if plot:
+        return generate_plot_code(
+            llm,
+            query,
+            schema,
+            value_examples,
+            df,
+            custom_user_guidance=custom_user_guidance,
+            context_kind=context_kind,
+        )
+    return generate_result_df(
+        llm,
+        query,
+        schema,
+        value_examples,
+        df,
+        custom_user_guidance=custom_user_guidance,
+        context_kind=context_kind,
+    )
+
+
+def execute_df_code(user_code: str, df) -> ToolResult:
+    """Execute externally generated pandas code against a DataFrame.
+
+    Parameters
+    ----------
+    user_code : str
+        Pandas code expected to assign output to ``result``.
+    df : pandas.DataFrame
+        DataFrame to execute against.
+
+    Returns
+    -------
+    ToolResult
+    """
+    if df is None or not len(df):
+        return ToolResult(code=404, result=EMPTY_DF_MESSAGE)
+    return run_df_code(user_code=user_code, df=df)
+
+
+def generate_plot_code(
+    llm,
+    query,
+    dynamic_schema,
+    value_examples,
+    df,
+    custom_user_guidance=None,
+    context_kind="tasks",
+) -> ToolResult:
+    """Generate DataFrame and plotting code from a natural language query using an LLM.
+
+    Parameters
+    ----------
+    llm : callable
+        LLM callable.
+    query : str
+        Natural language query.
+    dynamic_schema : dict
+        Schema of the DataFrame.
+    value_examples : dict
+        Example values.
+    df : pandas.DataFrame
+        The DataFrame.
+    custom_user_guidance : list, optional
+        Custom guidance strings.
+    context_kind : str, optional
+        "tasks" or "objects".
+
+    Returns
+    -------
+    ToolResult
+    """
+    if llm is None:
+        llm = build_llm_model()
+    plot_prompt = build_plot_code_prompt(
+        query,
+        dynamic_schema,
+        value_examples,
+        list(df.columns),
+        context_kind=context_kind,
+    )
+    try:
+        response = _call_llm(llm, plot_prompt)
+    except Exception as e:
+        return ToolResult(code=400, result=str(e), extra=plot_prompt)
+
+    result_code, plot_code, description = None, None, ""
+    try:
+        parsed = safe_json_parse(response)
+        result_code = parsed["result_code"]
+        plot_code = parsed["plot_code"]
+        description = parsed.get("description", "")
+    except (ValueError, KeyError):
+        tool_response = extract_or_fix_json_code(llm, response)
+        if tool_response.code != 201:
+            return ToolResult(code=499, result=tool_response.result)
+        try:
+            parsed = safe_json_parse(tool_response.result)
+            result_code = parsed.get("result_code")
+            plot_code = parsed.get("plot_code")
+            description = parsed.get("description", "")
+            if not result_code or not plot_code:
+                return ToolResult(
+                    code=405,
+                    result=f"Fixed JSON missing result_code or plot_code: {parsed}",
+                    extra=plot_prompt,
+                )
+        except ValueError as e:
+            return ToolResult(
+                code=405,
+                result=f"Tried to parse this as JSON: {tool_response.result}, but got Error: {e}",
+                extra=plot_prompt,
+            )
+    except Exception as e:
+        return ToolResult(code=499, result=str(e), extra=plot_prompt)
+
+    columns = list(df.columns)
+    code_holder = [result_code]
+    retry_count = [0]
+
+    def _execute():
+        return safe_execute(df, code_holder[0])
+
+    def _fix(exc, attempt):
+        tool_result = extract_or_fix_python_code(llm, code_holder[0], columns, runtime_error=str(exc))
+        if tool_result.code != 201:
+            raise RuntimeError(f"LLM could not fix the code: {tool_result.result}")
+        code_holder[0] = tool_result.result
+        retry_count[0] += 1
+        return _execute
+
+    try:
+        result_df = query_runtime_retry(_execute, _fix, max_attempts=3)
+        result_code = code_holder[0]
+    except Exception as e:
+        return ToolResult(code=406, result=str(e), extra={"retry_attempts": retry_count[0]})
+
+    try:
+        result_df = format_result_df(result_df)
+    except Exception as e:
+        return ToolResult(code=404, result=str(e))
+
+    return ToolResult(
+        code=301,
+        result={"result_df": result_df, "plot_code": plot_code, "result_code": result_code, "description": description},
+        tool_name="generate_plot_code",
+        extra={"retry_attempts": retry_count[0]},
+    )
+
+
+def generate_result_df(
+    llm,
+    query: str,
+    dynamic_schema,
+    example_values,
+    df,
+    custom_user_guidance=None,
+    attempt_fix=True,
+    summarize=True,
+    context_kind="tasks",
+) -> ToolResult:
+    """Generate a result DataFrame from a natural language query using an LLM.
+
+    Parameters
+    ----------
+    llm : callable
+        LLM callable. Built from settings if None.
+    query : str
+        Natural language query.
+    dynamic_schema : dict
+        Schema of the DataFrame.
+    example_values : dict
+        Example values.
+    df : pandas.DataFrame
+        The DataFrame to query.
+    custom_user_guidance : list, optional
+        Custom guidance strings.
+    attempt_fix : bool, optional
+        If True, attempt to fix invalid generated code.
+    summarize : bool, optional
+        If True, summarize the result.
+    context_kind : str, optional
+        "tasks" or "objects".
+
+    Returns
+    -------
+    ToolResult
+    """
+    _logger = FlowceptLogger()
+    if llm is None:
+        llm = build_llm_model()
+    try:
+        prompt = build_pandas_code_prompt(
+            query,
+            dynamic_schema,
+            example_values,
+            custom_user_guidance,
+            list(df.columns),
+            context_kind=context_kind,
+        )
+        response = _call_llm(llm, prompt)
+    except Exception as e:
+        return ToolResult(code=400, result=str(e), extra=prompt)
+
+    result_code = response
+    columns = list(df.columns)
+
+    code_holder = [result_code]
+    retry_count = [0]
+
+    def _execute():
+        return safe_execute(df, code_holder[0])
+
+    def _fix(exc, attempt):
+        if not attempt_fix:
+            raise exc
+        tool_result = extract_or_fix_python_code(llm, code_holder[0], columns, runtime_error=str(exc))
+        if tool_result.code != 201:
+            raise RuntimeError(f"LLM could not fix the code: {tool_result.result}")
+        code_holder[0] = tool_result.result
+        retry_count[0] += 1
+        return _execute
+
+    try:
+        result_df = query_runtime_retry(_execute, _fix, max_attempts=3)
+        result_code = code_holder[0]
+    except Exception as e:
+        return ToolResult(
+            code=405,
+            result=(f"Failed to execute after retries: ```python\n{code_holder[0]}```\nLast error: {e}"),
+            extra={
+                "generated_code": code_holder[0],
+                "exception": str(e),
+                "prompt": prompt,
+                "retry_attempts": retry_count[0],
+            },
+        )
+
+    try:
+        result_df = normalize_output(result_df)
+    except Exception as e:
+        return ToolResult(
+            code=504,
+            result="Failed to normalize output.",
+            extra={"generated_code": result_code, "exception": str(e), "prompt": prompt},
+        )
+
+    result_df = result_df.dropna(axis=1, how="all")
+
+    return_code = 301
+    summary, summary_error = None, None
+    if summarize:
+        try:
+            tool_result = summarize_result(
+                llm,
+                result_code,
+                result_df,
+                query,
+                dynamic_schema,
+                example_values,
+                list(df.columns),
+                context_kind=context_kind,
+            )
+            if tool_result.is_success():
+                return_code = 301
+                summary = tool_result.result
+            else:
+                return_code = 302
+                summary_error = tool_result.result
+        except Exception as e:
+            _logger.exception(e)
+            summary = ""
+            summary_error = str(e)
+            return_code = 303
+
+    try:
+        result_df_str = format_result_df(result_df)
+    except Exception as e:
+        return ToolResult(
+            code=405,
+            result="Failed to format output.",
+            extra={"generated_code": result_code, "exception": str(e), "prompt": prompt},
+        )
+
+    return ToolResult(
+        code=return_code,
+        result={
+            "result_code": result_code,
+            "result_df": result_df_str,
+            "result_df_markdown": result_df.to_markdown(index=False),
+            "summary": summary,
+            "summary_error": summary_error,
+        },
+        tool_name="generate_result_df",
+        extra={"prompt": prompt, "retry_attempts": retry_count[0]},
+    )
+
+
+def run_df_code(user_code: str, df) -> ToolResult:
+    """Execute user-provided Python code on a DataFrame and format the result.
+
+    Parameters
+    ----------
+    user_code : str
+        Python code string that operates on the DataFrame.
+    df : pandas.DataFrame
+        The input DataFrame.
+
+    Returns
+    -------
+    ToolResult
+    """
+    try:
+        result_df = safe_execute(df, user_code)
+    except Exception as e:
+        return ToolResult(code=405, result=f"Failed to run this as Python code: {user_code}. Got error {e}")
+
+    try:
+        result_df = normalize_output(result_df)
+    except Exception as e:
+        return ToolResult(code=405, result=str(e))
+
+    result_df = result_df.dropna(axis=1, how="all")
+    return ToolResult(
+        code=301,
+        result={"result_code": user_code, "result_df": format_result_df(result_df)},
+        tool_name="run_df_code",
+    )
+
+
+def extract_or_fix_python_code(llm, raw_text, current_fields, runtime_error: str = None) -> ToolResult:
+    """Extract or repair Python code from raw text using an LLM.
+
+    Parameters
+    ----------
+    llm : callable
+        LLM callable.
+    raw_text : str
+        Raw text possibly containing Python code.
+    current_fields : list
+        Available DataFrame column names.
+    runtime_error : str, optional
+        Exception message from a previous execution attempt.  When provided,
+        the LLM is explicitly asked to fix that runtime error.
+
+    Returns
+    -------
+    ToolResult
+    """
+    prompt = build_extract_or_fix_python_code_prompt(raw_text, current_fields, runtime_error=runtime_error)
+    try:
+        response = _call_llm(llm, prompt)
+        return ToolResult(code=201, result=response)
+    except Exception as e:
+        return ToolResult(code=499, result=str(e))
+
+
+def extract_or_fix_json_code(llm, raw_text) -> ToolResult:
+    """Extract or repair JSON code from raw text using an LLM.
+
+    Parameters
+    ----------
+    llm : callable
+        LLM callable.
+    raw_text : str
+        Raw text possibly containing JSON.
+
+    Returns
+    -------
+    ToolResult
+    """
+    prompt = extract_or_fix_json_code_prompt(raw_text)
+    try:
+        response = _call_llm(llm, prompt)
+        return ToolResult(code=201, result=response)
+    except Exception as e:
+        return ToolResult(code=499, result=str(e))
+
+
+def summarize_result(
+    llm,
+    code,
+    result,
+    query: str,
+    dynamic_schema,
+    example_values,
+    current_fields,
+    context_kind="tasks",
+) -> ToolResult:
+    """Summarize a pandas result with local reduction for large DataFrames.
+
+    Parameters
+    ----------
+    llm : callable
+        LLM callable.
+    code : str
+        The pandas code that produced the result.
+    result : pandas.DataFrame
+        The result DataFrame.
+    query : str
+        The original user query.
+    dynamic_schema : dict
+        Schema of the DataFrame.
+    example_values : dict
+        Example values.
+    current_fields : list
+        Current DataFrame column names.
+    context_kind : str, optional
+        "tasks" or "objects".
+
+    Returns
+    -------
+    ToolResult
+    """
+    summarized_df = summarize_df(result, code)
+    prompt = build_dataframe_summarizer_prompt(
+        code,
+        summarized_df,
+        dynamic_schema,
+        example_values,
+        query,
+        current_fields,
+        context_kind=context_kind,
+    )
+    try:
+        response = _call_llm(llm, prompt)
+        return ToolResult(code=201, result=response)
+    except Exception as e:
+        return ToolResult(code=400, result=str(e))
+
+
+def save_df(df, schema, value_examples) -> ToolResult:
+    """Save a DataFrame, its schema, and example values to temporary files.
+
+    Parameters
+    ----------
+    df : pandas.DataFrame
+        The DataFrame to save.
+    schema : dict
+        Schema dict.
+    value_examples : dict
+        Example values dict.
+
+    Returns
+    -------
+    ToolResult
+    """
+    with open("/tmp/current_tasks_schema.json", "w") as f:
+        json.dump(schema, f, indent=2)
+    with open("/tmp/value_examples.json", "w") as f:
+        json.dump(value_examples, f, indent=2)
+    df.to_csv("/tmp/current_agent_df.csv", index=False)
+    return ToolResult(code=201, result="Saved df and schema to /tmp directory")
+
+
+def query_on_saved_df(query: str, dynamic_schema_path, value_examples_path, df_path):
+    """Run a natural language query against a saved DataFrame.
+
+    Parameters
+    ----------
+    query : str
+        Natural language query.
+    dynamic_schema_path : str
+        Path to a JSON schema file.
+    value_examples_path : str
+        Path to a JSON example values file.
+    df_path : str
+        Path to the saved DataFrame CSV file.
+
+    Returns
+    -------
+    ToolResult
+    """
+    df = load_saved_df(df_path)
+    with open(dynamic_schema_path) as f:
+        dynamic_schema = json.load(f)
+    with open(value_examples_path) as f:
+        value_examples = json.load(f)
+    llm = build_llm_model()
+    return generate_result_df(llm, query, dynamic_schema, value_examples, df, attempt_fix=False, summarize=False)
diff --git a/src/flowcept/agents/tools/in_memory_queries/pandas_agent_utils.py b/src/flowcept/agents/data_query_tools/pandas_utils.py
similarity index 89%
rename from src/flowcept/agents/tools/in_memory_queries/pandas_agent_utils.py
rename to src/flowcept/agents/data_query_tools/pandas_utils.py
index 86cf0f71..92463495 100644
--- a/src/flowcept/agents/tools/in_memory_queries/pandas_agent_utils.py
+++ b/src/flowcept/agents/data_query_tools/pandas_utils.py
@@ -73,6 +73,9 @@ def normalize_output(result):
         else:
             raise ValueError(f"Unsupported ndarray shape: {result.shape}")
 
+    elif isinstance(result, dict):
+        _df = pd.DataFrame([result])
+
     else:
         raise TypeError(f"Unsupported result type: {type(result)}")
 
@@ -216,6 +219,11 @@ def clean_code(text):
     """
     Extracts the first valid Python code block or line that starts with 'result =' from a model response.
 
+    Handles:
+    - Fenced code blocks (```python ... ```)
+    - Multi-line code with intermediate variable assignments before result = ...
+    - Single-line result = ... statements
+
     Parameters
     ----------
     text : str
@@ -231,7 +239,26 @@ def clean_code(text):
     if block_match:
         return block_match.group(1).strip()
 
-    # Fallback: try to find a line that starts with "result ="
+    # Scan for consecutive Python-looking lines starting from the first identifier assignment.
+    # This handles multi-line code with intermediate variables (e.g., per_act = ...; result = ...).
+    code_lines = []
+    in_code = False
+    for line in text.strip().splitlines():
+        stripped = line.strip()
+        if not in_code and re.match(r"^[a-zA-Z_]\w*\s*=", stripped):
+            in_code = True
+        if in_code:
+            code_lines.append(line)
+    if code_lines:
+        candidate = "\n".join(code_lines).strip()
+        try:
+            compile(candidate, "<string>", "exec")
+            if "result" in candidate:
+                return candidate
+        except SyntaxError:
+            pass
+
+    # Single-line fallback for prose+code responses where only the first assignment matters
     line_match = re.search(r"(result\s*=\s*.+)", text)
     if line_match:
         return line_match.group(1).strip()
diff --git a/src/flowcept/agents/data_query_tools/tools_utils.py b/src/flowcept/agents/data_query_tools/tools_utils.py
new file mode 100644
index 00000000..654ced47
--- /dev/null
+++ b/src/flowcept/agents/data_query_tools/tools_utils.py
@@ -0,0 +1,50 @@
+"""Shared retry loop for query runtime errors.
+
+Covers only errors raised when *executing* a generated query — pandas runtime
+errors for the DF path and MongoDB OperationFailure for the DB path.
+
+Out of scope: JSON/code parse errors, LLM output format errors, network errors,
+auth errors, and schema validation errors.
+"""
+
+
+def query_runtime_retry(execute_fn, fix_fn, max_attempts: int = 3):
+    """Run *execute_fn*; on runtime error call *fix_fn* to get a corrected
+    callable and retry, up to *max_attempts* total attempts.
+
+    Parameters
+    ----------
+    execute_fn : callable
+        Parameterless callable that executes the query.  Returns a value on
+        success; raises an exception on query runtime error.
+    fix_fn : callable(exc, attempt) -> new_execute_fn
+        Called with the caught exception and the zero-based attempt index.
+        Must return a new (or updated) parameterless callable that re-runs the
+        corrected query.  Raise from *fix_fn* to signal that the error is
+        unrecoverable — no further retries will be made.
+    max_attempts : int, optional
+        Total number of attempts, including the first.  Default is 3.
+
+    Returns
+    -------
+    object
+        Whatever the first successful *execute_fn* call returns.
+
+    Raises
+    ------
+    Exception
+        Re-raises the last caught exception when all attempts are exhausted or
+        *fix_fn* itself raises.
+    """
+    last_exc = None
+    for attempt in range(max_attempts):
+        try:
+            return execute_fn()
+        except Exception as exc:
+            last_exc = exc
+            if attempt < max_attempts - 1:
+                try:
+                    execute_fn = fix_fn(exc, attempt)
+                except Exception:
+                    break
+    raise last_exc
diff --git a/src/flowcept/agents/gui/README.md b/src/flowcept/agents/gui/README.md
new file mode 100644
index 00000000..4e7ddedb
--- /dev/null
+++ b/src/flowcept/agents/gui/README.md
@@ -0,0 +1,11 @@
+# Deprecated GUI
+
+This module is deprecated.
+
+Flowcept UI work has moved to the web UI under `src/flowcept/webservice/`.
+That UI includes the chat interface and is the place for current and future
+user-facing interaction work.
+
+Keep this package only for legacy reference while the old Streamlit agent GUI
+is retired.
+
diff --git a/src/flowcept/agents/gui/gui_utils.py b/src/flowcept/agents/gui/gui_utils.py
index 0596abf1..838fa283 100644
--- a/src/flowcept/agents/gui/gui_utils.py
+++ b/src/flowcept/agents/gui/gui_utils.py
@@ -10,8 +10,8 @@
 import streamlit as st
 from flowcept.agents.gui import AI
 from flowcept.agents import prompt_handler
-from flowcept.agents.agent_client import run_tool
-from flowcept.agents.agents_utils import ToolResult
+from flowcept.agents.mcp.mcp_client import run_tool
+from flowcept.agents.tool_result import ToolResult
 
 
 from flowcept.agents.gui.audio_utils import _md_to_plain_text, speak
diff --git a/src/flowcept/agents/llm/__init__.py b/src/flowcept/agents/llm/__init__.py
new file mode 100644
index 00000000..c124df5d
--- /dev/null
+++ b/src/flowcept/agents/llm/__init__.py
@@ -0,0 +1 @@
+"""LLM infrastructure for the Flowcept agent subsystem."""
diff --git a/src/flowcept/agents/llm/builders.py b/src/flowcept/agents/llm/builders.py
new file mode 100644
index 00000000..80d9ddd4
--- /dev/null
+++ b/src/flowcept/agents/llm/builders.py
@@ -0,0 +1,113 @@
+"""LLM factory and message normalization utilities."""
+
+import os
+import re
+import unicodedata
+
+from flowcept.flowceptor.consumers.agent.base_agent_context_manager import BaseAgentContextManager
+from flowcept.instrumentation.flowcept_agent_task import FlowceptLLM, get_current_context_task
+from flowcept.configs import AGENT
+
+
+def build_llm_model(
+    model_name=None,
+    model_kwargs=None,
+    service_provider=None,
+    agent_id=BaseAgentContextManager.agent_id,
+    track_tools=True,
+    return_response_object=False,
+) -> FlowceptLLM:
+    """Build and return an LLM instance using agent configuration.
+
+    Returns
+    -------
+    FlowceptLLM
+        An initialized LLM object configured using the ``AGENT`` settings.
+    """
+    _model_kwargs = (AGENT.get("model_kwargs") or {}).copy()
+    if model_kwargs is not None:
+        for k in model_kwargs:
+            _model_kwargs[k] = model_kwargs[k]
+
+    if "model" not in _model_kwargs:
+        _model_kwargs["model"] = AGENT.get("model", model_name)
+
+    if service_provider:
+        _service_provider = service_provider
+    else:
+        _service_provider = AGENT.get("service_provider")
+
+    if _service_provider == "sambanova":
+        from langchain_community.llms.sambanova import SambaStudio
+
+        os.environ["SAMBASTUDIO_URL"] = os.environ.get("SAMBASTUDIO_URL", AGENT.get("llm_server_url"))
+        os.environ["SAMBASTUDIO_API_KEY"] = os.environ.get("SAMBASTUDIO_API_KEY", AGENT.get("api_key"))
+
+        llm = SambaStudio(model_kwargs=_model_kwargs)
+    elif _service_provider == "azure":
+        from langchain_openai.chat_models.azure import AzureChatOpenAI
+
+        api_key = os.environ.get("AZURE_OPENAI_API_KEY", AGENT.get("api_key", None))
+        service_url = os.environ.get("AZURE_OPENAI_API_ENDPOINT", AGENT.get("llm_server_url", None))
+        llm = AzureChatOpenAI(
+            azure_deployment=_model_kwargs.get("model"), azure_endpoint=service_url, api_key=api_key, **_model_kwargs
+        )
+    elif _service_provider == "openai":
+        from langchain_openai import ChatOpenAI
+
+        api_key = os.environ.get("OPENAI_API_KEY", AGENT.get("api_key", None))
+        base_url = os.environ.get("OPENAI_BASE_URL", AGENT.get("llm_server_url") or None)
+        org = os.environ.get("OPENAI_ORG_ID", AGENT.get("organization", None))
+
+        init_kwargs = {"api_key": api_key}
+        if base_url:
+            init_kwargs["base_url"] = base_url
+        if org:
+            init_kwargs["organization"] = org
+
+        llm = ChatOpenAI(**init_kwargs, **_model_kwargs)
+    elif _service_provider == "google":
+        if "claude" in _model_kwargs["model"]:
+            api_key = os.environ.get("GOOGLE_API_KEY", AGENT.get("api_key", None))
+            _model_kwargs["model_id"] = _model_kwargs.pop("model")
+            _model_kwargs["google_token_auth"] = api_key
+            from flowcept.agents.llm.providers.claude_gcp import ClaudeOnGCPLLM
+
+            llm = ClaudeOnGCPLLM(**_model_kwargs)
+        elif "gemini" in _model_kwargs["model"]:
+            from flowcept.agents.llm.providers.gemini25 import Gemini25LLM
+
+            llm = Gemini25LLM(**_model_kwargs)
+    else:
+        raise Exception("Currently supported providers are sambanova, openai, azure, and google.")
+
+    if track_tools:
+        llm = FlowceptLLM(llm, return_response_object=return_response_object)
+        if agent_id is None:
+            agent_id = BaseAgentContextManager.agent_id
+        llm.agent_id = agent_id
+        tool_task = get_current_context_task()
+        if tool_task:
+            llm.parent_task_id = tool_task.task_id
+    return llm
+
+
+def normalize_message(user_msg: str) -> str:
+    """Normalize a user message into a canonical, comparison-friendly form.
+
+    Parameters
+    ----------
+    user_msg : str
+        Raw user input message.
+
+    Returns
+    -------
+    str
+        Normalized message suitable for matching, comparison, or hashing.
+    """
+    user_msg = user_msg.strip()
+    user_msg = unicodedata.normalize("NFKC", user_msg)
+    user_msg = user_msg.replace("–", "-").replace("—", "-")
+    user_msg = re.sub(r"\s+", " ", user_msg)
+    user_msg = re.sub(r"[?!.\s]+$", "", user_msg)
+    return user_msg.lower()
diff --git a/src/flowcept/agents/llm/providers/__init__.py b/src/flowcept/agents/llm/providers/__init__.py
new file mode 100644
index 00000000..e9ee9706
--- /dev/null
+++ b/src/flowcept/agents/llm/providers/__init__.py
@@ -0,0 +1 @@
+"""LLM provider wrappers (Claude on GCP, Gemini 2.5)."""
diff --git a/src/flowcept/agents/llms/claude_gcp.py b/src/flowcept/agents/llm/providers/claude_gcp.py
similarity index 100%
rename from src/flowcept/agents/llms/claude_gcp.py
rename to src/flowcept/agents/llm/providers/claude_gcp.py
diff --git a/src/flowcept/agents/llms/gemini25.py b/src/flowcept/agents/llm/providers/gemini25.py
similarity index 100%
rename from src/flowcept/agents/llms/gemini25.py
rename to src/flowcept/agents/llm/providers/gemini25.py
diff --git a/src/flowcept/agents/llms/__init__.py b/src/flowcept/agents/llms/__init__.py
deleted file mode 100644
index 49212d57..00000000
--- a/src/flowcept/agents/llms/__init__.py
+++ /dev/null
@@ -1 +0,0 @@
-"""LLMs subpackage."""
diff --git a/src/flowcept/agents/mcp/__init__.py b/src/flowcept/agents/mcp/__init__.py
new file mode 100644
index 00000000..533cb8f5
--- /dev/null
+++ b/src/flowcept/agents/mcp/__init__.py
@@ -0,0 +1 @@
+"""MCP server, client, and tool adapters for the Flowcept agent."""
diff --git a/src/flowcept/agents/flowcept_ctx_manager.py b/src/flowcept/agents/mcp/context_manager.py
similarity index 66%
rename from src/flowcept/agents/flowcept_ctx_manager.py
rename to src/flowcept/agents/mcp/context_manager.py
index 8a974496..9bfade01 100644
--- a/src/flowcept/agents/flowcept_ctx_manager.py
+++ b/src/flowcept/agents/mcp/context_manager.py
@@ -1,9 +1,27 @@
-from flowcept.agents.dynamic_schema_tracker import DynamicSchemaTracker
-from flowcept.agents.tools.in_memory_queries.pandas_agent_utils import load_saved_df
+from contextlib import asynccontextmanager
+
+from flowcept.agents.provenance_schema_manager.context_schema_manager import ContextSchemaManager
+from flowcept.agents.provenance_schema_manager.static_schema_builder import (
+    SCHEMA_CONTEXT,
+    assert_schema_documented,
+    build_schema_context,
+)
+from flowcept.agents.data_query_tools.pandas_utils import load_saved_df
 from flowcept.commons.flowcept_dataclasses.task_object import TaskObject
+from flowcept.commons.flowcept_dataclasses.workflow_object import WorkflowObject
+from flowcept.commons.flowcept_dataclasses.agent_object import AgentObject
+from flowcept.commons.flowcept_dataclasses.blob_object import BlobObject
+from flowcept.commons.task_data_preprocess import (
+    TelemetrySummary,
+    CpuSummary,
+    MemorySummary,
+    DiskSummary,
+    NetworkSummary,
+    summarize_task,
+)
 from flowcept.commons.flowcept_logger import FlowceptLogger
-from flowcept.commons.vocabulary import Status
-from flowcept.configs import AGENT
+from flowcept.commons.vocabulary import PROV_AGENT
+from flowcept.configs import AGENT, AGENT_HOST, AGENT_PORT
 from mcp.server.fastmcp import FastMCP
 
 import json
@@ -15,8 +33,6 @@
 
 from flowcept.flowceptor.consumers.agent.base_agent_context_manager import BaseAgentContextManager, BaseAppContext
 
-from flowcept.commons.task_data_preprocess import summarize_task
-
 
 AGENT_DEBUG = AGENT.get("debug", False)
 
@@ -64,6 +80,7 @@ def reset_context(self):
         self.objects_df = pd.DataFrame()
         self.objects_schema = {}
         self.objects_value_examples = {}
+        self.workflow_schema_cache = {}
 
         if AGENT_DEBUG:
             from flowcept.commons.flowcept_logger import FlowceptLogger
@@ -105,12 +122,43 @@ class FlowceptAgentContextManager(BaseAgentContextManager):
     def __init__(self):
         self.context = FlowceptAppContext()
         self.tracker_config = dict(max_examples=3, max_str_len=50)
-        self.schema_tracker = DynamicSchemaTracker(**self.tracker_config)
-        self.objects_schema_tracker = DynamicSchemaTracker(**self.tracker_config)
+        self.schema_manager = ContextSchemaManager(self.context, self.tracker_config)
+        self._seen_activities: dict = {}
         self.msgs_counter = 0
         self.context_chunk_size = 1  # Should be in the settings
         super().__init__(allow_mq_disabled=True)
 
+    def reset_context(self):
+        """Reset MCP runtime context and workflow-scoped schema trackers."""
+        self.context.reset_context()
+        self.schema_manager.reset()
+        self._seen_activities = {}
+        self.msgs_counter = 0
+
+    @asynccontextmanager
+    async def lifespan(self, app):
+        """Start schema assertions before the MCP server begins serving requests.
+
+        Validates that all domain-class fields have attribute docstrings, then
+        populates ``SCHEMA_CONTEXT`` for use by prompt builders. Raises
+        ``SchemaDocumentationError`` loudly so the server refuses to start when
+        any field is undocumented.
+        """
+        assert_schema_documented(
+            TaskObject,
+            WorkflowObject,
+            AgentObject,
+            BlobObject,
+            TelemetrySummary,
+            CpuSummary,
+            MemorySummary,
+            DiskSummary,
+            NetworkSummary,
+        )
+        SCHEMA_CONTEXT.update(build_schema_context())
+        async with super().lifespan(app) as ctx:
+            yield ctx
+
     def message_handler(self, msg_obj: Dict):
         """
         Handle an incoming message and update context accordingly.
@@ -127,21 +175,28 @@ def message_handler(self, msg_obj: Dict):
         """
         msg_type = msg_obj.get("type", None)
         if msg_type == "workflow":
-            # Preserve an explicitly loaded workflow when the agent registers its own runtime workflow.
-            if msg_obj.get("name") == "flowcept_agent_workflow" and self.context.workflow_msg_obj:
-                self.logger.info("Ignoring agent runtime workflow; keeping loaded workflow context.")
+            # Preserve the user-loaded workflow when the agent/chat runtime emits its own workflow.
+            # Compare workflow_ids: if we have a loaded workflow and the incoming message belongs to
+            # a different workflow, ignore it so runtime chat/agent workflows never overwrite the
+            # explicitly loaded provenance workflow.
+            loaded_wf_id = (self.context.workflow_msg_obj or {}).get("workflow_id")
+            incoming_wf_id = msg_obj.get("workflow_id")
+            if loaded_wf_id and incoming_wf_id and loaded_wf_id != incoming_wf_id:
+                self.logger.info("Ignoring runtime workflow (different workflow_id); keeping loaded workflow context.")
                 return True
             self.context.workflow_msg_obj = msg_obj
+            if WorkflowObject.from_dict(msg_obj).workflow_is_finished():
+                self.schema_manager.persist_workflow_schema_snapshot(msg_obj.get("workflow_id"))
             return True
 
         if msg_type == "object":
             self.context.objects.append(msg_obj)
-            self.update_objects_schema_and_add_to_df(objects=[msg_obj])
+            self.schema_manager.update_objects_schema_and_add_to_df(objects=[msg_obj])
             return True
 
         if msg_type == "task":
             task_msg = TaskObject.from_dict(msg_obj)
-            if task_msg.subtype == "llm_task" and task_msg.agent_id == self.agent_id:
+            if task_msg.subtype == PROV_AGENT.AI_MODEL_INVOCATION and task_msg.agent_id == self.agent_id:
                 self.logger.info(f"Going to ignore our own LLM messages: {task_msg}")
                 return True
 
@@ -158,47 +213,18 @@ def message_handler(self, msg_obj: Dict):
                         FlowceptTask(
                             agent_id=self.agent_id,
                             generated={"msg": "Provenance Agent reset context."},
-                            subtype="agent_task",
+                            subtype=PROV_AGENT.AGENT_TOOL,
                             activity_id="reset_user_context",
                         ).send()
                     return True
                 elif task_msg.activity_id == "provenance_query":
-                    self.logger.info("Received a prov query message!")
-                    query_text = task_msg.used.get("query")
-                    from flowcept.agents import ToolResult
-                    from flowcept.agents.tools.general_tools import prompt_handler
-                    from flowcept.agents.agent_client import run_tool
-
-                    resp = run_tool(tool_name=prompt_handler, kwargs={"message": query_text})[0]
-
-                    try:
-                        error = None
-                        status = Status.FINISHED
-                        tool_result = ToolResult(**json.loads(resp))
-                        if tool_result.result_is_str():
-                            generated = {"text": tool_result.result}
-                        else:
-                            generated = tool_result.result
-                    except Exception as e:
-                        status = Status.ERROR
-                        error = f"Could not convert the following into a ToolResult:\n{resp}\nException: {e}"
-                        generated = {"text": str(resp)}
-                    if self._mq_dao is None:
-                        self.logger.warning("MQ is disabled; skipping provenance_query response message.")
-                    else:
-                        FlowceptTask(
-                            agent_id=self.agent_id,
-                            generated=generated,
-                            stderr=error,
-                            status=status,
-                            subtype="agent_task",
-                            activity_id="provenance_query_response",
-                        ).send()
-
+                    self.logger.info(
+                        "Ignoring legacy provenance_query task; explicit workflow query tools are used instead."
+                    )
                     return True
 
             elif (
-                task_msg.subtype == "agent_task"
+                task_msg.subtype == PROV_AGENT.AGENT_TOOL
                 and task_msg.agent_id is not None
                 and task_msg.agent_id == self.agent_id
             ):
@@ -219,7 +245,7 @@ def message_handler(self, msg_obj: Dict):
                     f"Going to add to index! {(self.msgs_counter - self.context_chunk_size, self.msgs_counter)}"
                 )
                 try:
-                    self.update_schema_and_add_to_df(
+                    self.schema_manager.update_schema_and_add_to_df(
                         tasks=self.context.task_summaries[
                             self.msgs_counter - self.context_chunk_size : self.msgs_counter
                         ]
@@ -231,42 +257,29 @@ def message_handler(self, msg_obj: Dict):
                     self.logger.error(f"Could not add these tasks to buffer!\n{task_slice}")
                     self.logger.exception(e)
 
+                activity_id = msg_obj.get("activity_id")
+                workflow_id = msg_obj.get("workflow_id")
+                if (
+                    activity_id
+                    and workflow_id
+                    and msg_obj.get("ended_at")
+                    and msg_obj.get("used")
+                    and msg_obj.get("generated")
+                    and activity_id not in self._seen_activities.get(workflow_id, set())
+                ):
+                    self.schema_manager.update_workflow_schema_cache([msg_obj])
+                    self._seen_activities.setdefault(workflow_id, set()).add(activity_id)
+
                 # self.monitor_chunk()
 
         return True
 
-    def update_schema_and_add_to_df(self, tasks: List[Dict]):
-        """Update the schema and add to the DataFrame in context."""
-        self.schema_tracker.update_with_tasks(tasks)
-        self.context.tasks_schema = self.schema_tracker.get_schema()
-        self.context.value_examples = self.schema_tracker.get_example_values()
-
-        _df = self._to_context_df(tasks)
-        self.context.df = pd.concat([self.context.df, _df], ignore_index=True)
-
-    def update_objects_schema_and_add_to_df(self, objects: List[Dict]):
-        """Update the object schema and add to the object DataFrame context."""
-        self.objects_schema_tracker.update_with_tasks(objects)
-        self.context.objects_schema = self.objects_schema_tracker.get_schema()
-        self.context.objects_value_examples = self.objects_schema_tracker.get_example_values()
-
-        _df = self._to_context_df(objects)
-        self.context.objects_df = pd.concat([self.context.objects_df, _df], ignore_index=True)
-
-    @staticmethod
-    def _to_context_df(records: List[Dict]):
-        _df = pd.json_normalize(records)
-        for col in _df.columns:
-            if _df[col].apply(lambda v: isinstance(v, list)).any():
-                _df[col] = _df[col].apply(lambda v: tuple(v) if isinstance(v, list) else v)
-        return pd.DataFrame(_df)
-
     def monitor_chunk(self):
         """
         Perform LLM-based analysis on the current chunk of task messages and send the results.
         """
         self.logger.debug(f"Going to begin LLM job! {self.msgs_counter}")
-        from flowcept.agents.agent_client import run_tool
+        from flowcept.agents.mcp.mcp_client import run_tool
 
         result = run_tool("analyze_task_chunk")
         if len(result):
@@ -289,9 +302,14 @@ def monitor_chunk(self):
 if "allowed_hosts" in AGENT:
     from mcp.server.transport_security import TransportSecuritySettings
 
+    allowed_hosts = list(AGENT.get("allowed_hosts") or [])
+    for host in {AGENT_HOST, "localhost", "127.0.0.1", "::1"}:
+        for allowed_host in {host, f"{host}:*", f"{host}:{AGENT_PORT}"}:
+            if allowed_host not in allowed_hosts:
+                allowed_hosts.append(allowed_host)
     agent_transport_security = TransportSecuritySettings(
         enable_dns_rebinding_protection=True,
-        allowed_hosts=AGENT.get("allowed_hosts"),
+        allowed_hosts=allowed_hosts,
     )
 
 mcp_flowcept = FastMCP(
@@ -313,8 +331,7 @@ def get_df_context(context_kind="tasks"):
     tuple
         ``(df, schema, value_examples, custom_user_guidance)`` from lifespan context.
     """
-    ctx = mcp_flowcept.get_context()
-    lifespan_context = ctx.request_context.lifespan_context
+    lifespan_context = ctx_manager.context
     if context_kind == "objects":
         df = lifespan_context.objects_df
         schema = lifespan_context.objects_schema
diff --git a/src/flowcept/agents/agent_client.py b/src/flowcept/agents/mcp/mcp_client.py
similarity index 100%
rename from src/flowcept/agents/agent_client.py
rename to src/flowcept/agents/mcp/mcp_client.py
diff --git a/src/flowcept/agents/mcp/mcp_prompts.py b/src/flowcept/agents/mcp/mcp_prompts.py
new file mode 100644
index 00000000..68e122ef
--- /dev/null
+++ b/src/flowcept/agents/mcp/mcp_prompts.py
@@ -0,0 +1,42 @@
+"""MCP prompt registrations — all ``@mcp_flowcept.prompt()`` decorators live here.
+
+Separated from the prompt builders in ``prompts/`` so those files have no MCP imports.
+"""
+
+from flowcept.agents.mcp.context_manager import mcp_flowcept, get_df_context, EMPTY_DF_MESSAGE
+from flowcept.agents.prompts.df_query_prompts import build_pandas_code_prompt
+
+
+@mcp_flowcept.prompt(
+    name="build_df_query_prompt",
+    title="Build DataFrame Query Prompt",
+    description="Build prompt context for external LLM code generation over agent DataFrame context.",
+)
+def build_df_query_prompt(query: str, context_kind: str = "tasks") -> str:
+    """Build the internal pandas-code generation prompt for external LLM orchestration.
+
+    Parameters
+    ----------
+    query : str
+        Natural language question to translate into pandas code.
+    context_kind : str, optional
+        "tasks" or "objects".
+
+    Returns
+    -------
+    str
+        Prompt text to guide external LLM code generation.
+        Returns an explanatory message when there is no active DataFrame context.
+    """
+    df, schema, value_examples, custom_user_guidance = get_df_context(context_kind=context_kind)
+    if df is None or not len(df):
+        return EMPTY_DF_MESSAGE
+    current_fields = list(df.columns)
+    return build_pandas_code_prompt(
+        query,
+        schema,
+        value_examples,
+        custom_user_guidance,
+        current_fields,
+        context_kind=context_kind,
+    )
diff --git a/src/flowcept/agents/flowcept_agent.py b/src/flowcept/agents/mcp/mcp_server.py
similarity index 55%
rename from src/flowcept/agents/flowcept_agent.py
rename to src/flowcept/agents/mcp/mcp_server.py
index 5de2481a..1fd327a1 100644
--- a/src/flowcept/agents/flowcept_agent.py
+++ b/src/flowcept/agents/mcp/mcp_server.py
@@ -1,12 +1,22 @@
+"""MCP server entry point for the Flowcept agent."""
+
 import json
 import os
+import socket
+import time
 from threading import Thread
 
-from flowcept.agents import check_liveness
-from flowcept.agents.agents_utils import ToolResult
-from flowcept.agents.tools.general_tools import prompt_handler
-from flowcept.agents.agent_client import run_tool
-from flowcept.agents.flowcept_ctx_manager import mcp_flowcept, ctx_manager
+from flowcept.agents.mcp.mcp_client import run_tool
+from flowcept.agents.mcp.context_manager import mcp_flowcept, ctx_manager
+
+# Import all mcp_tools modules so their @mcp_flowcept.tool() decorators fire
+from flowcept.agents.mcp.mcp_tools.session_tools import check_liveness
+import flowcept.agents.mcp.mcp_tools.db_query_mcp_tools  # noqa: F401
+import flowcept.agents.mcp.mcp_tools.dashboard_mcp_tools  # noqa: F401
+import flowcept.agents.mcp.mcp_tools.df_query_mcp_tools  # noqa: F401
+import flowcept.agents.mcp.mcp_tools.report_tools  # noqa: F401
+import flowcept.agents.mcp.mcp_tools.schema_mcp_tools  # noqa: F401
+import flowcept.agents.mcp.mcp_prompts  # noqa: F401
 from flowcept.commons.flowcept_logger import FlowceptLogger
 from flowcept.configs import AGENT_HOST, AGENT_PORT, DUMP_BUFFER_PATH
 from flowcept.flowceptor.consumers.agent.base_agent_context_manager import BaseAgentContextManager
@@ -15,20 +25,16 @@
 import uvicorn
 
 
-class FlowceptAgent:
-    """
-    Flowcept agent server wrapper with optional offline buffer loading.
-    """
+class FlowceptMCPServer:
+    """Flowcept mcp server wrapper with optional offline buffer loading."""
 
     def __init__(self, buffer_path: str | None = None, buffer_messages: list[dict] | None = None):
-        """
-        Initialize a FlowceptAgent.
+        """Initialize a Flowcept MCP server.
 
         Parameters
         ----------
         buffer_path : str or None
-            Optional path to a JSONL buffer file. When MQ is disabled, the agent
-            loads this file once at startup.
+            Optional path to a JSONL buffer file.
         buffer_messages : list[dict] or None
             Optional list of buffer messages to load directly into the agent context.
         """
@@ -39,8 +45,7 @@ def __init__(self, buffer_path: str | None = None, buffer_messages: list[dict] |
         self._server = None
 
     def _load_buffer_messages(self, messages: list[dict]) -> int:
-        """
-        Load a list of message objects into the agent context.
+        """Load a list of message objects into the agent context.
 
         Returns
         -------
@@ -58,9 +63,17 @@ def _load_buffer_messages(self, messages: list[dict]) -> int:
         self.logger.info(f"Loaded {count} messages from buffer list.")
         return count
 
+    def reset_context(self):
+        """Reset the MCP agent context without restarting the HTTP server."""
+        ctx_manager.reset_context()
+
+    def load_buffer_messages(self, messages: list[dict]) -> int:
+        """Replace the active MCP context with the provided buffer messages."""
+        self.reset_context()
+        return self._load_buffer_messages(messages)
+
     def _load_buffer_once(self) -> int:
-        """
-        Load messages from a JSONL buffer file into the agent context.
+        """Load messages from a JSONL buffer file into the agent context.
 
         Returns
         -------
@@ -91,8 +104,6 @@ def _load_buffer_once(self) -> int:
     def _run_server(self):
         """Run the MCP server (blocking call)."""
         try:
-            # sse-starlette keeps a module-level exit Event bound to the first event loop that
-            # served SSE; reset it so this server's fresh loop can serve SSE in the same process.
             from sse_starlette.sse import AppStatus
 
             AppStatus.should_exit_event = None
@@ -103,31 +114,51 @@ def _run_server(self):
         self._server.run()
 
     def start(self):
-        """
-        Start the agent server in a background thread.
+        """Start the agent server in a background thread.
 
         Returns
         -------
-        FlowceptAgent
+        FlowceptMCPServer
             The current instance.
         """
-        if self.buffer_path is not None:
-            if self.buffer_messages is not None:
-                self._load_buffer_messages(self.buffer_messages)
-            else:
-                self._load_buffer_once()
-
-        # Daemon thread so the hosting process can always exit (e.g., test runners);
-        # long-running deployments block explicitly via wait().
+        if self.buffer_path is not None or self.buffer_messages is not None:
+            self.reset_context()
+        if self.buffer_messages is not None:
+            self._load_buffer_messages(self.buffer_messages)
+        elif self.buffer_path is not None:
+            self._load_buffer_once()
+
         self._server_thread = Thread(target=self._run_server, daemon=True)
         self._server_thread.start()
-        self.logger.info(f"Flowcept agent server started on {AGENT_HOST}:{AGENT_PORT}")
+        self._wait_until_ready()
+        self.logger.info(f"Flowcept mcp server started on {AGENT_HOST}:{AGENT_PORT}")
         return self
 
+    def _wait_until_ready(self, timeout_sec: float = 10.0):
+        """Wait until the local MCP TCP listener accepts connections."""
+        deadline = time.time() + timeout_sec
+        while time.time() < deadline:
+            try:
+                with socket.create_connection((AGENT_HOST, AGENT_PORT), timeout=0.2):
+                    return
+            except OSError:
+                time.sleep(0.05)
+        raise TimeoutError(f"Flowcept MCP server did not start on {AGENT_HOST}:{AGENT_PORT}.")
+
+    def _wait_until_stopped(self, timeout_sec: float = 10.0):
+        """Wait until the local MCP TCP listener stops accepting connections."""
+        deadline = time.time() + timeout_sec
+        while time.time() < deadline:
+            try:
+                with socket.create_connection((AGENT_HOST, AGENT_PORT), timeout=0.2):
+                    time.sleep(0.05)
+            except OSError:
+                return
+        self.logger.warning(f"Flowcept MCP server still appears reachable on {AGENT_HOST}:{AGENT_PORT}.")
+
     def stop(self):
         """Stop the agent server and wait briefly for shutdown."""
         if self._server is None and self._server_thread is not None:
-            # The server object is created inside the thread; give it a moment to appear.
             self._server_thread.join(timeout=1)
         if self._server is not None:
             self._server.should_exit = True
@@ -135,38 +166,17 @@ def stop(self):
             self._server_thread.join(timeout=5)
             if self._server_thread.is_alive():
                 self.logger.warning("Agent server thread did not stop within 5s; continuing shutdown.")
+        self._wait_until_stopped()
 
     def wait(self):
         """Block until the server thread exits."""
         if self._server_thread is not None:
             self._server_thread.join()
 
-    def query(self, message: str) -> ToolResult:
-        """
-        Send a prompt to the agent's main router tool and return the response.
-        """
-        try:
-            resp = run_tool(tool_name=prompt_handler, kwargs={"message": message})[0]
-        except Exception as e:
-            return ToolResult(code=400, result=f"Error executing tool prompt_handler: {e}", tool_name="prompt_handler")
-
-        try:
-            return ToolResult(**json.loads(resp))
-        except Exception as e:
-            return ToolResult(
-                code=499,
-                result=f"Could not parse tool response as JSON: {resp}",
-                extra=str(e),
-                tool_name="prompt_handler",
-            )
-
 
 def main():
-    """
-    Start the MCP server.
-    """
-    agent = FlowceptAgent().start()
-    # Wake up tool call
+    """Start the MCP server."""
+    agent = FlowceptMCPServer().start()
     print(run_tool(check_liveness, host=AGENT_HOST, port=AGENT_PORT)[0])
     agent.wait()
 
diff --git a/src/flowcept/agents/mcp/mcp_tools/__init__.py b/src/flowcept/agents/mcp/mcp_tools/__init__.py
new file mode 100644
index 00000000..9b02dffb
--- /dev/null
+++ b/src/flowcept/agents/mcp/mcp_tools/__init__.py
@@ -0,0 +1,4 @@
+"""Thin MCP tool wrappers over data_query_tools/ cores."""
+
+from flowcept.agents.mcp.mcp_tools.report_tools import generate_workflow_card  # noqa: F401
+from flowcept.agents.mcp.mcp_tools.session_tools import check_liveness  # noqa: F401
diff --git a/src/flowcept/agents/mcp/mcp_tools/dashboard_mcp_tools.py b/src/flowcept/agents/mcp/mcp_tools/dashboard_mcp_tools.py
new file mode 100644
index 00000000..416cab04
--- /dev/null
+++ b/src/flowcept/agents/mcp/mcp_tools/dashboard_mcp_tools.py
@@ -0,0 +1,30 @@
+"""Thin MCP wrappers for dashboard agent tools."""
+
+from typing import Any, Dict, Optional
+
+from flowcept.agents.data_query_tools import dashboard_tools
+from flowcept.agents.mcp.context_manager import mcp_flowcept
+from flowcept.agents.tool_result import ToolResult
+from flowcept.commons.vocabulary import PROV_AGENT
+from flowcept.instrumentation.flowcept_agent_task import agent_flowcept_task
+
+
+@mcp_flowcept.tool()
+@agent_flowcept_task(subtype=PROV_AGENT.AGENT_TOOL)
+def make_chart(card_spec: Dict[str, Any], context: Optional[Dict[str, Any]] = None) -> ToolResult:
+    """Build a chart from a declarative dashboard card spec."""
+    return dashboard_tools.make_chart(card_spec=card_spec, context=context)
+
+
+@mcp_flowcept.tool()
+@agent_flowcept_task(subtype=PROV_AGENT.AGENT_TOOL)
+def get_dashboard(dashboard_id: str) -> ToolResult:
+    """Get a stored dashboard spec by id."""
+    return dashboard_tools.get_dashboard(dashboard_id=dashboard_id)
+
+
+@mcp_flowcept.tool()
+@agent_flowcept_task(subtype=PROV_AGENT.AGENT_TOOL)
+def update_dashboard(dashboard_id: str, spec: Dict[str, Any]) -> ToolResult:
+    """Replace a stored dashboard spec with a complete revised spec."""
+    return dashboard_tools.update_dashboard(dashboard_id=dashboard_id, spec=spec)
diff --git a/src/flowcept/agents/mcp/mcp_tools/db_query_mcp_tools.py b/src/flowcept/agents/mcp/mcp_tools/db_query_mcp_tools.py
new file mode 100644
index 00000000..d5203480
--- /dev/null
+++ b/src/flowcept/agents/mcp/mcp_tools/db_query_mcp_tools.py
@@ -0,0 +1,80 @@
+"""Thin MCP wrappers exposing DB provenance query tools to external agent clients.
+
+One-liner delegates to :mod:`flowcept.agents.data_query_tools.db_query_tools`.
+No business logic here — all logic lives in ``data_query_tools/``.
+"""
+
+from typing import Any, Dict, List, Optional
+
+from flowcept.agents.tool_result import ToolResult
+from flowcept.agents.mcp.context_manager import mcp_flowcept
+from flowcept.agents.data_query_tools import db_query_tools
+from flowcept.commons.vocabulary import PROV_AGENT
+from flowcept.instrumentation.flowcept_agent_task import agent_flowcept_task
+
+
+@mcp_flowcept.tool()
+@agent_flowcept_task(subtype=PROV_AGENT.AGENT_TOOL)
+def query_tasks(
+    filter: Optional[Dict[str, Any]] = None,
+    projection: Optional[List[str]] = None,
+    limit: int = 100,
+    sort: Optional[List[Dict[str, Any]]] = None,
+) -> ToolResult:
+    """Query task provenance records in the database with a Mongo-style filter."""
+    return db_query_tools.query_tasks(filter=filter, projection=projection, limit=limit, sort=sort)
+
+
+@mcp_flowcept.tool()
+@agent_flowcept_task(subtype=PROV_AGENT.AGENT_TOOL)
+def query_workflows(filter: Optional[Dict[str, Any]] = None, limit: int = 100) -> ToolResult:
+    """Query workflow provenance records in the database with a Mongo-style filter."""
+    return db_query_tools.query_workflows(filter=filter, limit=limit)
+
+
+@mcp_flowcept.tool()
+@agent_flowcept_task(subtype=PROV_AGENT.AGENT_TOOL)
+def get_task_summary(filter: Optional[Dict[str, Any]] = None) -> ToolResult:
+    """Summarize tasks matching a filter: status counts, per-activity durations, time range."""
+    return db_query_tools.get_task_summary(filter=filter)
+
+
+@mcp_flowcept.tool()
+@agent_flowcept_task(subtype=PROV_AGENT.AGENT_TOOL)
+def list_campaigns(campaign_id: Optional[str] = None) -> ToolResult:
+    """List derived campaign summaries (campaigns group workflows and tasks)."""
+    return db_query_tools.list_campaigns(campaign_id=campaign_id)
+
+
+@mcp_flowcept.tool()
+@agent_flowcept_task(subtype=PROV_AGENT.AGENT_TOOL)
+def list_agents(filter: Optional[Dict[str, Any]] = None) -> ToolResult:
+    """List derived agent summaries (agents observed in task provenance)."""
+    return db_query_tools.list_agents(filter=filter)
+
+
+@mcp_flowcept.tool()
+@agent_flowcept_task(subtype=PROV_AGENT.AGENT_TOOL)
+def query_objects(
+    filter: Optional[Dict[str, Any]] = None,
+    projection: Optional[Any] = None,
+    limit: int = 100,
+) -> ToolResult:
+    """Query stored data-object records (ML models, datasets, blobs) with a Mongo-style filter.
+
+    Use for model parameters, dataset metadata, artifact sizes, or file types.
+    """
+    if isinstance(projection, dict):
+        projection = [k for k, v in projection.items() if v]
+    return db_query_tools.query_objects(filter=filter, projection=projection or None, limit=limit)
+
+
+@mcp_flowcept.tool()
+@agent_flowcept_task(subtype=PROV_AGENT.AGENT_TOOL)
+def highlight_lineage(
+    task_ids: Optional[List[str]] = None,
+    filter: Optional[Dict[str, Any]] = None,
+    workflow_id: Optional[str] = None,
+) -> ToolResult:
+    """Return seed tasks for UI lineage highlighting."""
+    return db_query_tools.highlight_lineage(task_ids=task_ids, filter=filter, workflow_id=workflow_id)
diff --git a/src/flowcept/agents/mcp/mcp_tools/df_query_mcp_tools.py b/src/flowcept/agents/mcp/mcp_tools/df_query_mcp_tools.py
new file mode 100644
index 00000000..5d61fec1
--- /dev/null
+++ b/src/flowcept/agents/mcp/mcp_tools/df_query_mcp_tools.py
@@ -0,0 +1,137 @@
+"""Thin MCP wrappers for DF (DataFrame) query tools.
+
+One-liner delegates to :mod:`flowcept.agents.data_query_tools.df_query_tools`.
+MCP context lookup (df, schema, value_examples, custom_user_guidance) happens here.
+"""
+
+from flowcept.agents.tool_result import ToolResult
+from flowcept.agents.mcp.context_manager import mcp_flowcept, get_df_context, ctx_manager, EMPTY_DF_MESSAGE
+from flowcept.agents.data_query_tools import df_query_tools as _core
+from flowcept.commons.vocabulary import PROV_AGENT
+from flowcept.instrumentation.flowcept_agent_task import agent_flowcept_task
+
+_WORKFLOW_HEAVY_FIELDS = frozenset(
+    {
+        "machine_info",
+        "flowcept_settings",
+        "code_repository",
+        "conf",
+        "extra_metadata",
+        "environment_id",
+        "sys_name",
+        "interceptor_ids",
+        "adapter_id",
+        "flowcept_version",
+    }
+)
+
+
+@mcp_flowcept.tool()
+@agent_flowcept_task(subtype=PROV_AGENT.AGENT_TOOL)
+def get_workflow_context() -> ToolResult:
+    """Return the in-memory workflow record(s) currently loaded in the agent context.
+
+    The DF path stores workflow provenance in the MCP context rather than in the
+    tasks DataFrame.  This tool is the DF-path counterpart to the DB-path
+    ``query_workflows`` tool: both return ``{items, count}`` with heavy
+    infrastructure fields stripped.
+
+    Returns
+    -------
+    ToolResult
+        ``result`` holds ``{"items": [...], "count": int}``.
+    """
+    wf = ctx_manager.context.workflow_msg_obj
+    if not wf:
+        return ToolResult(code=404, result="No workflow loaded in agent context.", tool_name="get_workflow_context")
+    pruned = {k: v for k, v in wf.items() if k not in _WORKFLOW_HEAVY_FIELDS}
+    # Add a lightweight hardware_summary from machine_info so hardware questions can be answered.
+    machine_info = wf.get("machine_info")
+    if machine_info and isinstance(machine_info, dict):
+        for node_data in machine_info.values():
+            if isinstance(node_data, dict):
+                hw: dict = {}
+                if "platform" in node_data:
+                    hw["platform"] = node_data["platform"]
+                if "cpu" in node_data:
+                    cpu = node_data["cpu"]
+                    hw["cpu"] = {k: cpu[k] for k in ("brand_raw", "arch", "count") if k in cpu}
+                if hw:
+                    pruned["hardware_summary"] = hw
+                break
+    return ToolResult(code=301, result={"items": [pruned], "count": 1}, tool_name="get_workflow_context")
+
+
+@mcp_flowcept.tool()
+@agent_flowcept_task(subtype=PROV_AGENT.AGENT_TOOL)
+def run_df_query(query: str, llm=None, plot: bool = False, context_kind: str = "tasks") -> ToolResult:
+    r"""Run a natural language query against the current context DataFrame.
+
+    This tool retrieves the active DataFrame, schema, and example values
+    from the MCP Flowcept context and uses an LLM to process the query.
+
+    Parameters
+    ----------
+    query : str
+        Natural language query or Python code snippet.
+    llm : callable, optional
+        LLM callable. Built from settings if None.
+    plot : bool, optional
+        If True, generate plotting code.
+    context_kind : str, optional
+        "tasks" or "objects".
+
+    Returns
+    -------
+    ToolResult
+    """
+    df, schema, value_examples, custom_user_guidance = get_df_context(context_kind=context_kind)
+    return _core.run_df_query(
+        query=query,
+        df=df,
+        schema=schema,
+        value_examples=value_examples,
+        custom_user_guidance=custom_user_guidance,
+        llm=llm,
+        plot=plot,
+        context_kind=context_kind,
+    )
+
+
+@mcp_flowcept.tool()
+@agent_flowcept_task(subtype=PROV_AGENT.AGENT_TOOL)
+def execute_generated_df_code(user_code: str, context_kind: str = "tasks") -> ToolResult:
+    """Execute externally generated pandas code against the current agent DataFrame.
+
+    Parameters
+    ----------
+    user_code : str
+        Pandas code expected to assign output to ``result``.
+    context_kind : str, optional
+        "tasks" or "objects".
+
+    Returns
+    -------
+    ToolResult
+    """
+    df, _, _, _ = get_df_context(context_kind=context_kind)
+    if df is None or not len(df):
+        return ToolResult(code=404, result=EMPTY_DF_MESSAGE)
+    return _core.execute_df_code(user_code=user_code, df=df)
+
+
+@mcp_flowcept.tool()
+@agent_flowcept_task(subtype=PROV_AGENT.AGENT_TOOL)
+def extract_or_fix_python_code(raw_text: str, runtime_error: str = None, context_kind: str = "tasks") -> ToolResult:
+    """Extract or repair pandas code using the current agent DataFrame columns."""
+    from flowcept.agents.llm.builders import build_llm_model
+
+    df, _, _, _ = get_df_context(context_kind=context_kind)
+    if df is None or not len(df):
+        return ToolResult(code=404, result=EMPTY_DF_MESSAGE)
+    return _core.extract_or_fix_python_code(
+        build_llm_model(track_tools=False),
+        raw_text,
+        list(df.columns),
+        runtime_error=runtime_error,
+    )
diff --git a/src/flowcept/agents/mcp/mcp_tools/report_tools.py b/src/flowcept/agents/mcp/mcp_tools/report_tools.py
new file mode 100644
index 00000000..c0a3ffb1
--- /dev/null
+++ b/src/flowcept/agents/mcp/mcp_tools/report_tools.py
@@ -0,0 +1,59 @@
+"""MCP tool for generating workflow provenance cards.
+
+Split from ``general_tools.py`` — thin wrapper around ``Flowcept.generate_report``.
+"""
+
+from flowcept import Flowcept
+from flowcept.agents.tool_result import ToolResult
+from flowcept.agents.mcp.context_manager import mcp_flowcept
+from flowcept.commons.vocabulary import PROV_AGENT
+from flowcept.instrumentation.flowcept_agent_task import agent_flowcept_task
+
+
+@mcp_flowcept.tool()
+@agent_flowcept_task(subtype=PROV_AGENT.AGENT_TOOL)
+def generate_workflow_card(
+    workflow_id: str = None,
+    campaign_id: str = None,
+    input_jsonl_path: str = None,
+) -> ToolResult:
+    """Generate and return a markdown workflow card as text.
+
+    Exactly one of ``workflow_id``, ``campaign_id``, or ``input_jsonl_path`` must be provided.
+
+    Parameters
+    ----------
+    workflow_id : str, optional
+        Query by workflow identifier.
+    campaign_id : str, optional
+        Query by campaign identifier (produces a campaign-level card).
+    input_jsonl_path : str, optional
+        Path to a Flowcept JSONL buffer file used as input instead of the DB.
+
+    Returns
+    -------
+    ToolResult
+        ``code=301`` with markdown text in ``result["markdown"]`` on success,
+        or an error payload on failure.
+    """
+    try:
+        if not any([workflow_id, campaign_id, input_jsonl_path]):
+            return ToolResult(code=400, result="One of workflow_id, campaign_id, or input_jsonl_path is required.")
+
+        stats = Flowcept.generate_report(
+            report_type="workflow_card",
+            format="markdown",
+            workflow_id=workflow_id,
+            campaign_id=campaign_id,
+            input_jsonl_path=input_jsonl_path,
+        )
+        return ToolResult(
+            code=301,
+            result={
+                "workflow_id": workflow_id,
+                "campaign_id": campaign_id,
+                "markdown": stats["markdown"],
+            },
+        )
+    except Exception as e:
+        return ToolResult(code=499, result=str(e))
diff --git a/src/flowcept/agents/mcp/mcp_tools/schema_mcp_tools.py b/src/flowcept/agents/mcp/mcp_tools/schema_mcp_tools.py
new file mode 100644
index 00000000..90ebae7d
--- /dev/null
+++ b/src/flowcept/agents/mcp/mcp_tools/schema_mcp_tools.py
@@ -0,0 +1,28 @@
+"""MCP tools for workflow-scoped schema context."""
+
+from typing import Optional
+
+from flowcept.agents.mcp.context_manager import ctx_manager, mcp_flowcept
+from flowcept.agents.prompts.db_query_prompts import build_db_schema_context
+from flowcept.agents.tool_result import ToolResult
+from flowcept.commons.vocabulary import PROV_AGENT
+from flowcept.instrumentation.flowcept_agent_task import agent_flowcept_task
+
+
+@mcp_flowcept.tool()
+@agent_flowcept_task(subtype=PROV_AGENT.AGENT_TOOL)
+def get_workflow_schema_context(workflow_id: Optional[str] = None) -> ToolResult:
+    """Return workflow-scoped dynamic schema context for DB and runtime queries."""
+    snapshot = ctx_manager.schema_manager.get_workflow_schema_snapshot(workflow_id)
+    if not snapshot:
+        return ToolResult(code=404, result="No workflow schema context is available.")
+    prompt_context = build_db_schema_context(
+        dynamic_schema=snapshot.get("dynamic_schema"),
+        example_values=snapshot.get("value_examples"),
+        current_fields=snapshot.get("current_fields"),
+    )
+    return ToolResult(
+        code=301,
+        result={"workflow_id": workflow_id, "schema": snapshot, "prompt_context": prompt_context},
+        tool_name="get_workflow_schema_context",
+    )
diff --git a/src/flowcept/agents/mcp/mcp_tools/session_tools.py b/src/flowcept/agents/mcp/mcp_tools/session_tools.py
new file mode 100644
index 00000000..79091896
--- /dev/null
+++ b/src/flowcept/agents/mcp/mcp_tools/session_tools.py
@@ -0,0 +1,150 @@
+"""Session-level MCP tools: liveness, LLM check, guidance recording, and context reset."""
+
+import json
+from typing import List
+
+from flowcept.agents.tool_result import ToolResult
+from flowcept.agents.llm.builders import build_llm_model
+from flowcept.agents.mcp.context_manager import ctx_manager, mcp_flowcept
+
+
+def _with_message_type(message: dict) -> dict:
+    """Return a message with Flowcept type inferred for persisted DB documents."""
+    if message.get("type"):
+        return message
+    typed = dict(message)
+    if typed.get("object_id"):
+        typed["type"] = "object"
+    elif typed.get("task_id") or typed.get("activity_id"):
+        typed["type"] = "task"
+    elif typed.get("workflow_id"):
+        typed["type"] = "workflow"
+    return typed
+
+
+@mcp_flowcept.tool()
+def get_latest(n: int = None) -> str:
+    """Return the most recent task(s) from the task buffer.
+
+    Parameters
+    ----------
+    n : int, optional
+        Number of most recent tasks to return. If None, return only the latest.
+
+    Returns
+    -------
+    str
+        JSON-encoded task(s).
+    """
+    tasks = ctx_manager.context.tasks
+    if not tasks:
+        return "No tasks available."
+    if n is None:
+        return json.dumps(tasks[-1])
+    return json.dumps(tasks[-n])
+
+
+@mcp_flowcept.tool()
+def check_liveness() -> str:
+    """Confirm the agent is alive and responding.
+
+    Returns
+    -------
+    str
+        Liveness status string.
+    """
+    return f"I'm {mcp_flowcept.name} and I'm ready!"
+
+
+@mcp_flowcept.tool()
+def check_llm() -> str:
+    """Check connectivity and response from the LLM backend.
+
+    Returns
+    -------
+    str
+        LLM response.
+    """
+    llm = build_llm_model()
+    return llm("Hello?")
+
+
+@mcp_flowcept.tool()
+def record_guidance(message: str) -> ToolResult:
+    """Record a custom guidance message in agent memory.
+
+    Parameters
+    ----------
+    message : str
+        Guidance text to record.
+
+    Returns
+    -------
+    ToolResult
+    """
+    message = message.replace("@record", "")
+    custom_guidance: List = ctx_manager.context.custom_guidance
+    custom_guidance.append(message)
+    return ToolResult(code=201, result=f"Ok. I recorded in my memory: {message}")
+
+
+@mcp_flowcept.tool()
+def show_records() -> ToolResult:
+    """List all recorded user guidance.
+
+    Returns
+    -------
+    ToolResult
+    """
+    try:
+        custom_guidance: List = ctx_manager.context.custom_guidance
+        if not custom_guidance:
+            message = "There is no recorded user guidance."
+        else:
+            message = "This is the list of custom guidance I have in my memory:\n"
+            message += "\n".join(f" - {msg}" for msg in custom_guidance)
+        return ToolResult(code=201, result=message)
+    except Exception as e:
+        return ToolResult(code=499, result=str(e))
+
+
+@mcp_flowcept.tool()
+def reset_records() -> ToolResult:
+    """Reset all recorded user guidance.
+
+    Returns
+    -------
+    ToolResult
+    """
+    try:
+        ctx_manager.context.custom_guidance = []
+        return ToolResult(code=201, result="Custom guidance reset.")
+    except Exception as e:
+        return ToolResult(code=499, result=str(e))
+
+
+@mcp_flowcept.tool()
+def reset_context() -> ToolResult:
+    """Reset all agent context.
+
+    Returns
+    -------
+    ToolResult
+    """
+    try:
+        ctx_manager.reset_context()
+        return ToolResult(code=201, result="Context reset.")
+    except Exception as e:
+        return ToolResult(code=499, result=str(e))
+
+
+@mcp_flowcept.tool()
+def load_buffer_messages(messages: List[dict]) -> ToolResult:
+    """Replace active MCP context with provided Flowcept buffer messages."""
+    try:
+        ctx_manager.reset_context()
+        for msg_obj in messages:
+            ctx_manager.message_handler(_with_message_type(msg_obj))
+        return ToolResult(code=201, result={"count": len(messages)})
+    except Exception as e:
+        return ToolResult(code=499, result=str(e))
diff --git a/src/flowcept/agents/prompts/README.md b/src/flowcept/agents/prompts/README.md
new file mode 100644
index 00000000..12d060ae
--- /dev/null
+++ b/src/flowcept/agents/prompts/README.md
@@ -0,0 +1,27 @@
+# Agents Prompts
+
+This directory contains all prompt builder functions for the Flowcept agent subsystem.
+
+## Files
+
+| File | Purpose |
+|---|---|
+| `base_prompts.py` | `BASE_ROLE`, `build_single_task_prompt`, `build_multitask_prompt` — schema-aware analysis prompts using `SCHEMA_CONTEXT` |
+| `db_query_prompts.py` | `build_db_filter_prompt` — generates Mongo-style filter JSON for DB queries |
+| `in_memory_task_query_prompts.py` | Prompt builders for in-memory task DataFrame queries (`generate_pandas_code_prompt`, `generate_plot_code_prompt`, etc.) |
+| `in_memory_workflow_query_prompts.py` | Prompt builders for querying the active workflow message object |
+| `general_prompts.py` | Routing and small-talk prompts; `ROUTING_PROMPT`, `SMALL_TALK_PROMPT` |
+| `chat_prompts.py` | `build_chat_system_prompt` — system prompt builder for the webservice chat endpoint |
+
+## Design Rules
+
+1. **No MCP imports** — prompt files must never import `mcp_flowcept` or `FastMCP`.
+   - The `@mcp_flowcept.prompt()` registrations live in `prompts/mcp_prompts.py`.
+
+2. **Schema from SCHEMA_CONTEXT** — prompt builders that need field names or types must
+   use `SCHEMA_CONTEXT` from `schema_introspection.py`, not hardcoded strings.
+   `SCHEMA_CONTEXT` is populated at MCP server startup and is a module-level dict.
+
+3. **Naming convention** — all public builder functions are named `build_*_prompt`.
+
+4. **No side effects** — functions are pure builders; they never call LLMs or make DB queries.
diff --git a/src/flowcept/agents/prompts/base_prompts.py b/src/flowcept/agents/prompts/base_prompts.py
new file mode 100644
index 00000000..6ebb3026
--- /dev/null
+++ b/src/flowcept/agents/prompts/base_prompts.py
@@ -0,0 +1,107 @@
+# flake8: noqa: E501
+"""Base prompt builders using SCHEMA_CONTEXT for schema-aware task analysis.
+
+These replace the hardcoded schema strings in ``general_prompts.py`` with
+live schema tables derived from ``SCHEMA_CONTEXT`` (populated at MCP server startup).
+"""
+
+from flowcept.agents.provenance_schema_manager.static_schema_builder import SCHEMA_CONTEXT
+
+BASE_ROLE = (
+    "You are a helpful assistant analyzing provenance data from a large-scale workflow composed of multiple tasks."
+)
+
+
+def _build_schema_table() -> str:
+    """Build a markdown schema reference table from SCHEMA_CONTEXT."""
+    rows = [
+        "| Field | Type | Description |",
+        "|---|---|---|",
+    ]
+    for field in SCHEMA_CONTEXT.get("task_fields", []):
+        rows.append(f"| `{field['name']}` | {field['type']} | {field['description']} |")
+    for field in SCHEMA_CONTEXT.get("telemetry_summary_fields", []):
+        rows.append(f"| `telemetry_summary.{field['name']}` | {field['type']} | {field['description']} |")
+    if not SCHEMA_CONTEXT:
+        rows.append("| *(schema not yet loaded)* | | |")
+    return "\n".join(rows)
+
+
+def _build_data_schema_prompt() -> str:
+    """Return a schema description string for a task object."""
+    return (
+        "A task object has its provenance: input data is stored in the 'used' field (column prefix `used.`), "
+        "output in the 'generated' field (column prefix `generated.`). "
+        "Tasks sharing the same 'workflow_id' belong to the same workflow execution trace. "
+        "Pay attention to the 'tags' field, as it may indicate critical tasks. "
+        "The 'telemetry_summary' field reports CPU, disk, memory, and network usage, along with 'duration_sec'. "
+        "Task placement is stored in the 'hostname' field.\n\n"
+        "### Known task fields\n\n" + _build_schema_table()
+    )
+
+
+_ANALYSIS_CORE = (
+    "Correlations involving 'used' vs 'generated' data are especially important. "
+    "So are relationships between (used or generated) data and resource metrics. "
+    "Highlight outliers or critical information and give actionable insights or recommendations."
+)
+
+
+def _build_prompt(role_suffix: str, job: str, data_label: str, data) -> str:
+    return (
+        f"{BASE_ROLE}{role_suffix}\n\n"
+        f"{_build_data_schema_prompt()}\n\n"
+        f"{job} {_ANALYSIS_CORE}\n\n"
+        f"{data_label}:\n```json\n{data}\n```"
+    )
+
+
+def build_single_task_prompt(task_obj: dict) -> str:
+    """Build a prompt for single-task analysis using the live schema context.
+
+    Parameters
+    ----------
+    task_obj : dict
+        The task object to analyze.
+
+    Returns
+    -------
+    str
+        Formatted analysis prompt.
+    """
+    return _build_prompt(
+        role_suffix=" You are focusing now on a particular task object.",
+        job=(
+            "Your job is to analyze this single task. Find any anomalies, relationships, or correlations between "
+            "input, output, resource usage metrics, task duration, and task placement. "
+            "Explain what this task may be doing, using the data provided."
+        ),
+        data_label="Task object",
+        data=task_obj,
+    )
+
+
+def build_multitask_prompt(task_objs: list) -> str:
+    """Build a prompt for multi-task workflow analysis using the live schema context.
+
+    Parameters
+    ----------
+    task_objs : list
+        The list of task objects to analyze.
+
+    Returns
+    -------
+    str
+        Formatted analysis prompt.
+    """
+    return _build_prompt(
+        role_suffix="",
+        job=(
+            "Your job is to analyze a list of task objects to identify patterns across tasks, anomalies, "
+            "relationships, or correlations between inputs, outputs, resource usage, duration, and task placement. "
+            "Try to infer the purpose of the workflow. "
+            "Use the data provided to justify your analysis."
+        ),
+        data_label="Task objects",
+        data=task_objs,
+    )
diff --git a/src/flowcept/agents/prompts/chat_prompts.py b/src/flowcept/agents/prompts/chat_prompts.py
index 95ef8ecd..d822b59e 100644
--- a/src/flowcept/agents/prompts/chat_prompts.py
+++ b/src/flowcept/agents/prompts/chat_prompts.py
@@ -1,21 +1,153 @@
-"""System prompt for the webservice provenance chat."""
+"""System prompt builder for the webservice provenance chat."""
 
-CHAT_SYSTEM_PROMPT = """You are the Flowcept provenance assistant, embedded in Flowcept's web UI.
-Flowcept captures workflow provenance: campaigns group workflows; workflows contain tasks;
-tasks record used (inputs), generated (outputs), status, timings, telemetry, and host info;
-binary artifacts (datasets, ML models) are stored as versioned objects.
+from __future__ import annotations
 
-Key task fields: task_id, workflow_id, campaign_id, activity_id (function name), status
-(FINISHED/ERROR/RUNNING), started_at, ended_at, used.*, generated.*, telemetry_at_start/end
-(cpu, memory, disk, network, process, gpu), hostname, agent_id, tags.
-Key workflow fields: workflow_id, name, campaign_id, user, utc_timestamp.
+import json
+from typing import Any, Dict, Optional
 
-You have tools to query this data. Rules:
+_TASK_KEY_FIELDS = {
+    "task_id",
+    "activity_id",
+    "workflow_id",
+    "campaign_id",
+    "agent_id",
+    "status",
+    "started_at",
+    "ended_at",
+    "used",
+    "generated",
+    "hostname",
+    "tags",
+    "parent_task_id",
+    "telemetry_at_start",
+    "telemetry_at_end",
+}
+_WORKFLOW_KEY_FIELDS = {"workflow_id", "name", "campaign_id", "user", "utc_timestamp"}
+_BLOB_KEY_FIELDS = {"object_id", "object_type", "task_id", "workflow_id", "tags", "version"}
+
+
+def _build_schema_section() -> str:
+    """Build field descriptions from SCHEMA_CONTEXT; fall back to safe static text."""
+    try:
+        from flowcept.agents.provenance_schema_manager.static_schema_builder import (
+            SCHEMA_CONTEXT,
+            build_schema_context,
+        )
+
+        ctx = SCHEMA_CONTEXT if SCHEMA_CONTEXT else build_schema_context()
+    except Exception:
+        ctx = {}
+
+    def _fmt(fields, key_set):
+        parts = []
+        for f in fields:
+            if f["name"] in key_set:
+                desc = f.get("description", "")
+                parts.append(f"`{f['name']}`" + (f" ({desc})" if desc else ""))
+        return ", ".join(parts) if parts else None
+
+    task_line = _fmt(ctx.get("task_fields", []), _TASK_KEY_FIELDS)
+    wf_line = _fmt(ctx.get("workflow_fields", []), _WORKFLOW_KEY_FIELDS)
+    blob_line = _fmt(ctx.get("blob_fields", []), _BLOB_KEY_FIELDS)
+
+    if task_line and wf_line and blob_line:
+        return f"Key task fields: {task_line}.\nKey workflow fields: {wf_line}.\nKey object fields: {blob_line}."
+
+    # fallback when SCHEMA_CONTEXT is not yet populated — derived from the key-field sets
+    def _static(key_set):
+        return ", ".join(f"`{n}`" for n in sorted(key_set))
+
+    return (
+        f"Key task fields: {_static(_TASK_KEY_FIELDS)}.\n"
+        f"Key workflow fields: {_static(_WORKFLOW_KEY_FIELDS)}.\n"
+        f"Key object fields: {_static(_BLOB_KEY_FIELDS)}."
+    )
+
+
+def build_chat_system_prompt(context: Optional[Dict[str, Any]] = None) -> str:
+    """Build the system prompt for the webservice provenance chat."""
+    context = dict(context or {})
+    workflow_schema_context = context.pop("workflow_schema_context", None)
+    schema_section = _build_schema_section()
+    prompt = (
+        "You are the Flowcept provenance assistant, embedded in Flowcept's web UI.\n"
+        "Flowcept captures workflow provenance: campaigns group workflows; workflows contain tasks;\n"
+        "tasks record used (inputs), generated (outputs), status, timings, telemetry, and host info;\n"
+        "data objects (versioned binary artifacts) are stored separately with an object_type label.\n\n"
+        + schema_section
+        + "\n\n"
+    )
+    prompt += """You have tools to query this data. Rules:
 - Use the tools to answer data questions; never invent values. Quote real numbers from results.
 - Filters are Mongo-style; allowed operators: $and $or $nor $not $exists $eq $ne $gt $gte $lt
-  $lte $in $nin $regex.
-- When the user context includes workflow_id/campaign_id, scope your queries with it.
+  $lte $in $nin $regex. Never use $options — for case-insensitive regex use the inline flag:
+  {"field": {"$regex": "(?i)pattern"}}.
+- When the user context includes workflow_id/campaign_id, ALWAYS scope your queries with it.
+- For campaigns: ALWAYS call list_campaigns to get campaign details including the human-readable
+  campaign name. Never answer a campaign question from context alone — the context only has IDs.
+- For workflows: when reporting any workflow result, ALWAYS include both the `workflow_id`
+  raw value and the `name` field value explicitly, using their field labels. For a single
+  result write: "workflow_id: <id>, name: <name>". For multiple results use a markdown
+  table with `workflow_id` and `name` as columns. Never omit either field.
+- When answering about workflow activities, lineage, or execution order, use only activity_id
+  values returned by provenance tools. MCP/chat tool names are not workflow activities unless
+  they explicitly appear as activity_id values in the returned provenance records.
+- For agents: list_agents returns {agent_id (UUID), name (human-readable), activities,
+  task_count}. ALWAYS refer to agents by their `name` field, not by agent_id UUID.
+
+  Two patterns — pick based on whether the question names a SPECIFIC item:
+
+  PATTERN A — Specific named value in task data (the user references a concrete task_id
+  or an identifier/value that appears in a task's used.* or generated.* fields): e.g.
+  "what inputs did the task that used <value> consume?", "which agent submitted the
+  task that processed <value>?", "what produced <value>?".
+    Use EXACTLY 3 tool calls — no shortcuts:
+    (1) Call get_task_summary scoped to the workflow_id to discover activity names.
+    (2) Call query_tasks scoped to the workflow_id. Do NOT filter by the specific value —
+        you do not know which used.* or generated.* field stores it. Include
+        projection=["task_id","activity_id","used","generated","agent_id","status"].
+        Inspect BOTH used.* and generated.* fields. If the value appears as generated
+        by one task and used by another, the generated-side task is the upstream
+        producer/submitter of that work item, while the used-side task consumed it.
+    (3) Call list_agents — MANDATORY for attribution. query_tasks returns raw agent_id UUIDs;
+        only list_agents maps them to human-readable agent names and shows which activities
+        each agent ran. Required even if step 2 task data answers the data part.
+    Write your final answer ONLY after all 3 calls complete. The stop-early rule does not
+    apply here — all 3 calls are always required for any Pattern A question.
+
+  PATTERN B — General attribution (no specific value named): e.g. "which agent submitted
+  the work items?", "which agent ran activity X?", "which agent and task submitted the
+  records?". The word "task" in the question does NOT require calling query_tasks —
+  list_agents shows which activities each agent ran.
+    Call list_agents only. Answer directly; do NOT call query_tasks.
+    If the user asks who "submitted work items for" an activity, answer with the
+    upstream agent activity that created/submitted work for that activity. Do not require
+    the target activity itself to have an agent_id; target activity execution and upstream
+    submission are different provenance roles.
+
 - Prefer get_task_summary for aggregate questions (counts, durations) over fetching all tasks.
+  When reporting task counts, your response MUST include each activity_id and its task count.
+  Reporting only "X tasks total" without the per-activity list is INCOMPLETE. Always format
+  as: "Activity A: N tasks, Activity B: M tasks, … Total: X tasks."
+- For data lineage and data flow questions ("complete lineage", "data lineage of",
+  "how did X influence Y?", "trace the lineage", "influence subsequent"):
+  Do NOT call highlight_lineage — it is a UI widget action only.
+  Do NOT call query_tasks — task-level details are not needed for lineage questions.
+  Use EXACTLY 2 tool calls — no more, no fewer:
+    (1) get_task_summary — to see all activities and their counts in the workflow.
+    (2) list_agents — to see which agent ran which activities.
+  Even if the question mentions "the best" or "the worst" task: do NOT search for a
+  specific task. All tasks of the same activity type share the same upstream lineage.
+  Write your final answer ONLY after BOTH calls complete. Do NOT call any additional
+  tools after these 2 calls — get_task_summary and list_agents are sufficient.
+  Describe the workflow using `activity_ids` / `activity_counts` returned by get_task_summary
+  and the agent/activity mapping returned by list_agents. For "complete lineage" or
+  execution-order questions, include every activity_id in `activity_ids`. Do not add activity
+  names that are not in those results.
+- highlight_lineage is ONLY for explicit UI highlight requests ("highlight in the graph",
+  "show lineage in the UI", "visually dim unrelated nodes in the graph").
+- When enumerating discrete parameter values (numeric values, category labels, IDs, etc.):
+  ALWAYS list ALL values explicitly rather than giving a range.
 - When asked for a chart/plot, call make_chart with a declarative chart spec:
   {"chart_id": "<short-id>", "type": "chart", "title": "...",
    "data": {"source": "tasks", "filter": {...}, "group_by": "<field>",
@@ -26,8 +158,15 @@
   two sentences.
 - To modify the user's dashboard (only when asked), call get_dashboard, then update_dashboard
   with the complete revised spec; explain what changed.
-- When the user asks to highlight, trace, show, or visualise the lineage/ancestors/descendants
-  of a task, ALWAYS call highlight_lineage. Pass task_ids directly when given, or use filter to
-  find the seed tasks first. The UI will visually dim all unrelated nodes in the Dataflow graph.
 - Be concise. Use markdown tables for tabular answers. State filters you used.
+- IMPORTANT: after you receive tool results sufficient to answer the question, write your
+  FINAL ANSWER immediately — UNLESS you are in Pattern A (query_tasks + list_agents) or a
+  lineage question (get_task_summary + list_agents), in which case BOTH calls are required
+  before writing your answer. Do NOT call more tools beyond the required set unless the
+  result was empty or returned an error code.
 """
+    if workflow_schema_context:
+        prompt += f"\nWorkflow-specific observed schema context:\n{workflow_schema_context}\n"
+    if context:
+        prompt += f"\nCurrent user context (scope queries with it): {json.dumps(context)}"
+    return prompt
diff --git a/src/flowcept/agents/prompts/db_query_prompts.py b/src/flowcept/agents/prompts/db_query_prompts.py
new file mode 100644
index 00000000..e0662700
--- /dev/null
+++ b/src/flowcept/agents/prompts/db_query_prompts.py
@@ -0,0 +1,103 @@
+# flake8: noqa: E501
+"""Prompt builders for database provenance queries.
+
+All functions are plain Python — no MCP framework imports.
+"""
+
+from flowcept.agents.provenance_schema_manager.static_schema_builder import SCHEMA_CONTEXT
+from flowcept.agents.prompts.schema_prompt_context import (
+    build_allowed_fields_prompt,
+    build_task_structure_prompt,
+)
+
+ALLOWED_FILTER_OPERATORS = frozenset(
+    {
+        "$and",
+        "$or",
+        "$nor",
+        "$not",
+        "$exists",
+        "$eq",
+        "$ne",
+        "$gt",
+        "$gte",
+        "$lt",
+        "$lte",
+        "$in",
+        "$nin",
+        "$regex",
+    }
+)
+
+
+def _build_task_field_list() -> str:
+    """Return a bullet list of valid task field names from SCHEMA_CONTEXT."""
+    fields = [f"`{f['name']}`" for f in SCHEMA_CONTEXT.get("task_fields", [])]
+    fields += [f"`telemetry_summary.{f['name']}`" for f in SCHEMA_CONTEXT.get("telemetry_summary_fields", [])]
+    return "\n".join(f"  - {name}" for name in fields) if fields else "  *(schema not yet loaded)*"
+
+
+def build_db_schema_context(
+    dynamic_schema: dict = None,
+    example_values: dict = None,
+    current_fields: list[str] = None,
+) -> str:
+    """Build shared schema context for database-backed query prompts."""
+    if current_fields:
+        context = build_allowed_fields_prompt(current_fields, target_name="database task records")
+        if dynamic_schema is not None:
+            context += build_task_structure_prompt(
+                dynamic_schema=dynamic_schema,
+                example_values=example_values or {},
+                current_fields=current_fields,
+                record_description="Each database task record represents one task.",
+            )
+        return context
+    return "## Valid field names\n" + _build_task_field_list()
+
+
+def build_db_filter_prompt(
+    query: str,
+    collection: str = "tasks",
+    dynamic_schema: dict = None,
+    example_values: dict = None,
+    current_fields: list[str] = None,
+) -> str:
+    """Build a prompt that asks an LLM to generate a Mongo-style filter JSON for a DB query.
+
+    Parameters
+    ----------
+    query : str
+        Natural language question to translate into a filter.
+    collection : str, optional
+        Target collection name ("tasks" or "workflows").
+
+    Returns
+    -------
+    str
+        Formatted prompt.
+    """
+    return f"""You are an expert in MongoDB query construction for workflow provenance data.
+The user wants to query the ``{collection}`` collection.
+
+## Valid filter operators
+Only these operators are allowed:
+{", ".join(sorted(ALLOWED_FILTER_OPERATORS))}
+
+{build_db_schema_context(dynamic_schema=dynamic_schema, example_values=example_values, current_fields=current_fields)}
+
+## Rules
+- Use only field names from the list above.
+- Use only operators from the allowlist.
+- Do NOT invent field names or operators.
+- Return only valid JSON — no markdown, no explanations.
+- For missing information, return an empty filter: {{}}
+- Date/time fields use Unix timestamps (seconds since epoch).
+
+## Output format
+Return a single JSON object (the filter). Example:
+{{"activity_id": "process_data", "telemetry_summary.duration_sec": {{"$gt": 60}}}}
+
+User query:
+{query}
+"""
diff --git a/src/flowcept/agents/prompts/df_query_prompts.py b/src/flowcept/agents/prompts/df_query_prompts.py
new file mode 100644
index 00000000..a861c71c
--- /dev/null
+++ b/src/flowcept/agents/prompts/df_query_prompts.py
@@ -0,0 +1,441 @@
+# flake8: noqa: E501
+"""Prompt builders for DF (DataFrame) chat query path.
+
+All functions are plain Python — no MCP framework decorators.
+The ``@mcp_flowcept.prompt()`` registration lives in ``prompts/mcp_prompts.py``.
+"""
+
+from flowcept.agents.prompts.schema_prompt_context import (
+    build_allowed_fields_prompt,
+    build_example_values_prompt,
+    build_task_structure_prompt,
+)
+
+
+def get_df_form(context_kind="tasks"):
+    """Return DataFrame context description string."""
+    if context_kind == "objects":
+        return "The user has a pandas DataFrame called `df`, created from flattened object metadata messages using `pd.json_normalize`."
+    return "The user has a pandas DataFrame called `df`, created from flattened task objects using `pd.json_normalize`."
+
+
+def build_current_df_columns_prompt(current_fields) -> str:
+    """Build the authoritative DataFrame field constraint."""
+    return (
+        build_allowed_fields_prompt(current_fields, target_name="df")
+        + '- If the query cannot be answered using ALLOWED_FIELDS, return exactly: result = "info not available"\n'
+    )
+
+
+def get_example_values_prompt(example_values):
+    """Return example values prompt string."""
+    return build_example_values_prompt(example_values)
+
+
+def get_object_schema_prompt(example_values, current_fields):
+    """Return schema prompt for object context."""
+    schema_prompt = """
+     ## DATAFRAME STRUCTURE
+
+        Each row in `df` represents one workflow object metadata message.
+
+        Important object fields:
+        - `object_type`: semantic object category, such as input_file, dataset, artifact, or ml_model.
+        - `type`: Flowcept message type. For object rows this is usually "object"; do not use it as the object category.
+        - `file_path`: object path when available.
+        - `workflow_id`: workflow associated with the object.
+        - `custom_metadata.*`: user-defined metadata (e.g. model_profile.params, n_samples, split_ratio).
+
+        ALWAYS CHECK THE ALLOWED_FIELDS list before proceeding.
+        ---
+    """
+    return schema_prompt + get_example_values_prompt(example_values)
+
+
+def get_df_schema_prompt(dynamic_schema, example_values, current_fields, context_kind="tasks"):
+    """Return the full DataFrame schema prompt."""
+    if context_kind == "objects":
+        return get_object_schema_prompt(example_values, current_fields)
+
+    return build_task_structure_prompt(
+        dynamic_schema=dynamic_schema,
+        example_values=example_values,
+        current_fields=current_fields,
+        record_description="Each row in `df` represents a single task.",
+    )
+
+
+def build_plot_code_prompt(query, dynamic_schema, example_values, current_fields, context_kind="tasks") -> str:
+    """Build a prompt for Streamlit chart code generation.
+
+    Parameters
+    ----------
+    query : str
+        Natural language query.
+    dynamic_schema : dict
+        DataFrame schema.
+    example_values : dict
+        Example values.
+    current_fields : list
+        Current DataFrame columns.
+    context_kind : str, optional
+        "tasks" or "objects".
+
+    Returns
+    -------
+    str
+        Formatted prompt.
+    """
+    return f"""
+        You are a Streamlit chart expert.
+        {get_df_form(context_kind)}
+
+        {get_df_schema_prompt(dynamic_schema, example_values, current_fields, context_kind=context_kind)}
+
+        ### 3. Guidelines
+
+        - When plotting from a grouped or aggregated result, set an appropriate column (like activity_id, started_at, etc.) as the index before plotting to ensure x-axis labels are correct.
+        - When aggregating by "activity_id", remember to include .set_index('activity_id') in your response.
+        - Prefer bar charts (`st.bar_chart`) when the x-axis has ≤10 discrete categories (e.g., category labels, discrete parameter values). Use line charts only for continuous/time-series data.
+
+        ### 4. Output Format
+
+        You must write Python code using Streamlit (st) to visualize the requested data.
+
+        - Always assume `df` is already defined.
+        - First, assign the query result to a variable called `result` using pandas.
+        - Then, write the plotting code based on `result`.
+        - Return a Python dictionary with three fields:
+          - `"result_code"`: the pandas code that assigns `result`
+          - `"plot_code"`: the code that creates the Streamlit plot
+          - `"description"`: a one-sentence natural-language caption. It MUST include:
+            (1) the chart type (e.g., "bar chart", "line chart"),
+            (2) the exact field names from result_code verbatim (e.g., "generated.output_field", "used.input_param"),
+            (3) the grouping/index column name,
+            (4) if discrete categories are involved, list them explicitly.
+        ---
+
+        ### 5. Few-Shot Examples
+
+        ```python
+        # Q: Plot the number of tasks by activity
+        {{
+          "result_code": "result = df['activity_id'].value_counts().reset_index().rename(columns={{'index': 'activity_id', 'activity_id': 'count'}})",
+          "plot_code": "st.bar_chart(result.set_index('activity_id'))",
+          "description": "A bar chart of task count by activity_id."
+        }}
+
+        # Q: Show a line chart of task duration per task start time
+        {{
+          "result_code": "result = df[['started_at', 'telemetry_summary.duration_sec']].dropna().set_index('started_at')",
+          "plot_code": "st.line_chart(result)",
+          "description": "A line chart of telemetry_summary.duration_sec over started_at."
+        }}
+
+        Your response must be ONLY a raw JSON object (no markdown fences, no prose), in this exact format:
+        {{"result_code": "<pandas code that assigns result>", "plot_code": "<Streamlit plotting code>", "description": "<one-sentence caption>"}}
+
+        User request:
+        {query}
+    """
+
+
+JOB = "You will generate a pandas dataframe code to solve the query."
+ROLE = """You are an expert in scientific and engineering workflow provenance data analysis with a deep knowledge of data lineage tracing, workflow management, and computing systems.
+            You are analyzing provenance data from a complex workflow consisting of numerous tasks."""
+OBJECT_ROLE = """You are an expert in scientific and engineering workflow provenance data analysis with a deep knowledge of data lineage tracing, workflow management, and computing systems.
+            You are analyzing object metadata records from a workflow provenance buffer."""
+QUERY_GUIDELINES = """
+
+    ### 3. Query Guidelines
+
+    - Use `df` as the base DataFrame.
+    - Use `activity_id` to filter by task type (valid values = schema keys).
+    - ONLY IF the ALLOWED_FIELDS list allow, use `used.` for parameters (inputs) and `generated.` for outputs (metrics).
+    - Use `telemetry_summary.duration_sec` for performance-related questions.
+    - Use `hostname` when user mentions *where* a task ran.
+    - Use `agent_id` when the user refers to agents (non-null means task was agent-run).
+
+    ### 4. Hard Constraints (obey strictly, YOUR LIFE DEPENDS ON THEM. DO NOT HALLUCINATE!!!)
+
+    - Always return code in the form `result = df[<filter>][[...]]` or `result = df.loc[<filter>, [...]]`
+     -**THERE ARE NOT INDIVIDUAL FIELDS NAMED `used` OR `generated`, they are ONLY are prefixes to the field names.**
+     - If the query needs fields that begin with `used.` or `generated.`, your generated query needs to iterate over the df.columns to select the used or generated fields only, such as (adapt when needed): `[col for col in df.columns if col.startswith('generated.')]` or `[col for col in df.columns if col.startswith('used.')]`
+     **THERE ABSOLUTELY ARE NO FIELDS NAMED `used` or `generated`. DO NOT, NEVER use the string 'used' or 'generated' in your generated code!!!**
+    **THE COLUMN 'used' DOES NOT EXIST**
+    **THE COLUMN 'generated' DOES NOT EXIST**
+    - **When filtering by `activity_id`, only select columns that belong to that activity's schema.**
+      - Always observing the ALLOWED_FIELDS list, use only `used.` and `generated.` fields listed in the schema for that `activity_id`.
+     - Explicitly list the selected columns — **never return all columns**
+    - **Only include telemetry columns if used in the query logic.**
+      -THERE IS NOT A FIELD NAMED `telemetry_summary.start_time` or `telemetry_summary.end_time`. Use `started_at` and `ended_at` instead.
+      -THE GENERATED FIELDS ARE LABELED AS SUCH: `generated.()` NOT `generated_output`.
+      -THERE IS NOT A FIELD NAMED `execution_id` or `used.execution_id`.
+      -DO NOT USE `nlargest` or `nsmallest` in the query code, use `sort_values` instead.
+      -WHEN user requests about workflow time, get its latest task's `ended_at` and its earliest task's `started_at` and compute the difference.
+      -WHEN user requests duration per task, utilize `telemetry_summary.duration_sec`.
+
+    If the query asks you to report which values appear in one or more columns, then:
+        For each relevant column, select that column from df, call .dropna(), then .unique() or .value_counts().
+
+    - **CRITICAL — list-valued columns**: NEVER call `.unique()` or `.value_counts()` directly on list-valued columns.
+      Always call `.explode()` first to flatten the lists into individual rows, then aggregate.
+
+    - **Do not include metadata columns unless explicitly required by the user query.**
+
+    - **For filter+aggregate queries** (e.g., "average X for items where Y > Z"): return a DataFrame showing every row that passed the filter (with its key identification columns like item_id or entity_id and the filtered field), not just a scalar aggregate. Include the aggregate as a new column or let the summary describe it.
+    - **For compound queries asking multiple questions in one sentence**: return a single DataFrame that captures all parts. NEVER return a Python list, tuple, or mixed-type collection. Instead build a structured DataFrame.
+    - **To count output fields per activity**: use `gen_cols = [c for c in df.columns if c.startswith('generated.')]` to get generated columns, then use `df.groupby('activity_id')[gen_cols].apply(lambda g: int(g.notna().sum().sum()))` to count the total number of non-null generated field values per activity (this accounts for how many tasks of each activity ran, so a task type that ran 5 times will rank higher than one that ran once even if each has the same number of fields).
+    - **For filter+aggregate queries**: ALWAYS include the primary identifier column(s) for the activity (e.g., any config, item, or entity ID from the schema) in the result DataFrame, so the reader can identify each row without relying on task_id.
+"""
+
+OBJECT_QUERY_GUIDELINES = """
+    ### 3. Query Guidelines
+
+    - Use `df` as the base DataFrame.
+    - Use `object_type` for object category questions.
+    - Use `file_path` for file path questions.
+    - Use `custom_metadata.*` fields for model/dataset metadata (check ALLOWED_FIELDS for available sub-fields).
+    - Use `workflow_id` when the query asks for workflow-specific objects.
+    - The column `type` is the Flowcept message type, not the object category.
+    - Explicitly list selected columns unless the user asks for all columns.
+"""
+
+FEW_SHOTS = """
+  ### 5. Few-Shot Examples
+
+    # Q: How many tasks were processed?
+    result = len(df)
+
+    # Q: How many tasks for each activity?
+    result = df['activity_id'].value_counts()
+
+"""
+
+OBJECT_FEW_SHOTS = """
+  ### 5. Few-Shot Examples
+
+    # Q: How many objects are available?
+    result = len(df)
+
+    # Q: List all distinct object types
+    result = df['object_type'].dropna().unique()
+
+"""
+
+OUTPUT_FORMATTING = """
+    6. Final Instructions
+    Return only valid pandas code assigned to the variable result.
+
+    Your response must be only the raw Python code in the format:
+        result = ...
+
+    For simple queries: one line is preferred.
+    For compound queries that require intermediate variables: use multiple lines (e.g., define gen_cols, per_act, etc., then assign result on the last line).
+
+    Do not include: Explanations, Markdown formatting, Triple backticks, Comments, or Any text before or after the code block.
+    The output cannot have any markdown, no ```python or ``` at all.
+
+    THE LAST LINE OF YOUR CODE MUST BE: result = ...
+
+    Strictly follow the constraints above.
+"""
+
+
+def build_pandas_code_prompt(
+    query: str, dynamic_schema, example_values, custom_user_guidances, current_fields, context_kind="tasks"
+) -> str:
+    """Build a pandas code generation prompt from a natural language query.
+
+    Parameters
+    ----------
+    query : str
+        Natural language query.
+    dynamic_schema : dict
+        DataFrame schema.
+    example_values : dict
+        Example values.
+    custom_user_guidances : list, optional
+        Custom guidance strings.
+    current_fields : list
+        Current DataFrame columns.
+    context_kind : str, optional
+        "tasks" or "objects".
+
+    Returns
+    -------
+    str
+        Formatted prompt.
+    """
+    if custom_user_guidances is not None and isinstance(custom_user_guidances, list) and len(custom_user_guidances):
+        concatenated_guidance = "\n".join(f"- {msg}" for msg in custom_user_guidances)
+        custom_user_guidance_prompt = (
+            f"You MUST consider the following guidance from the user:\n"
+            f"{concatenated_guidance}"
+            "------------------------------------------------------"
+        )
+    else:
+        custom_user_guidance_prompt = ""
+
+    curr_cols = build_current_df_columns_prompt(current_fields)
+    role = OBJECT_ROLE if context_kind == "objects" else ROLE
+    query_guidelines = OBJECT_QUERY_GUIDELINES if context_kind == "objects" else QUERY_GUIDELINES
+    few_shots = OBJECT_FEW_SHOTS if context_kind == "objects" else FEW_SHOTS
+    return (
+        f"{role}"
+        f"{JOB}"
+        f"{get_df_form(context_kind)}"
+        f"{curr_cols}"
+        f"{get_df_schema_prompt(dynamic_schema, example_values, current_fields, context_kind=context_kind)}"
+        f"{query_guidelines}"
+        f"{few_shots}"
+        f"{custom_user_guidance_prompt}"
+        f"{OUTPUT_FORMATTING}"
+        "User Query:"
+        f"{query}"
+    )
+
+
+def build_dataframe_summarizer_prompt(
+    code, reduced_df, dynamic_schema, example_values, query, current_fields, context_kind="tasks"
+) -> str:
+    """Build a prompt that asks the LLM to summarize a query result DataFrame.
+
+    Parameters
+    ----------
+    code : str
+        The pandas code that produced the result.
+    reduced_df : pandas.DataFrame
+        A reduced/sampled version of the result.
+    dynamic_schema : dict
+        DataFrame schema.
+    example_values : dict
+        Example values.
+    query : str
+        The original user query.
+    current_fields : list
+        Current DataFrame columns.
+    context_kind : str, optional
+        "tasks" or "objects".
+
+    Returns
+    -------
+    str
+        Formatted summarization prompt.
+    """
+    job = "You are a Workflow Provenance Specialist analyzing a DataFrame that was obtained to answer a query."
+
+    if "image" in reduced_df.columns:
+        reduced_df = reduced_df.drop(columns=["image"])
+
+    return f"""
+    {job}
+
+     Given:
+
+    **User Query**:
+    {query}
+
+    **Query_Code**:
+    {code}
+
+    **Reduced DataFrame `df` contents** (rows sampled from full result):
+    {reduced_df}
+
+    **Original df (before reduction) had this schema:
+    {get_df_schema_prompt(dynamic_schema, example_values, current_fields, context_kind=context_kind)}
+
+    Your task is to produce a concise English answer to the user query.
+
+    Mandatory requirements:
+    1. Mirror the user's exact vocabulary. If the query says "best", write "best" (not "highest" or "top").
+       If the query says "worst", write "worst" (not "lowest").
+    2. For queries that find an extremal result (best, worst, highest, lowest, max, min, first, last):
+       - Name the full set that was searched (e.g., "across all tasks of that activity_id" or "among all records returned").
+       - Describe the method: "found by sorting on [column name verbatim] in [ascending/descending] order".
+    3. For queries that filter by a condition:
+       - Explicitly enumerate every item that passed the filter with its relevant field values
+         (e.g., "item_a (field=value_a), item_b (field=value_b), and item_c (field=value_c)").
+       - Then state the aggregate result.
+    4. Always include column names verbatim using dot-notation (e.g., "generated.metric_a", "used.param_a").
+       When code uses wildcards like "generated.*", look up the actual field names from the schema
+       and enumerate key specific fields. Use the word "including" when listing output field names.
+
+    In the end, conclude by giving your concise answer as follows: **Response**: <YOUR ANSWER>
+
+    Note that the user should not know that this is a reduced dataframe.
+    Keep your response focused and complete.
+    """
+
+
+def extract_or_fix_json_code_prompt(raw_text) -> str:
+    """Build a prompt to extract or fix JSON from raw text.
+
+    Parameters
+    ----------
+    raw_text : str
+        Raw text possibly containing JSON.
+
+    Returns
+    -------
+    str
+        Formatted prompt.
+    """
+    return f"""
+    You are a JSON extractor and fixer.
+    You are given a raw message that may include explanations, markdown fences, or partial JSON.
+
+    Your task:
+    1. Check if the message contains a JSON object or array.
+    2. If it does, extract and fix the JSON if needed.
+    3. Ensure all keys and string values are properly quoted.
+    4. Return only valid, parseable JSON — no markdown, no explanations.
+
+    THE OUTPUT MUST BE A VALID JSON ONLY. DO NOT SAY ANYTHING ELSE.
+
+    User message:
+    {raw_text}
+    """
+
+
+def build_extract_or_fix_python_code_prompt(raw_text, current_fields, runtime_error: str = None) -> str:
+    """Build a prompt to extract or fix pandas code from raw text.
+
+    Parameters
+    ----------
+    raw_text : str
+        Raw text possibly containing Python code.
+    current_fields : list
+        Available DataFrame column names.
+    runtime_error : str, optional
+        Exception message from a previous execution attempt.  When provided,
+        the prompt explicitly asks the LLM to fix the runtime error.
+
+    Returns
+    -------
+    str
+        Formatted prompt.
+    """
+    error_section = (
+        f"\n    The code previously raised this runtime error — you MUST fix it:\n    {runtime_error}\n"
+        if runtime_error
+        else ""
+    )
+    return f"""
+    You are a Pandas DataFrame code extractor and fixer.
+    You are given a raw user message that may include explanations, markdown fences, or partial DataFrame code that queries a DataFrame `df`.
+{error_section}
+    Your task:
+    1. Check if the message contains a valid DataFrame code.
+    2. If it does, extract the code.
+    3. If there are any syntax errors, fix them.
+    4. Carefully analyze the list of columns in the query. The query must only use fields in this list:
+        ALLOWED_FIELDS = {current_fields}.
+       If there are fields not in this list, replace the fields to match according to the ALLOWED_FIELDS list.
+    5. Return only the corrected DataFrame query code — no explanations, no comments, no markdown.
+
+    ONCE AGAIN, ONLY PRODUCE THE PYTHON CODE. DO NOT SAY ANYTHING ELSE!
+
+    User message:
+    {raw_text}
+    """
diff --git a/src/flowcept/agents/prompts/general_prompts.py b/src/flowcept/agents/prompts/general_prompts.py
deleted file mode 100644
index 53e0afe5..00000000
--- a/src/flowcept/agents/prompts/general_prompts.py
+++ /dev/null
@@ -1,70 +0,0 @@
-# flake8: noqa: E501
-# flake8: noqa: D103
-
-from mcp.server.fastmcp.prompts import base
-
-BASE_ROLE = (
-    "You are a helpful assistant analyzing provenance data from a large-scale workflow composed of multiple tasks."
-)
-
-DATA_SCHEMA_PROMPT = (
-    "A task object has its provenance: input data is stored in the 'used' field, output in the 'generated' field. "
-    "Tasks sharing the same 'workflow_id' belong to the same workflow execution trace. "
-    "Pay attention to the 'tags' field, as it may indicate critical tasks. "
-    "The 'telemetry_summary' field reports CPU, disk, memory, and network usage, along with 'duration_sec'. "
-    "Task placement is stored in the 'hostname' field."
-)
-
-QUESTION_PROMPT = "I am particularly more interested in the following question: %QUESTION%."
-
-SMALL_TALK_PROMPT = "Act as a Workflow Provenance Specialist. I would like to interact with you, but please be concise and brief. This is my message:\n"
-
-ROUTING_PROMPT = (
-    "You are a routing assistant for a provenance AI agent. "
-    "Given the following user message, classify it into one of the following routes:\n"
-    "- small_talk: if it's casual conversation or some random word (e.g., 'hausdn', 'a', hello, how are you, what can you do, what's your name)\n"
-    "- in_context_query: if the user is querying the provenance data questions about tasks or data in running workflow (or a workflow that ran recently) or if the user mentions the in-memory 'df' or a dataframe. I expect that most of the interactions will fall in this category.\n"
-    "- plot: if user is requesting plots (e.g., plot, chart, visualize)\n"
-    # "- in_context_query: if the user asks questions about tasks or data in running workflow (or a workflow that ran recently) or if the user mentions the in-memory 'df' or a dataframe.\n"
-    # "- historical_prov_query: if the user wants to query historical provenance data\n"
-    "- in_chat_query: if the user appears to be asking about something that has said recently in this chat.\n"
-    "- in_context_query: if you don't know.\n"
-    "Respond with only the route label."
-    "User message is below:\n "
-)
-
-
-def get_question_prompt(question: str):
-    """Generates a user prompt with the given question filled in."""
-    return base.UserMessage(QUESTION_PROMPT.replace("%QUESTION%", question))
-
-
-SINGLE_TASK_PROMPT = {
-    "role": f"{BASE_ROLE} You are focusing now on a particular task object which I will provide below.",
-    "data_schema": DATA_SCHEMA_PROMPT,
-    "job": (
-        "Your job is to analyze this single task. Find any anomalies, relationships, or correlations between input,"
-        " output, resource usage metrics, task duration, and task placement. "
-        "Correlations involving 'used' vs 'generated' data are especially important. "
-        "So are relationships between (used or generated) data and resource metrics. "
-        "Highlight outliers or critical information and give actionable insights or recommendations. "
-        "Explain what this task may be doing, using the data provided."
-    ),
-}
-
-MULTITASK_PROMPTS = {
-    "role": BASE_ROLE,
-    "data_schema": DATA_SCHEMA_PROMPT,
-    "job": (
-        "Your job is to analyze a list of task objects to identify patterns across tasks, anomalies, relationships,"
-        " or correlations between inputs, outputs, resource usage, duration, and task placement. "
-        "Correlations involving 'used' vs 'generated' data are especially important. "
-        "So are relationships between (used or generated) data and resource metrics. "
-        "Try to infer the purpose of the workflow. "
-        "Highlight outliers or critical tasks and give actionable insights or recommendations. "
-        "Use the data provided to justify your analysis."
-    ),
-}
-
-BASE_SINGLETASK_PROMPT = [base.UserMessage(SINGLE_TASK_PROMPT[k]) for k in ("role", "data_schema", "job")]
-BASE_MULTITASK_PROMPT = [base.UserMessage(MULTITASK_PROMPTS[k]) for k in ("role", "data_schema", "job")]
diff --git a/src/flowcept/agents/prompts/in_memory_query_prompts.py b/src/flowcept/agents/prompts/in_memory_query_prompts.py
deleted file mode 100644
index c8cf2d9b..00000000
--- a/src/flowcept/agents/prompts/in_memory_query_prompts.py
+++ /dev/null
@@ -1,544 +0,0 @@
-# flake8: noqa: E501
-# flake8: noqa: D103
-from flowcept.agents.flowcept_ctx_manager import EMPTY_DF_MESSAGE, get_df_context, mcp_flowcept
-
-
-def generate_common_task_fields(current_fields):
-    # TODO: make this better
-    common_task_fields = """
-       | Column                        | Data Type | Description |
-       |-------------------------------|-------------|
-    """
-    common_task_fields += (
-        "| `workflow_id`                 | string | Workflow the task belongs to. Use this field when the query is asking about workflow execution |\n"
-        if "workflow_id" in current_fields
-        else ""
-    )
-    common_task_fields += (
-        "| `task_id`                     | string | Task identifier. |\n" if "task_id" in current_fields else ""
-    )
-    common_task_fields += (
-        "| `parent_task_id`              | string | A task may be directly linked to others. Use this field when the query asks for a task informed by (or associated with or linked to) other task.  |\n"
-        if "parent_task_id" in current_fields
-        else ""
-    )
-    common_task_fields += (
-        "| `activity_id`                 | string | Type of task (e.g., 'choose_option'). Use this for \"task type\" queries. One activity_id is linked to multiple task_ids. |\n"
-        if "activity_id" in current_fields
-        else ""
-    )
-    common_task_fields += (
-        "| `campaign_id`                 | string | A group of workflows. |\n"
-        if "campaign_id" in current_fields
-        else ""
-    )
-    common_task_fields += (
-        "| `hostname`                    | string | Compute node name. |\n" if "hostname" in current_fields else ""
-    )
-    common_task_fields += (
-        "| `agent_id`                    | string | Set if executed by an agent. |\n"
-        if "agent_id" in current_fields
-        else ""
-    )
-    common_task_fields += (
-        "| `started_at`                  | datetime64[ns, UTC] | Start time of a task. Always use this field when the query has any temporal reference related to the workflow execution, such as 'get the first 10 workflow executions' or 'the last workflow execution'. |\n"
-        if "started_at" in current_fields
-        else ""
-    )
-    common_task_fields += (
-        "| `ended_at`                    | datetime64[ns, UTC] | End time of a task. |\n"
-        if "ended_at" in current_fields
-        else ""
-    )
-    common_task_fields += (
-        "| `subtype`                     | string | Subtype of a task. |\n" if "subtype" in current_fields else ""
-    )
-    common_task_fields += (
-        "| `tags`                        | List[str] | List of descriptive tags. |\n"
-        if "tags" in current_fields
-        else ""
-    )
-    common_task_fields += (
-        "| `image`                       | blob | Raw binary data related to an image. |\n"
-        if "image" in current_fields
-        else ""
-    )
-    common_task_fields += (
-        "| `telemetry_summary.duration_sec` | float | Task duration (seconds). |\n"
-        if "telemetry_summary.duration_sec" in current_fields
-        else ""
-    )
-    common_task_fields += (
-        "| `telemetry_summary.cpu.percent_all_diff` | float | Difference in overall CPU utilization percentage across all cores between task end and start. |\n"
-        if "telemetry_summary.cpu.percent_all_diff" in current_fields
-        else ""
-    )
-    common_task_fields += (
-        "| `telemetry_summary.cpu.user_time_diff`   | float | Difference average per core CPU user time (seconds) between task start and end times. |\n"
-        if "telemetry_summary.cpu.user_time_diff" in current_fields
-        else ""
-    )
-    common_task_fields += (
-        "| `telemetry_summary.cpu.system_time_diff` | float | Difference in CPU system (kernel) time (seconds) used during the task execution. |\n"
-        if "telemetry_summary.cpu.system_time_diff" in current_fields
-        else ""
-    )
-    common_task_fields += (
-        "| `telemetry_summary.cpu.idle_time_diff`   | float | Difference in CPU idle time (seconds) during task end and start. |\n"
-        if "telemetry_summary.cpu.idle_time_diff" in current_fields
-        else ""
-    )
-
-    common_task_fields += "\n For any queries involving CPU, use fields that begin with telemetry_summary.cpu"
-
-    return common_task_fields
-
-
-def get_df_form(context_kind="tasks"):
-    if context_kind == "objects":
-        return "The user has a pandas DataFrame called `df`, created from flattened object metadata messages using `pd.json_normalize`."
-    return "The user has a pandas DataFrame called `df`, created from flattened task objects using `pd.json_normalize`."
-
-
-CURRENT_DF_COLUMNS_PROMPT = """
-### ABSOLUTE FIELD CONSTRAINT -- THIS IS CRITICAL
-
-The following list is the ONLY valid field names in df. Treat this as the schema:
-
-ALLOWED_FIELDS = [COLS]
-
-You MUST treat this list as authoritative.
-
-- You may only use fields names that appear EXACTLY (string match) in ALLOWED_FIELDS.
-- You are NOT allowed to create new field names by:
-  - adding or removing prefixes like "used." or "generated."
-  - combining words
-  - guessing.
-- If a field name is not in ALLOWED_FIELDS, you MUST NOT use it.
-- If the query cannot be answered using ALLOWED_FIELDS, return exactly: result = "info not available"
-"""
-
-
-def get_example_values_prompt(example_values):
-    values_prompt = f"""    
-           Now, this other dictionary below provides type (t), up to 3 example values (v), and, for lists, shape (s) and element type (et) for each field.
-           Field names do not include `used.` or `generated.` They represent the unprefixed form shared across roles. String values may be truncated if they exceed the length limit.
-           ```python
-           {example_values}
-           ```
-       """
-    return values_prompt
-
-
-def get_object_schema_prompt(example_values, current_fields):
-    schema_prompt = """
-     ## DATAFRAME STRUCTURE
-
-        Each row in `df` represents one workflow object metadata message.
-
-        Important object fields:
-        - `object_type`: semantic object category, such as input_file, dataset, artifact, or ml_model.
-        - `type`: Flowcept message type. For object rows this is usually "object"; do not use it as the object category.
-        - `object_size_bytes`: object payload size in bytes.
-        - `file_path`: object path when available.
-        - `workflow_id`: workflow associated with the object.
-
-        ALWAYS CHECK THE ALLOWED_FIELDS list before proceeding.
-        ---
-    """
-    return schema_prompt + get_example_values_prompt(example_values)
-
-
-def get_df_schema_prompt(dynamic_schema, example_values, current_fields, context_kind="tasks"):
-    if context_kind == "objects":
-        return get_object_schema_prompt(example_values, current_fields)
-
-    schema_prompt = f"""
-     ## DATAFRAME STRUCTURE
-
-        Each row in `df` represents a single task.
-
-        ### 1. Structured task fields:
-
-        - **in**: input parameters (columns starting with `used.`)
-        - **out**: output metrics/results (columns starting with `generated.`)
-       
-        The schema for these fields is defined in the dictionary below.
-        It maps each activity ID to its inputs (i) and outputs (o), using flattened field names that include `used.` or `generated.` prefixes to indicate the role the field played in the task. These names match the columns in the dataframe `df`.
-        
-        {dynamic_schema}
-        Use this schema and fields to understand what inputs and outputs are valid for each activity.
-        
-        IMPORTANT: The user might say used for outputs or generated for inputs, which might confuse you. Do not get tricked by the user.
-         Ignore the natural-language words "used" and "generated".
-            - The English phrase "used in the calculation" does NOT mean you must use a `used.` column.
-            - The English word "generated" in the question does NOT force you to use a `generated.` column either.
-
-         ALWAYS CHECK THE ALLOWED_FIELDS list before proceeding. THIS IS CRITICAL.
-                
-        ### 2. Additional fields for tasks:
-
-        {generate_common_task_fields(current_fields)}
-        ---
-    """
-
-    values_prompt = get_example_values_prompt(example_values)
-    # values_prompt = ""
-    prompt = schema_prompt + values_prompt
-    return prompt
-
-
-def generate_plot_code_prompt(query, dynamic_schema, example_values, current_fields, context_kind="tasks") -> str:
-    PLOT_PROMPT = f"""
-        You are a Streamlit chart expert.
-        {get_df_form(context_kind)}
-
-        {get_df_schema_prompt(dynamic_schema, example_values, current_fields, context_kind=context_kind)}
-        
-        ### 3. Guidelines
-
-        - When plotting from a grouped or aggregated result, set an appropriate column (like activity_id, started_at, etc.) as the index before plotting to ensure x-axis labels are correct.
-        - When aggregating by "activity_id", remember to include .set_index('activity_id') in your response. 
-
-        ### 4. Output Format
-
-        You must write Python code using Streamlit (st) to visualize the requested data.
-
-        - Always assume `df` is already defined.
-        - First, assign the query result to a variable called `result` using pandas.
-        - Then, write the plotting code based on `result`.
-        - Return a Python dictionary with two fields:
-          - `"result_code"`: the pandas code that assigns `result`
-          - `"plot_code"`: the code that creates the Streamlit plot
-        ---
-
-        ### 5. Few-Shot Examples
-
-        ```python
-        # Q: Plot the number of tasks by activity
-        {{
-          "result_code": "result = df['activity_id'].value_counts().reset_index().rename(columns={{'index': 'activity_id', 'activity_id': 'count'}})",
-          "plot_code": "st.bar_chart(result.set_index('activity_id'))"
-        }}
-
-        # Q: Show a line chart of task duration per task start time
-        {{
-          "result_code": "result = df[['started_at', 'telemetry_summary.duration_sec']].dropna().set_index('started_at')",
-          "plot_code": "st.line_chart(result)"
-        }}
-
-        # Q: Plot average scores for simulate_layer tasks
-        {{
-          "result_code": "result = df[df['activity_id'] == 'simulate_layer'][['generated.scores']].copy()\nresult['avg_score'] = result['generated.scores'].apply(lambda x: sum(eval(str(x))) / len(eval(str(x))) if x else 0)",
-          "plot_code": "st.bar_chart(result['avg_score'])"
-        }}
-
-        # Q: Plot histogram of planned controls count for choose_option
-        {{
-          "result_code": "result = df[df['activity_id'] == 'choose_option'][['used.planned_controls']].copy()\nresult['n_controls'] = result['used.planned_controls'].apply(lambda x: len(eval(str(x))) if x else 0)",
-          "plot_code": "import matplotlib.pyplot as plt\nplt.hist(result['n_controls'])\nst.pyplot(plt)"
-        }}
-
-        Your response must be only the raw Python code in the format:
-        result = ...
-        Except for the `result` variable, YOU MUST NEVER CREATE ANY OTHER VARIABLE. NEVER!  
-
-        User request:
-        {query}
-
-        
-
-    """
-    return PLOT_PROMPT
-
-
-JOB = "You will generate a pandas dataframe code to solve the query."
-ROLE = """You are an expert in HPC workflow provenance data analysis with a deep knowledge of data lineage tracing, workflow management, and computing systems. 
-            You are analyzing provenance data from a complex workflow consisting of numerous tasks."""
-OBJECT_ROLE = """You are an expert in HPC workflow provenance data analysis with a deep knowledge of data lineage tracing, workflow management, and computing systems.
-            You are analyzing object metadata records from a workflow provenance buffer."""
-QUERY_GUIDELINES = """
-    
-    ### 3. Query Guidelines
-
-    - Use `df` as the base DataFrame.
-    - Use `activity_id` to filter by task type (valid values = schema keys).
-    - ONLY IF the ALLOWED_FIELDS list allow, use `used.` for parameters (inputs) and `generated.` for outputs (metrics).
-    - Use `telemetry_summary.duration_sec` for performance-related questions.
-    - Use `hostname` when user mentions *where* a task ran.
-    - Use `agent_id` when the user refers to agents (non-null means task was agent-run).
-
-    ### 4. Hard Constraints (obey strictly, YOUR LIFE DEPENDS ON THEM. DO NOT HALLUCINATE!!!)
-
-    - Always return code in the form `result = df[<filter>][[...]]` or `result = df.loc[<filter>, [...]]`
-     -**THERE ARE NOT INDIVIDUAL FIELDS NAMED `used` OR `generated`, they are ONLY are prefixes to the field names.** 
-     - If the query needs fields that begin with `used.` or `generated.`, your generated query needs to iterate over the df.columns to select the used or generated fields only, such as (adapt when needed): `[col for col in df.columns if col.startswith('generated.')]` or `[col for col in df.columns if col.startswith('used.')]`
-     **THERE ABSOLUTELY ARE NO FIELDS NAMED `used` or `generated`. DO NOT, NEVER use the string 'used' or 'generated' in your generated code!!!**  
-    **THE COLUMN 'used' DOES NOT EXIST**
-    **THE COLUMN 'generated' DOES NOT EXIST**
-    - **When filtering by `activity_id`, only select columns that belong to that activity’s schema.**
-      - Always observing the ALLOWED_FIELDS list, use only `used.` and `generated.` fields listed in the schema for that `activity_id`.
-     - Explicitly list the selected columns — **never return all columns**
-    - **Only include telemetry columns if used in the query logic.**
-      -THERE IS NOT A FIELD NAMED `telemetry_summary.start_time` or `telemetry_summary.end_time` or `used.start_time` or `used.end_time`. Use `started_at` and `ended_at` instead when you want to find the duration of a task, activity, or workflow execution.
-      -THE GENERATED FIELDS ARE LABELED AS SUCH: `generated.()` NOT `generated_output`. Any reference to `generated_output` is incorrect and should be replaced with `generated.` prefix.
-      -THERE IS NOT A FIELD NAMED `execution_id` or `used.execution_id`. Look at the QUERY to decide what correct _id field to use. Any mentions of workflow use `workflow_id`. Any mentions of task use `task_id`. Any mentions of activity use `activity_id`.
-      -DO NOT USE `nlargest` or `nsmallest` in the query code, use `sort_values` instead.
-      -An activity with a value in the `generated.` column created that value. Whereas an activity that has a value in the `used.` column used that value from another activity. IF THE `used.` and `generated.` fields share the same letter after the dot, that means that the activity associated with the `generated.` was created by another activity and the one with `used.` used that SAME value that was created by the activity with that same value in the `generated.` field.
-      -WHEN user requests about workflow time (e.g., total time or  duration" or elapsed time or total execution time or elapsed time or makespan about workflow executions or asking about workflows that took longer than a certain threshold or other workflow-related timing question of one or many workflow executions (each is identified by `workflow_id`), get its latest task's `ended_at` and its earliest task's `started_at`and compute the difference between them, like this (adapt when needed): `df.groupby('workflow_id').apply(lambda x: (x['ended_at'].max() - x['started_at'].min()).total_seconds())`
-      -WHEN user requests duration or execution time per task or for individual tasks, utilize `telemetry_summary.duration_sec`. 
-      -WHEN user requests execution time per activity within workflows compute durations using the difference between the last `ended_at` and the first `started_at` grouping by activitiy_id, workflow_id rather than using `telemetry_summary.duration_sec`.
-      
-      -The first (or the earliest) workflow execution is the one that has the task with earliest `started_at`, so you need to sort the DataFrame based on `started_at` to get the associated workflow_id.
-      -The last (or the latest or the most recent) workflow execution is the one that has the task with the latest `ended_at`, so you need to sort the DataFrame based on `ended_at` to get the associated workflow_id.
-      - Use this to select the tasks in the first workflow (or in the earliest workflow): df[df.workflow_id == df.loc[df.started_at.idxmin(), 'workflow_id']]
-      - Use this to select the tasks in the last workflow (or in the latest workflow or in the most recent workflow or the workflow that started or ended most recently): df[df.workflow_id == df.loc[df.ended_at.idxmax(), 'workflow_id']]
-      -WHEN the user requests the "first workflow" (or earliest workflow), you must identify the workflow by using workflow_id of the task with the earliest started_at. DO NOT use the min workflow_id.
-      -WHEN the user requests the "last workflow" (or latest workflow or most recent workflow), you must identify the workflow by using workflow_id of the task with the latest `ended_at`. DO NOT use the max workflow_id.
-      -Do not use  df['workflow_id'].max() or  df['workflow_id'].min() to find the first or last workflow execution.
-      
-      -To select the first (or earliest) N workflow executions, use or adapt the following: `df.groupby('workflow_id', as_index=False).agg({{"started_at": 'min'}}).sort_values(by='started_at', ascending=True).head(N)['workflow_id']` - utilize `started_at` to sort!     
-      -To select the last (or latest or most recent) N workflow executions, use or adapt the following: `df.groupby('workflow_id', as_index=False).agg({{"ended_at": 'max'}}).sort_values(by='ended_at', ascending=False).head(N)['workflow_id']` - utilize `ended_at` to sort!
-      
-      -If the user does not ask for a specific workflow run, do not use `workflow_id` in your query. 
-      -To select the first or earliest or initial tasks, use or adapt the following: `df.sort_values(by='started_at', ascending=True)`
-      -To select the last or final or most recent tasks, use or adapt the following: `df.sort_values(by='ended_at', ascending=False)`
-      
-      -If user explicitly asks to display or show all columns or fields, do not project on any particular field or column. Just show all of them.
-      
-      -WHEN the user requests a "summary" of activities, you must incorporate relevant summary statistics such as min, max, and mean, into the code you generate.
-      -Do NOT use df[0] or df[integer value] or df[df[<field name>].idxmax()] or df[df[<field name>].idxmin()] because these are obviously not valid Pandas Code!
-      -**Do NOT use any of those: df[df['started_at'].idxmax()], df[df['started_at'].idxmin()], df[df['ended_at'].idxmin()], df[df['ended_at'].idxmax()]. Those are not valid Pandas Code.**
-      - When the query mentions "each task", or "each activity", or "each workflow", make sure you show (project) the correct id column in the results (i.e., respectively: `task_id`, `activity_id`, `workflow_id`) to identify those in the results. 
-      - Use df[<role>.field_name] == True or df[<role>.field_name] == False when user queries boolean fields, where <role> is either used or generated, depending on the field name. Make sure field_name is a valid field in the DataFrame.  
-    
-    If the query asks you to report which values appear in one or more columns
-        (for example “which X were used”, “list all Y”, “what X and Y were generated”), then:
-
-            For each relevant column, select that column from df.
-            Call .dropna() on that column to remove missing values.
-            After dropping NaNs, apply .unique(), .value_counts(), or any other aggregation as needed.
-            Select that column.
-            Call .dropna() on it.
-            Then call .unique(), .value_counts(), or any other aggregation.
-
-    - **CRITICAL — list-valued columns**: Some columns store Python lists as cell values
-      (identifiable in the schema by element type `et` or shape `s`, e.g. `used.plant_ids`).
-      NEVER call `.unique()` or `.value_counts()` directly on these — it raises “unhashable type: list”.
-      Always call `.explode()` first to flatten the lists into individual rows, then aggregate:
-        result = df['used.plant_ids'].dropna().explode().unique()
-
-    - **Do not include metadata columns unless explicitly required by the user query.**
-"""
-
-FEW_SHOTS = """
-  ### 5. Few-Shot Examples
-
-    # Q: How many tasks were processed?
-    result = len(df)) 
-
-    # Q: How many tasks for each activity?
-    result = df['activity_id'].value_counts()
-
-"""
-OBJECT_QUERY_GUIDELINES = """
-    ### 3. Query Guidelines
-
-    - Use `df` as the base DataFrame.
-    - Use `object_type` for object category questions.
-    - Use `object_size_bytes` for object size questions.
-    - Use `file_path` for file path questions.
-    - Use `workflow_id` when the query asks for workflow-specific objects.
-    - The column `type` is the Flowcept message type, not the object category.
-    - Explicitly list selected columns unless the user asks for all columns.
-"""
-OBJECT_FEW_SHOTS = """
-  ### 5. Few-Shot Examples
-
-    # Q: How many objects are available?
-    result = len(df)
-
-    # Q: List all input files larger than 100 MB
-    result = df[(df['object_type'] == 'input_file') & (df['object_size_bytes'] > 100 * 1000 * 1000)][['workflow_id', 'file_path', 'object_size_bytes']]
-
-"""
-# # Q: What is the average loss across all tasks?
-# result = df['generated.loss'].mean()
-#
-# # Q: select the 'choose_option' tasks executed by the agent, and show the planned controls, generated option, scores, explanations
-# result = df[(df['activity_id'] == 'choose_option') & (df['agent_id'].notna())][
-#     ['used.planned_controls', 'generated.option', 'used.scores.scores', 'generated.explanation']].copy()
-#
-# # Q: Show duration and generated scores for 'simulate_layer' tasks
-# result = df[df['activity_id'] == 'simulate_layer'][['telemetry_summary.duration_sec', 'generated.scores']]
-
-OUTPUT_FORMATTING = """
-    6. Final Instructions
-    Return only valid pandas code assigned to the variable result.
-
-    Your response must be only the raw Python code in the format:
-        result = ...
-
-    Do not include: Explanations, Markdown formatting, Triple backticks, Comments, or Any text before or after the code block.
-    The output cannot have any markdown, no ```python or ``` at all. 
-
-    THE OUTPUT MUST BE ONE LINE OF VALID PYTHON CODE ONLY, DO NOT SAY ANYTHING ELSE.
-
-    Strictly follow the constraints above.
-"""
-
-
-def generate_pandas_code_prompt(
-    query: str, dynamic_schema, example_values, custom_user_guidances, current_fields, context_kind="tasks"
-):
-    if custom_user_guidances is not None and isinstance(custom_user_guidances, list) and len(custom_user_guidances):
-        concatenated_guidance = "\n".join(f"- {msg}" for msg in custom_user_guidances)
-        custom_user_guidance_prompt = (
-            f"You MUST consider the following guidance from the user:\n"
-            f"{concatenated_guidance}"
-            "------------------------------------------------------"
-        )
-    else:
-        custom_user_guidance_prompt = ""
-
-    curr_cols = CURRENT_DF_COLUMNS_PROMPT.replace("[COLS]", str(current_fields))
-    role = OBJECT_ROLE if context_kind == "objects" else ROLE
-    query_guidelines = OBJECT_QUERY_GUIDELINES if context_kind == "objects" else QUERY_GUIDELINES
-    few_shots = OBJECT_FEW_SHOTS if context_kind == "objects" else FEW_SHOTS
-    prompt = (
-        f"{role}"
-        f"{JOB}"
-        f"{get_df_form(context_kind)}"
-        f"{curr_cols}"
-        f"{get_df_schema_prompt(dynamic_schema, example_values, current_fields, context_kind=context_kind)}"
-        f"{query_guidelines}"
-        f"{few_shots}"
-        f"{custom_user_guidance_prompt}"
-        f"{OUTPUT_FORMATTING}"
-        "User Query:"
-        f"{query}"
-    )
-    return prompt
-
-
-@mcp_flowcept.prompt(
-    name="build_df_query_prompt",
-    title="Build DataFrame Query Prompt",
-    description="Build prompt context for external LLM code generation over agent DataFrame context.",
-)
-def build_df_query_prompt(query: str, context_kind: str = "tasks") -> str:
-    """
-    Build the internal pandas-code generation prompt for external LLM orchestration.
-
-    Parameters
-    ----------
-    query : str
-        Natural language question to translate into pandas code.
-
-    Returns
-    -------
-    str
-        Prompt text to guide external LLM code generation.
-        Returns an explanatory message when there is no active DataFrame context.
-    """
-    df, schema, value_examples, custom_user_guidance = get_df_context(context_kind=context_kind)
-    if df is None or not len(df):
-        return EMPTY_DF_MESSAGE
-
-    current_fields = list(df.columns)
-    prompt = generate_pandas_code_prompt(
-        query,
-        schema,
-        value_examples,
-        custom_user_guidance,
-        current_fields,
-        context_kind=context_kind,
-    )
-    return prompt
-
-
-def dataframe_summarizer_context(
-    code, reduced_df, dynamic_schema, example_values, query, current_fields, context_kind="tasks"
-) -> str:
-    job = "You are a Workflow Provenance Specialist analyzing a DataFrame that was obtained to answer a query."
-
-    if "image" in reduced_df.columns:
-        reduced_df = reduced_df.drop(columns=["image"])
-
-    prompt = f"""
-    {job}
-    
-     Given:
-    
-    **User Query**:  
-    {query}
-    
-    **Query_Code**:  
-    {code}
-    
-    **Reduced DataFrame `df` contents** (rows sampled from full result):  
-    {reduced_df}
-    
-    **Original df (before reduction) had this schema:
-    {get_df_schema_prompt(dynamic_schema, example_values, current_fields, context_kind=context_kind)}
-    
-    Your task is to find a concise and direct answer as an English sentence to the user query.
-        
-    Only if the answer to the query is complex, provide more explanation by: 
-        1. Analyzing the DataFrame values and columns for any meaningful or notable information. 
-        2. Comparing the query_code with the data content to understand what the result represents. THIS IS A REDUCED DATAFRAME, the original dataframe, used to answer the query, may be much bigger. IT IS ALREADY KNOWN! Do not need to restate this.
-        3. If it makes sense, provide information beyond the recorded provenance, but state it clearly that you are inferring it.
-    
-    In the end, conclude by giving your concise answer as follows: **Response**: <YOUR ANSWER>
-
-    Note that the user should not know that this is a reduced dataframe. 
-    Keep your response short and focused.
-
-    """
-
-    return prompt
-
-
-def extract_or_fix_json_code_prompt(raw_text) -> str:
-    prompt = f"""
-    You are a JSON extractor and fixer.
-    You are given a raw message that may include explanations, markdown fences, or partial JSON.
-
-    Your task:
-    1. Check if the message contains a JSON object or array.
-    2. If it does, extract and fix the JSON if needed.
-    3. Ensure all keys and string values are properly quoted.
-    4. Return only valid, parseable JSON — no markdown, no explanations.
-
-    THE OUTPUT MUST BE A VALID JSON ONLY. DO NOT SAY ANYTHING ELSE.
-
-    User message:
-    {raw_text}
-    """
-    return prompt
-
-
-def extract_or_fix_python_code_prompt(raw_text, current_fields):
-    prompt = f"""
-    You are a Pandas DataFrame code extractor and fixer. Pandas is a well-known data science Python library for querying datasets. 
-    You are given a raw user message that may include explanations, markdown fences, or partial DataFrame code that queries a DataFrame `df`.
-
-    Your task:
-    1. Check if the message contains a valid DataFrame code.
-    2. If it does, extract the code.
-    3. If there are any syntax errors, fix them.
-    4. Carefully analyze the list of columns in the query. The query must only use fields in this list:
-        ALLOWED_FIELDS = {current_fields}.
-       If there are fields not in this list, replace the fields to match according to the ALLOWED_FIELDS list.  
-    5. Return only the corrected DataFrame query code — no explanations, no comments, no markdown.
-
-    The output must be valid Python code, and must not include any other text.
-    Your output can only contain fields in the ALLOWED_FIELDS list.
-    This output will be parsed by another program.
-    
-    ONCE AGAIN, ONLY PRODUCE THE PYTHON CODE. DO NOT SAY ANYTHING ELSE!
-    
-    User message:
-    {raw_text}
-    """
-    return prompt
diff --git a/src/flowcept/agents/prompts/schema_prompt_context.py b/src/flowcept/agents/prompts/schema_prompt_context.py
new file mode 100644
index 00000000..bc7ea8aa
--- /dev/null
+++ b/src/flowcept/agents/prompts/schema_prompt_context.py
@@ -0,0 +1,88 @@
+# flake8: noqa: E501
+"""Shared schema prompt context for DB and runtime in-memory query paths."""
+
+from typing import Any
+
+from flowcept.agents.provenance_schema_manager.static_schema_builder import SCHEMA_CONTEXT
+
+
+def build_allowed_fields_prompt(current_fields: list[str], target_name: str = "records") -> str:
+    """Build the authoritative allowed-field constraint shared by query prompts."""
+    return f"""
+### ABSOLUTE FIELD CONSTRAINT -- THIS IS CRITICAL
+
+The following list is the ONLY valid field names in {target_name}. Treat this as the schema:
+
+ALLOWED_FIELDS = {current_fields}
+
+You MUST treat this list as authoritative.
+
+- You may only use field names that appear EXACTLY (string match) in ALLOWED_FIELDS.
+- You are NOT allowed to create new field names by:
+  - adding or removing prefixes like "used." or "generated."
+  - combining words
+  - guessing.
+- If a field name is not in ALLOWED_FIELDS, you MUST NOT use it.
+"""
+
+
+def build_example_values_prompt(example_values: dict[str, Any]) -> str:
+    """Build a domain-neutral example-value context block."""
+    return f"""
+Now, this dictionary provides type (t), up to 3 example values (v), and, for lists, shape (s) and element type (et) for each field.
+Field names do not include `used.` or `generated.`. They represent the unprefixed form shared across roles. String values may be truncated if they exceed the length limit.
+```python
+{example_values}
+```
+"""
+
+
+def build_task_static_field_table(current_fields: list[str]) -> str:
+    """Build a markdown table of documented static task fields filtered to current fields."""
+    rows = [
+        "   | Column                        | Data Type | Description |",
+        "   |-------------------------------|-----------|-------------|",
+    ]
+    for field in SCHEMA_CONTEXT.get("task_fields", []):
+        if field["name"] in current_fields:
+            rows.append(f"   | `{field['name']:<30}` | {field['type']:<9} | {field['description']} |")
+    for field in SCHEMA_CONTEXT.get("telemetry_summary_fields", []):
+        full_name = f"telemetry_summary.{field['name']}"
+        if full_name in current_fields:
+            rows.append(f"   | `{full_name:<30}` | {field['type']:<9} | {field['description']} |")
+    if any(f.startswith("telemetry_summary.cpu") for f in current_fields):
+        rows.append("   \n For any queries involving CPU, use fields that begin with telemetry_summary.cpu")
+    return "\n".join(rows)
+
+
+def build_task_structure_prompt(
+    dynamic_schema: dict[str, Any],
+    example_values: dict[str, Any],
+    current_fields: list[str],
+    record_description: str,
+) -> str:
+    """Build shared task schema context from observed dynamic schema and static field docs."""
+    return f"""
+## TASK RECORD STRUCTURE
+
+{record_description}
+
+### 1. Structured task fields:
+
+- **in**: input parameters (fields starting with `used.`)
+- **out**: output metrics/results (fields starting with `generated.`)
+
+The schema below maps each activity ID to its inputs (i) and outputs (o), using flattened field names with `used.` or `generated.` prefixes. These names must match the allowed fields exactly.
+
+{dynamic_schema}
+
+Use this schema to understand what inputs and outputs are valid for each activity.
+
+IMPORTANT: The user might use natural-language words such as "used" or "generated" loosely. Do not infer field names from those words. Always check ALLOWED_FIELDS and the activity schema.
+
+### 2. Additional documented task fields:
+
+{build_task_static_field_table(current_fields)}
+---
+{build_example_values_prompt(example_values)}
+"""
diff --git a/src/flowcept/agents/prompts/workflow_query_prompts.py b/src/flowcept/agents/prompts/workflow_query_prompts.py
deleted file mode 100644
index ac22a90d..00000000
--- a/src/flowcept/agents/prompts/workflow_query_prompts.py
+++ /dev/null
@@ -1,119 +0,0 @@
-# flake8: noqa: E501
-"""Prompt builders for querying the active workflow message object."""
-
-from __future__ import annotations
-
-import json
-from typing import Any
-
-from flowcept.agents.flowcept_ctx_manager import mcp_flowcept
-
-
-EMPTY_WORKFLOW_MESSAGE = "Current workflow_msg_obj is empty or null."
-
-
-def _flatten_paths(value: Any, prefix: str = "") -> list[str]:
-    """Return dot paths for nested dict/list values."""
-    if isinstance(value, dict):
-        paths = []
-        for key, child in value.items():
-            child_prefix = f"{prefix}.{key}" if prefix else str(key)
-            paths.append(child_prefix)
-            paths.extend(_flatten_paths(child, child_prefix))
-        return paths
-    if isinstance(value, list):
-        paths = []
-        for idx, child in enumerate(value[:3]):
-            child_prefix = f"{prefix}.{idx}" if prefix else str(idx)
-            paths.append(child_prefix)
-            paths.extend(_flatten_paths(child, child_prefix))
-        return paths
-    return []
-
-
-def _example_values(workflow_msg_obj: dict, paths: list[str], limit: int = 60) -> dict:
-    examples = {}
-    for path in paths[:limit]:
-        value = _resolve_path(workflow_msg_obj, path)
-        if isinstance(value, (dict, list)):
-            continue
-        examples[path] = value
-    return examples
-
-
-def _resolve_path(value: Any, path: str) -> Any:
-    current = value
-    for part in path.split("."):
-        if isinstance(current, dict):
-            if part not in current:
-                raise KeyError(path)
-            current = current[part]
-        elif isinstance(current, list):
-            current = current[int(part)]
-        else:
-            raise KeyError(path)
-    return current
-
-
-def generate_workflow_query_prompt(query: str, workflow_msg_obj: dict, custom_user_guidance=None) -> str:
-    """Build an LLM prompt that maps a free-text workflow question to field paths."""
-    paths = _flatten_paths(workflow_msg_obj)
-    examples = _example_values(workflow_msg_obj, paths)
-    guidance = ""
-    if custom_user_guidance:
-        guidance = "\n".join(f"- {msg}" for msg in custom_user_guidance)
-        guidance = f"\nUser guidance:\n{guidance}\n"
-
-    return f"""
-You are an expert in workflow provenance metadata.
-The user has a JSON workflow message object called `workflow_msg_obj`.
-Your job is to translate a free-text question into a strict JSON query spec.
-
-AUTHORITATIVE FIELD PATHS:
-{json.dumps(paths, indent=2, default=str)}
-
-EXAMPLE SCALAR VALUES:
-{json.dumps(examples, indent=2, default=str)}
-{guidance}
-
-Rules:
-- Use only field paths from AUTHORITATIVE FIELD PATHS.
-- Never invent fields or values.
-- If the requested information is absent, include it under `missing`.
-- For workflow description questions, use only an explicit description-like field if present. If none exists, mark it missing.
-- Return only JSON. No markdown, no explanation.
-
-Output format:
-{{"field_paths": ["path.one", "path.two"], "missing": ["human-readable missing item"], "answer_style": "short"}}
-
-Examples:
-Q: what's the workflow name?
-{{"field_paths": ["name"], "missing": [], "answer_style": "short"}}
-
-Q: what was the settings path?
-{{"field_paths": ["conf.settings_path"], "missing": [], "answer_style": "short"}}
-
-Q: what's the workflow description?
-{{"field_paths": [], "missing": ["workflow description"], "answer_style": "short"}}
-
-Q: what hardware was used?
-{{"field_paths": ["machine_info"], "missing": [], "answer_style": "summary"}}
-
-User query:
-{query}
-"""
-
-
-@mcp_flowcept.prompt(
-    name="build_workflow_query_prompt",
-    title="Build Workflow Query Prompt",
-    description="Build prompt context for external LLM workflow-message field selection.",
-)
-def build_workflow_query_prompt(query: str) -> str:
-    """Build prompt context for external LLM workflow-message field selection."""
-    ctx = mcp_flowcept.get_context()
-    workflow_msg_obj = ctx.request_context.lifespan_context.workflow_msg_obj
-    if not workflow_msg_obj:
-        return EMPTY_WORKFLOW_MESSAGE
-    custom_user_guidance = ctx.request_context.lifespan_context.custom_guidance
-    return generate_workflow_query_prompt(query, workflow_msg_obj, custom_user_guidance)
diff --git a/src/flowcept/agents/provenance_schema_manager/__init__.py b/src/flowcept/agents/provenance_schema_manager/__init__.py
new file mode 100644
index 00000000..30f2a5d9
--- /dev/null
+++ b/src/flowcept/agents/provenance_schema_manager/__init__.py
@@ -0,0 +1 @@
+"""Schema builders and trackers for Flowcept agent provenance prompts."""
diff --git a/src/flowcept/agents/provenance_schema_manager/context_schema_manager.py b/src/flowcept/agents/provenance_schema_manager/context_schema_manager.py
new file mode 100644
index 00000000..b215d46a
--- /dev/null
+++ b/src/flowcept/agents/provenance_schema_manager/context_schema_manager.py
@@ -0,0 +1,122 @@
+"""Schema management for the MCP agent context.
+
+Owns the per-task, per-object, and per-workflow DynamicSchemaTracker instances
+and all methods that update them or the corresponding DataFrames in context.
+"""
+
+from __future__ import annotations
+
+from typing import Dict, List
+
+import pandas as pd
+
+from flowcept.agents.provenance_schema_manager.dynamic_schema_tracker import DynamicSchemaTracker
+from flowcept.commons.flowcept_logger import FlowceptLogger
+
+
+def _to_context_df(records: List[Dict]) -> pd.DataFrame:
+    """Normalize a list of record dicts into a DataFrame, converting list cells to tuples."""
+    _df = pd.json_normalize(records)
+    for col in _df.columns:
+        if _df[col].apply(lambda v: isinstance(v, list)).any():
+            _df[col] = _df[col].apply(lambda v: tuple(v) if isinstance(v, list) else v)
+    return pd.DataFrame(_df)
+
+
+class ContextSchemaManager:
+    """Manages DynamicSchemaTracker instances and DataFrame updates for the MCP agent context.
+
+    Parameters
+    ----------
+    context :
+        The live ``FlowceptAppContext`` whose schema/df fields are updated in place.
+    tracker_config :
+        Keyword args forwarded to every ``DynamicSchemaTracker`` constructor
+        (e.g. ``max_examples``, ``max_str_len``).
+    """
+
+    def __init__(self, context, tracker_config: Dict):
+        self.logger = FlowceptLogger()
+        self._context = context
+        self._tracker_config = tracker_config
+        self._reset_trackers()
+
+    def reset(self):
+        """Reset all trackers to a clean state (called when agent context is reset)."""
+        self._reset_trackers()
+
+    def _reset_trackers(self):
+        self.schema_tracker = DynamicSchemaTracker(**self._tracker_config)
+        self.objects_schema_tracker = DynamicSchemaTracker(**self._tracker_config)
+        self.workflow_schema_trackers: Dict = {}
+
+    def update_schema_and_add_to_df(self, tasks: List[Dict]):
+        """Update the task schema tracker and append normalised rows to the context DataFrame."""
+        self.schema_tracker.update_with_tasks(tasks)
+        self._context.tasks_schema = self.schema_tracker.get_schema()
+        self._context.value_examples = self.schema_tracker.get_example_values()
+
+        _df = _to_context_df(tasks)
+        self._context.df = pd.concat([self._context.df, _df], ignore_index=True)
+
+    def update_objects_schema_and_add_to_df(self, objects: List[Dict]):
+        """Update the object schema tracker and append normalised rows to the objects DataFrame."""
+        self.objects_schema_tracker.update_with_tasks(objects)
+        self._context.objects_schema = self.objects_schema_tracker.get_schema()
+        self._context.objects_value_examples = self.objects_schema_tracker.get_example_values()
+
+        _df = _to_context_df(objects)
+        self._context.objects_df = pd.concat([self._context.objects_df, _df], ignore_index=True)
+
+    def update_workflow_schema_cache(self, tasks: List[Dict]):
+        """Update per-workflow dynamic schema snapshots from a batch of task records."""
+        by_workflow: Dict[str, List[Dict]] = {}
+        for task in tasks:
+            workflow_id = task.get("workflow_id")
+            if workflow_id:
+                by_workflow.setdefault(workflow_id, []).append(task)
+
+        for workflow_id, workflow_tasks in by_workflow.items():
+            tracker = self.workflow_schema_trackers.setdefault(
+                workflow_id,
+                DynamicSchemaTracker(**self._tracker_config),
+            )
+            tracker.update_with_tasks(workflow_tasks)
+            _df = _to_context_df(workflow_tasks)
+            existing = self._context.workflow_schema_cache.get(workflow_id, {}).get("current_fields", [])
+            current_fields = sorted(set(existing) | set(_df.columns))
+            self._context.workflow_schema_cache[workflow_id] = {
+                "dynamic_schema": tracker.get_schema(),
+                "value_examples": tracker.get_example_values(),
+                "current_fields": current_fields,
+            }
+
+    def get_workflow_schema_snapshot(self, workflow_id: str):
+        """Return the cached schema snapshot for a workflow, loading from DB on cache miss."""
+        if not workflow_id:
+            return None
+        if workflow_id in self._context.workflow_schema_cache:
+            return self._context.workflow_schema_cache[workflow_id]
+        try:
+            from flowcept.flowcept_api.db_api import DBAPI
+
+            snapshot = DBAPI().get_workflow_domain_data_schema(workflow_id)
+        except Exception as e:
+            self.logger.exception(e)
+            snapshot = None
+        if snapshot:
+            self._context.workflow_schema_cache[workflow_id] = snapshot
+        return snapshot
+
+    def persist_workflow_schema_snapshot(self, workflow_id: str) -> bool:
+        """Persist the cached workflow schema snapshot into workflow metadata."""
+        snapshot = self.get_workflow_schema_snapshot(workflow_id)
+        if not snapshot:
+            return False
+        try:
+            from flowcept.flowcept_api.db_api import DBAPI
+
+            return DBAPI().save_workflow_domain_data_schema(workflow_id, snapshot)
+        except Exception as e:
+            self.logger.exception(e)
+            return False
diff --git a/src/flowcept/agents/dynamic_schema_tracker.py b/src/flowcept/agents/provenance_schema_manager/dynamic_schema_tracker.py
similarity index 100%
rename from src/flowcept/agents/dynamic_schema_tracker.py
rename to src/flowcept/agents/provenance_schema_manager/dynamic_schema_tracker.py
diff --git a/src/flowcept/agents/provenance_schema_manager/static_schema_builder.py b/src/flowcept/agents/provenance_schema_manager/static_schema_builder.py
new file mode 100644
index 00000000..e9eee3e3
--- /dev/null
+++ b/src/flowcept/agents/provenance_schema_manager/static_schema_builder.py
@@ -0,0 +1,189 @@
+"""Schema introspection utility for building prompt context from class attribute docstrings.
+
+Called once at MCP server startup. Never imported by producer-path code.
+"""
+
+import ast
+import inspect
+import textwrap
+from typing import Any
+
+
+class SchemaDocumentationError(Exception):
+    """Raised at MCP server startup when a domain class has undocumented fields."""
+
+
+def get_attribute_docstrings(cls: type) -> dict[str, str]:
+    """Extract attribute docstrings from a class via AST parsing.
+
+    Reads the source of ``cls`` and walks its class body looking for annotated
+    assignments (``AnnAssign``) immediately followed by a string literal
+    (``Expr(Constant(str))``), which is the Python attribute-docstring convention.
+
+    Parameters
+    ----------
+    cls : type
+        The class to introspect.
+
+    Returns
+    -------
+    dict[str, str]
+        Mapping of field name to its docstring. Fields without a following
+        string literal are not included.
+    """
+    try:
+        source = textwrap.dedent(inspect.getsource(cls))
+        tree = ast.parse(source)
+    except (OSError, TypeError, IndentationError):
+        return {}
+
+    class_def = next(
+        (n for n in ast.walk(tree) if isinstance(n, ast.ClassDef) and n.name == cls.__name__),
+        None,
+    )
+    if class_def is None:
+        return {}
+
+    docs: dict[str, str] = {}
+    body = class_def.body
+    for i, node in enumerate(body):
+        if not (isinstance(node, ast.AnnAssign) and isinstance(node.target, ast.Name)):
+            continue
+        if i + 1 >= len(body):
+            continue
+        next_node = body[i + 1]
+        if (
+            isinstance(next_node, ast.Expr)
+            and isinstance(next_node.value, ast.Constant)
+            and isinstance(next_node.value.value, str)
+        ):
+            docs[node.target.id] = next_node.value.value.strip()
+    return docs
+
+
+def assert_schema_documented(*classes: type) -> None:
+    """Assert every non-private annotated field on each class has an attribute docstring.
+
+    Called at MCP server startup. Raises ``SchemaDocumentationError`` loudly so
+    the server refuses to start when any field is undocumented. Treat a startup
+    failure here as a bug: add the missing attribute docstring to the class.
+
+    Parameters
+    ----------
+    *classes : type
+        Domain classes to check (e.g. TaskObject, TelemetrySummary).
+
+    Raises
+    ------
+    SchemaDocumentationError
+        If any class has fields without attribute docstrings.
+    """
+    errors: list[str] = []
+    for cls in classes:
+        annotations = {
+            name: hint for name, hint in getattr(cls, "__annotations__", {}).items() if not name.startswith("_")
+        }
+        if not annotations:
+            continue
+        docs = get_attribute_docstrings(cls)
+        missing = [name for name in annotations if name not in docs]
+        if missing:
+            errors.append(f"  {cls.__qualname__}: {missing}")
+
+    if errors:
+        raise SchemaDocumentationError(
+            "MCP server cannot start — the following fields are missing attribute docstrings.\n"
+            "Add a triple-quoted string immediately after each field declaration:\n\n"
+            + "\n".join(errors)
+            + "\n\nExample:\n"
+            "    my_field: str = None\n"
+            '    """Description of my_field."""\n'
+        )
+
+
+def _build_field_table(cls: type, subclasses: dict[str, type] | None = None) -> list[dict[str, Any]]:
+    """Build a list of field descriptors for a class, expanding known subclasses.
+
+    Parameters
+    ----------
+    cls : type
+        The class to describe.
+    subclasses : dict[str, type], optional
+        Mapping of field name to its nested class, used to expand composite fields
+        (e.g. ``{"cpu": CpuSummary}``).
+
+    Returns
+    -------
+    list[dict]
+        Each entry has ``name``, ``type``, and ``description``. Nested fields
+        use dot-notation names (e.g. ``cpu.percent_all_diff``).
+    """
+    docs = get_attribute_docstrings(cls)
+    annotations = {name: hint for name, hint in getattr(cls, "__annotations__", {}).items() if not name.startswith("_")}
+    rows: list[dict[str, Any]] = []
+    for name, hint in annotations.items():
+        doc = docs.get(name, "")
+        type_str = getattr(hint, "__name__", str(hint))
+        if subclasses and name in subclasses:
+            sub_cls = subclasses[name]
+            sub_docs = get_attribute_docstrings(sub_cls)
+            sub_annotations = {
+                n: h for n, h in getattr(sub_cls, "__annotations__", {}).items() if not n.startswith("_")
+            }
+            for sub_name, sub_hint in sub_annotations.items():
+                rows.append(
+                    {
+                        "name": f"{name}.{sub_name}",
+                        "type": getattr(sub_hint, "__name__", str(sub_hint)),
+                        "description": sub_docs.get(sub_name, ""),
+                    }
+                )
+        else:
+            rows.append({"name": name, "type": type_str, "description": doc})
+    return rows
+
+
+def build_schema_context() -> dict[str, list[dict[str, Any]]]:
+    """Build the full static schema context at MCP server startup.
+
+    Introspects domain classes to produce field tables used by prompt builders.
+    The result is cached as ``SCHEMA_CONTEXT`` at module level — call this once.
+
+    Returns
+    -------
+    dict
+        Keys: ``task_fields``, ``workflow_fields``, ``agent_fields``,
+        ``blob_fields``, ``telemetry_summary_fields``.
+        Each value is a list of ``{name, type, description}`` dicts.
+    """
+    from flowcept.commons.flowcept_dataclasses.task_object import TaskObject
+    from flowcept.commons.flowcept_dataclasses.workflow_object import WorkflowObject
+    from flowcept.commons.flowcept_dataclasses.agent_object import AgentObject
+    from flowcept.commons.flowcept_dataclasses.blob_object import BlobObject
+    from flowcept.commons.task_data_preprocess import (
+        TelemetrySummary,
+        CpuSummary,
+        MemorySummary,
+        DiskSummary,
+        NetworkSummary,
+    )
+
+    telemetry_subclasses = {
+        "cpu": CpuSummary,
+        "memory": MemorySummary,
+        "disk": DiskSummary,
+        "network": NetworkSummary,
+    }
+
+    return {
+        "task_fields": _build_field_table(TaskObject),
+        "workflow_fields": _build_field_table(WorkflowObject),
+        "agent_fields": _build_field_table(AgentObject),
+        "blob_fields": _build_field_table(BlobObject),
+        "telemetry_summary_fields": _build_field_table(TelemetrySummary, subclasses=telemetry_subclasses),
+    }
+
+
+# Populated at MCP server startup via mcp_server.py lifespan.
+# Do not access before assert_schema_documented() has been called.
+SCHEMA_CONTEXT: dict[str, list[dict[str, Any]]] = {}
diff --git a/src/flowcept/agents/tool_result.py b/src/flowcept/agents/tool_result.py
new file mode 100644
index 00000000..b1f06c2c
--- /dev/null
+++ b/src/flowcept/agents/tool_result.py
@@ -0,0 +1,41 @@
+"""Shared ToolResult wrapper for MCP tools and webservice chat tools."""
+
+from typing import Union, Dict
+from pydantic import BaseModel
+
+
+class ToolResult(BaseModel):
+    """Standardized wrapper for tool outputs.
+
+    Conventions
+    -----------
+    - 2xx: success (string result)
+    - 3xx: success (dict result)
+    - 4xx: error (string message)
+    - 5xx: error (dict result)
+    """
+
+    code: int | None = None
+    result: Union[str, Dict] = None
+    extra: Dict | str | None = None
+    tool_name: str | None = None
+
+    def result_is_str(self) -> bool:
+        """Return True if the result is a string."""
+        return (200 <= self.code < 300) or (400 <= self.code < 500)
+
+    def is_success(self) -> bool:
+        """Return True if the result is a success."""
+        return self.is_success_string() or self.is_success_dict()
+
+    def is_success_string(self) -> bool:
+        """Return True if the result is a 2xx success string."""
+        return 200 <= self.code < 300
+
+    def is_error_string(self) -> bool:
+        """Return True if the result is a 4xx error string."""
+        return 400 <= self.code < 500
+
+    def is_success_dict(self) -> bool:
+        """Return True if the result is a 3xx success dict."""
+        return 300 <= self.code < 400
diff --git a/src/flowcept/agents/tools/__init__.py b/src/flowcept/agents/tools/__init__.py
deleted file mode 100644
index e8e337d3..00000000
--- a/src/flowcept/agents/tools/__init__.py
+++ /dev/null
@@ -1 +0,0 @@
-"""Agent Tools Package."""
diff --git a/src/flowcept/agents/tools/db_prov_tools.py b/src/flowcept/agents/tools/db_prov_tools.py
deleted file mode 100644
index e81f8bb9..00000000
--- a/src/flowcept/agents/tools/db_prov_tools.py
+++ /dev/null
@@ -1,47 +0,0 @@
-"""MCP adapters exposing the shared provenance tool core to external agent clients.
-
-Thin ``@mcp.tool`` wrappers around :mod:`flowcept.agents.tools.prov_tools`, giving MCP
-clients (Claude Code, Codex, etc.) real DB-backed provenance querying — the same tool
-core used by the webservice chat.
-"""
-
-from typing import Any, Dict, List, Optional
-
-from flowcept.agents.agents_utils import ToolResult
-from flowcept.agents.flowcept_ctx_manager import mcp_flowcept
-from flowcept.agents.tools import prov_tools
-
-
-@mcp_flowcept.tool()
-def query_provenance_tasks(
-    filter: Optional[Dict[str, Any]] = None,
-    projection: Optional[List[str]] = None,
-    limit: int = 100,
-    sort: Optional[List[Dict[str, Any]]] = None,
-) -> ToolResult:
-    """Query task provenance records in the database with a Mongo-style filter."""
-    return prov_tools.query_tasks(filter=filter, projection=projection, limit=limit, sort=sort)
-
-
-@mcp_flowcept.tool()
-def query_provenance_workflows(filter: Optional[Dict[str, Any]] = None, limit: int = 100) -> ToolResult:
-    """Query workflow provenance records in the database with a Mongo-style filter."""
-    return prov_tools.query_workflows(filter=filter, limit=limit)
-
-
-@mcp_flowcept.tool()
-def get_provenance_task_summary(filter: Optional[Dict[str, Any]] = None) -> ToolResult:
-    """Summarize tasks matching a filter: status counts, per-activity durations, time range."""
-    return prov_tools.get_task_summary(filter=filter)
-
-
-@mcp_flowcept.tool()
-def list_provenance_campaigns() -> ToolResult:
-    """List derived campaign summaries (campaigns group workflows and tasks)."""
-    return prov_tools.list_campaigns()
-
-
-@mcp_flowcept.tool()
-def list_provenance_agents() -> ToolResult:
-    """List derived agent summaries (agents observed in task provenance)."""
-    return prov_tools.list_agents()
diff --git a/src/flowcept/agents/tools/general_tools.py b/src/flowcept/agents/tools/general_tools.py
deleted file mode 100644
index f5c88797..00000000
--- a/src/flowcept/agents/tools/general_tools.py
+++ /dev/null
@@ -1,255 +0,0 @@
-import json
-from typing import List
-
-from flowcept import Flowcept
-from flowcept.agents.agents_utils import build_llm_model, ToolResult, normalize_message
-from flowcept.agents.flowcept_ctx_manager import mcp_flowcept
-from flowcept.agents.prompts.general_prompts import ROUTING_PROMPT, SMALL_TALK_PROMPT
-
-from flowcept.agents.tools.in_memory_queries.in_memory_queries_tools import run_df_query
-from flowcept.agents.tools.workflow_query_tools import run_workflow_query
-
-
-def _external_llm_enabled() -> bool:
-    """Return True when agent is configured to use an external LLM orchestrator."""
-    from flowcept.configs import AGENT
-
-    return bool(AGENT.get("external_llm", False))
-
-
-@mcp_flowcept.tool()
-def get_latest(n: int = None) -> str:
-    """
-    Return the most recent task(s) from the task buffer.
-
-    Parameters
-    ----------
-    n : int, optional
-        Number of most recent tasks to return. If None, return only the latest.
-
-    Returns
-    -------
-    str
-        JSON-encoded task(s).
-    """
-    ctx = mcp_flowcept.get_context()
-    tasks = ctx.request_context.lifespan_context.tasks
-    if not tasks:
-        return "No tasks available."
-    if n is None:
-        return json.dumps(tasks[-1])
-    return json.dumps(tasks[-n])
-
-
-@mcp_flowcept.tool()
-def check_liveness() -> str:
-    """
-    Confirm the agent is alive and responding.
-
-    Returns
-    -------
-    str
-        Liveness status string.
-    """
-    return f"I'm {mcp_flowcept.name} and I'm ready!"
-
-
-@mcp_flowcept.tool()
-def check_llm() -> str:
-    """
-    Check connectivity and response from the LLM backend.
-
-    Returns
-    -------
-    str
-        LLM response, formatted with MCP metadata.
-    """
-    llm = build_llm_model()
-    response = llm("Hello?")
-    return response
-
-
-@mcp_flowcept.tool()
-def record_guidance(message: str) -> ToolResult:
-    """
-    Record guidance tool.
-    """
-    ctx = mcp_flowcept.get_context()
-    message = message.replace("@record", "")
-    custom_guidance: List = ctx.request_context.lifespan_context.custom_guidance
-    custom_guidance.append(message)
-
-    return ToolResult(code=201, result=f"Ok. I recorded in my memory: {message}")
-
-
-@mcp_flowcept.tool()
-def show_records() -> ToolResult:
-    """
-    Lists all recorded user guidance.
-    """
-    try:
-        ctx = mcp_flowcept.get_context()
-        custom_guidance: List = ctx.request_context.lifespan_context.custom_guidance
-        if not custom_guidance:
-            message = "There is no recorded user guidance."
-        else:
-            message = "This is the list of custom guidance I have in my memory:\n"
-            message += "\n".join(f" - {msg}" for msg in custom_guidance)
-
-        return ToolResult(code=201, result=message)
-    except Exception as e:
-        return ToolResult(code=499, result=str(e))
-
-
-@mcp_flowcept.tool()
-def reset_records() -> ToolResult:
-    """
-    Resets all recorded user guidance.
-    """
-    try:
-        ctx = mcp_flowcept.get_context()
-        ctx.request_context.lifespan_context.custom_guidance = []
-        return ToolResult(code=201, result="Custom guidance reset.")
-    except Exception as e:
-        return ToolResult(code=499, result=str(e))
-
-
-@mcp_flowcept.tool()
-def reset_context() -> ToolResult:
-    """
-    Resets all context.
-    """
-    try:
-        ctx = mcp_flowcept.get_context()
-        ctx.request_context.lifespan_context.reset_context()
-        return ToolResult(code=201, result="Context reset.")
-    except Exception as e:
-        return ToolResult(code=499, result=str(e))
-
-
-@mcp_flowcept.tool()
-def generate_workflow_card(
-    workflow_id: str | None = None,
-    campaign_id: str | None = None,
-    input_jsonl_path: str | None = None,
-) -> ToolResult:
-    """
-    Generate and return a markdown workflow card as text.
-
-    Exactly one of ``workflow_id``, ``campaign_id``, or ``input_jsonl_path`` must be provided.
-
-    Parameters
-    ----------
-    workflow_id : str | None
-        Query by workflow identifier.
-    campaign_id : str | None
-        Query by campaign identifier (produces a campaign-level card).
-    input_jsonl_path : str | None
-        Path to a Flowcept JSONL buffer file used as input instead of the DB.
-
-    Returns
-    -------
-    ToolResult
-        ``code=301`` with markdown text in ``result["markdown"]`` on success,
-        or an error payload on failure.
-    """
-    try:
-        if not any([workflow_id, campaign_id, input_jsonl_path]):
-            return ToolResult(code=400, result="One of workflow_id, campaign_id, or input_jsonl_path is required.")
-
-        stats = Flowcept.generate_report(
-            report_type="workflow_card",
-            format="markdown",
-            workflow_id=workflow_id,
-            campaign_id=campaign_id,
-            input_jsonl_path=input_jsonl_path,
-        )
-        return ToolResult(
-            code=301,
-            result={
-                "workflow_id": workflow_id,
-                "campaign_id": campaign_id,
-                "markdown": stats["markdown"],
-            },
-        )
-    except Exception as e:
-        return ToolResult(code=499, result=str(e))
-
-
-@mcp_flowcept.tool()
-def prompt_handler(message: str) -> ToolResult:
-    """
-    Routes a user message using an LLM to classify its intent.
-
-    Parameters
-    ----------
-    message : str
-        User's natural language input.
-
-    Returns
-    -------
-    TextContent
-        The AI response or routing feedback.
-    """
-    workflow_query_prefix = "w:"
-    task_query_prefix = "t:"
-    object_query_prefix = "o:"
-    normalized_message = message.strip().lower()
-    if message.strip().lower().startswith(workflow_query_prefix):
-        query = message.split(":", 1)[1].strip()
-        return run_workflow_query(query=query)
-    if normalized_message.startswith(task_query_prefix):
-        query = message.split(":", 1)[1].strip()
-        return run_df_query(query=query, llm=None, plot=False, context_kind="tasks")
-    if normalized_message.startswith(object_query_prefix):
-        query = message.split(":", 1)[1].strip()
-        return run_df_query(query=query, llm=None, plot=False, context_kind="objects")
-
-    df_key_words = ["df", "save", "result = df"]
-    for key in df_key_words:
-        if key in message:
-            return run_df_query(query=message, llm=None, plot=False)
-
-    if "reset context" in message:
-        return reset_context()
-    if "@record" in message:
-        return record_guidance(message)
-    if "@show records" in message:
-        return show_records()
-    if "@reset records" in message:
-        return reset_records()
-
-    if _external_llm_enabled():
-        return ToolResult(
-            code=201,
-            result=(
-                "external_llm mode is enabled. Internal LLM routing is disabled. "
-                "Use explicit commands such as 'save', 'result = df ...', "
-                "'t: <task question>', 'o: <object question>', 'w: <workflow question>', "
-                "'reset context', '@record', '@show records', or '@reset records'."
-            ),
-        )
-
-    llm = build_llm_model()
-
-    message = normalize_message(message)
-
-    prompt = ROUTING_PROMPT + message
-    route = llm.invoke(prompt)
-
-    if route == "small_talk":
-        prompt = SMALL_TALK_PROMPT + message
-        response = llm.invoke(prompt)
-        return ToolResult(code=201, result=response)
-    elif route == "in_context_query":
-        return run_df_query(message, llm=llm, plot=False)
-    elif route == "plot":
-        return run_df_query(message, llm=llm, plot=True)
-    elif route == "historical_prov_query":
-        return ToolResult(code=201, result="We need to query the Provenance Database. Feature coming soon.")
-    elif route == "in_chat_query":
-        prompt = SMALL_TALK_PROMPT + message
-        response = llm.invoke(prompt)
-        return ToolResult(code=201, result=response)
-    else:
-        return ToolResult(code=404, result="I don't know how to route.")
diff --git a/src/flowcept/agents/tools/in_memory_queries/__init__.py b/src/flowcept/agents/tools/in_memory_queries/__init__.py
deleted file mode 100644
index abcd73d7..00000000
--- a/src/flowcept/agents/tools/in_memory_queries/__init__.py
+++ /dev/null
@@ -1 +0,0 @@
-"""In-memory Agent Queries Package."""
diff --git a/src/flowcept/agents/tools/in_memory_queries/in_memory_queries_tools.py b/src/flowcept/agents/tools/in_memory_queries/in_memory_queries_tools.py
deleted file mode 100644
index 27242f6b..00000000
--- a/src/flowcept/agents/tools/in_memory_queries/in_memory_queries_tools.py
+++ /dev/null
@@ -1,766 +0,0 @@
-import json
-from flowcept.agents.agents_utils import ToolResult, build_llm_model
-from flowcept.agents.flowcept_ctx_manager import EMPTY_DF_MESSAGE, get_df_context, mcp_flowcept, ctx_manager
-from flowcept.agents.prompts.in_memory_query_prompts import (
-    generate_plot_code_prompt,
-    extract_or_fix_json_code_prompt,
-    generate_pandas_code_prompt,
-    dataframe_summarizer_context,
-    extract_or_fix_python_code_prompt,
-)
-
-from flowcept.agents.tools.in_memory_queries.pandas_agent_utils import (
-    load_saved_df,
-    safe_execute,
-    safe_json_parse,
-    normalize_output,
-    format_result_df,
-    summarize_df,
-)
-
-
-@mcp_flowcept.tool()
-def execute_generated_df_code(user_code: str, context_kind: str = "tasks") -> ToolResult:
-    """
-    Execute externally generated pandas code against the current agent DataFrame.
-
-    Parameters
-    ----------
-    user_code : str
-        Explicit pandas code expected to assign output to ``result``.
-
-    Returns
-    -------
-    ToolResult
-        Delegates to ``run_df_code`` and returns its execution result.
-    """
-    df, _, _, _ = get_df_context(context_kind=context_kind)
-    if df is None or not len(df):
-        return ToolResult(code=404, result=EMPTY_DF_MESSAGE)
-    return run_df_code(user_code=user_code, df=df)
-
-
-@mcp_flowcept.tool()
-def run_df_query(query: str, llm=None, plot=False, context_kind: str = "tasks") -> ToolResult:
-    r"""
-    Run a natural language query against the current context DataFrame.
-
-    This tool retrieves the active DataFrame, schema, and example values
-    from the MCP Flowcept context and uses an LLM to process the query.
-    Depending on the query and flags, it may reset the context, save the
-    current DataFrame, execute raw code, generate a result DataFrame, or
-    produce plotting code.
-
-    Parameters
-    ----------
-    llm : callable
-        A language model function or wrapper that accepts a prompt string
-        and returns a response.
-    query : str
-        Natural language query or Python code snippet to run against the
-        current DataFrame context.
-    plot : bool, default=False
-        If True, generate plotting code along with a result DataFrame.
-        If False, only generate and return the result DataFrame.
-
-    Returns
-    -------
-    ToolResult
-        - ``code=201`` : Context reset or DataFrame/schema saved.
-        - ``code=301`` : Successful result DataFrame (and optional plot code).
-        - ``code=404`` : No active DataFrame in context.
-        - Other codes indicate execution or formatting errors from underlying tools.
-
-    Notes
-    -----
-    - Querying with "reset context" clears the active DataFrame and resets
-      the context.
-    - Querying with "save" persists the DataFrame, schema, and example
-      values to disk via ``save_df``.
-    - Queries containing "result = df" are executed directly as code.
-    - With ``plot=True``, the tool delegates to ``generate_plot_code``;
-      otherwise, it calls ``generate_result_df``.
-
-    Examples
-    --------
-    Save the current DataFrame:
-
-    >>> run_df_query("save")
-    ToolResult(code=201, result="Saved df and schema to /tmp directory")
-
-    Generate a result DataFrame:
-
-    >>> run_df_query("Show average sales by region")
-    ToolResult(code=301, result={'result_df': 'region,avg_sales\\nNorth,100\\nSouth,95'})
-
-    Generate a plot along with the DataFrame:
-
-    >>> run_df_query("Show sales trend as a line chart", plot=True)
-    ToolResult(code=301, result={'result_df': '...', 'plot_code': 'plt.plot(...)'})
-    """
-    df, schema, value_examples, custom_user_guidance = get_df_context(context_kind=context_kind)
-    if df is None or not len(df):
-        return ToolResult(code=404, result=EMPTY_DF_MESSAGE)
-    elif "save" in query:
-        return save_df(df, schema, value_examples)
-    elif "result = df" in query:
-        return run_df_code(user_code=query, df=df)
-
-    if plot:
-        return generate_plot_code(
-            llm,
-            query,
-            schema,
-            value_examples,
-            df,
-            custom_user_guidance=custom_user_guidance,
-            context_kind=context_kind,
-        )
-    else:
-        return generate_result_df(
-            llm,
-            query,
-            schema,
-            value_examples,
-            df,
-            custom_user_guidance=custom_user_guidance,
-            context_kind=context_kind,
-        )
-
-
-@mcp_flowcept.tool()
-def generate_plot_code(
-    llm, query, dynamic_schema, value_examples, df, custom_user_guidance=None, context_kind="tasks"
-) -> ToolResult:
-    """
-    Generate DataFrame and plotting code from a natural language query using an LLM.
-
-    This tool builds a prompt with the query, dynamic schema, and example values,
-    and asks the LLM to return JSON with two fields: ``result_code`` (Python code
-    to transform the DataFrame) and ``plot_code`` (Python code to generate a plot).
-    The resulting code is validated, executed, and the DataFrame result is
-    formatted as CSV. If the LLM output is invalid JSON, the tool attempts to
-    repair or extract valid JSON before failing.
-
-    Parameters
-    ----------
-    llm : callable
-        A language model function or wrapper that accepts a prompt string
-        and returns a response.
-    query : str
-        Natural language query describing the desired data transformation
-        and plot.
-    dynamic_schema : dict
-        Schema definition describing the structure of the DataFrame.
-    value_examples : dict
-        Example values associated with the schema to guide the LLM.
-    df : pandas.DataFrame
-        The DataFrame to query and transform.
-
-    Returns
-    -------
-    ToolResult
-        - On success (code=301): contains a dictionary with:
-            - ``result_df`` : str, CSV-formatted DataFrame result.
-            - ``plot_code`` : str, Python code to generate the plot.
-            - ``result_code`` : str, Python code used to transform the DataFrame.
-        - On failure (codes 400, 404–406, 499): contains an error message and
-          optionally the original prompt for debugging.
-
-    Raises
-    ------
-    Exception
-        Any unhandled error during LLM invocation, JSON parsing, code execution,
-        or DataFrame formatting will be caught and converted into a ``ToolResult``
-        with the appropriate error code.
-
-    Notes
-    -----
-    - Invalid JSON responses from the LLM are automatically retried using
-      an extraction/fix helper.
-    - Both transformation and plotting code must be present in the LLM output,
-      otherwise the tool fails with an error.
-    - Columns that contain only NaN values are dropped from the result.
-
-    Examples
-    --------
-    Generate a bar chart from a sales DataFrame:
-
-    >>> result = generate_plot_code(
-    ...     llm,
-    ...     query="Show total sales by region as a bar chart",
-    ...     dynamic_schema=schema,
-    ...     value_examples=examples,
-    ...     df=sales_df
-    ... )
-    >>> print(result.code)
-    301
-    >>> print(result.result["plot_code"])
-    plt.bar(result_df["region"], result_df["total_sales"])
-    """
-    plot_prompt = generate_plot_code_prompt(
-        query, dynamic_schema, value_examples, list(df.columns), context_kind=context_kind
-    )
-    try:
-        response = llm(plot_prompt)
-    except Exception as e:
-        return ToolResult(code=400, result=str(e), extra=plot_prompt)
-
-    result_code, plot_code = None, None
-    try:
-        result = safe_json_parse(response)
-        result_code = result["result_code"]
-        plot_code = result["plot_code"]
-
-    except ValueError:
-        tool_response = extract_or_fix_json_code(llm, response)
-        response = tool_response.result
-        if tool_response.code == 201:
-            try:
-                result = safe_json_parse(response)
-                assert "result_code" in result
-                assert "plot_code" in result
-                ToolResult(code=301, result=result, extra=plot_prompt)
-            except ValueError as e:
-                return ToolResult(
-                    code=405, result=f"Tried to parse this as JSON: {response}, but got Error: {e}", extra=plot_prompt
-                )
-            except AssertionError as e:
-                return ToolResult(code=405, result=str(e), extra=plot_prompt)
-
-        else:
-            return ToolResult(code=499, result=tool_response.result)
-    except AssertionError as e:
-        return ToolResult(code=405, result=str(e), extra=plot_prompt)
-    except Exception as e:
-        return ToolResult(code=499, result=str(e), extra=plot_prompt)
-
-    try:
-        result_df = safe_execute(df, result_code)
-    except Exception as e:
-        return ToolResult(code=406, result=str(e))
-    try:
-        result_df = format_result_df(result_df)
-    except Exception as e:
-        return ToolResult(code=404, result=str(e))
-
-    this_result = {"result_df": result_df, "plot_code": plot_code, "result_code": result_code}
-    return ToolResult(code=301, result=this_result, tool_name=generate_plot_code.__name__)
-
-
-@mcp_flowcept.tool()
-def generate_result_df(
-    llm,
-    query: str,
-    dynamic_schema,
-    example_values,
-    df,
-    custom_user_guidance=None,
-    attempt_fix=True,
-    summarize=True,
-    context_kind="tasks",
-):
-    """
-    Generate a result DataFrame from a natural language query using an LLM.
-
-    This tool constructs a prompt with the query, dynamic schema, and example values,
-    then asks the LLM to generate executable pandas code. The generated code is
-    executed against the provided DataFrame. If execution fails and ``attempt_fix``
-    is enabled, the tool will try to repair or extract valid Python code using
-    another LLM call. The resulting DataFrame is normalized, formatted, and can be
-    optionally summarized.
-
-    Parameters
-    ----------
-    llm : callable
-        A language model function or wrapper that accepts a prompt string and
-        returns a response (e.g., generated code or summary).
-    query : str
-        Natural language query to be executed against the DataFrame.
-    dynamic_schema : dict
-        Schema definition describing the structure of the DataFrame.
-    example_values : dict
-        Example values associated with the schema to guide the LLM.
-    df : pandas.DataFrame
-        The DataFrame to run the query against.
-    attempt_fix : bool, default=True
-        If True, attempt to fix invalid generated code by calling a repair LLM.
-    summarize : bool, default=True
-        If True, attempt to generate a natural language summary of the result.
-
-    Returns
-    -------
-    ToolResult
-        - On success (codes 301–303): contains a dictionary with:
-            - ``result_code`` : str, the generated Python code.
-            - ``result_df`` : str, CSV-formatted result DataFrame.
-            - ``summary`` : str, summary text if generated successfully.
-            - ``summary_error`` : str or None, error message if summarization failed.
-        - On failure (codes 400, 405, 504): contains an error message and
-          relevant debugging context.
-
-    Raises
-    ------
-    Exception
-        Any unhandled error during code execution, normalization, or summarization
-        will be caught and converted into a ``ToolResult`` with the appropriate code.
-
-    Notes
-    -----
-    - Columns with only NaN values are dropped from the result.
-    - Summarization errors are non-blocking; the result DataFrame is still returned.
-    - The original LLM prompt and any generated code are included in the ``extra``
-      field of the ToolResult for debugging.
-
-    Examples
-    --------
-    Query with valid LLM-generated code:
-
-    >>> result = generate_result_df(
-    ...     llm,
-    ...     query="Show average sales by region",
-    ...     dynamic_schema=schema,
-    ...     example_values=examples,
-    ...     df=sales_df
-    ... )
-    >>> print(result.code)
-    301
-    >>> print(result.result["result_df"])
-
-    Handle invalid code with auto-fix disabled:
-
-    >>> generate_result_df(llm, "bad query", schema, examples, df, attempt_fix=False)
-    ToolResult(code=405, result="Failed to parse this as Python code: ...")
-    """
-    if llm is None:
-        llm = build_llm_model()
-    try:
-        prompt = generate_pandas_code_prompt(
-            query,
-            dynamic_schema,
-            example_values,
-            custom_user_guidance,
-            list(df.columns),
-            context_kind=context_kind,
-        )
-        response = llm(prompt)
-    except Exception as e:
-        return ToolResult(code=400, result=str(e), extra=prompt)
-
-    try:
-        result_code = response
-        result_df = safe_execute(df, result_code)
-    except Exception as e:
-        if not attempt_fix:
-            return ToolResult(
-                code=405,
-                result=f"Failed to parse this as Python code: \n\n ```python\n {result_code} \n```\n "
-                f"but got error:\n\n {e}.",
-                extra={"generated_code": result_code, "exception": str(e), "prompt": prompt},
-            )
-        else:
-            tool_result = extract_or_fix_python_code(llm, result_code, list(df.columns))
-            if tool_result.code == 201:
-                new_result_code = tool_result.result
-                result_code = new_result_code
-                try:
-                    result_df = safe_execute(df, new_result_code)
-                except Exception as e:
-                    return ToolResult(
-                        code=405,
-                        result=f"Failed to parse this as Python code: \n\n"
-                        f"```python\n {result_code} \n```\n "
-                        f"Then tried to LLM extract the Python code, got: \n\n "
-                        f"```python\n{new_result_code}```\n "
-                        f"but got error:\n\n {e}.",
-                    )
-
-            else:
-                return ToolResult(
-                    code=405,
-                    result=f"Failed to parse this as Python code: {result_code}."
-                    f"Exception: {e}\n"
-                    f"Then tried to LLM extract the Python code, but got error:"
-                    f" {tool_result.result}",
-                )
-
-    try:
-        result_df = normalize_output(result_df)
-    except Exception as e:
-        return ToolResult(
-            code=504,
-            result="Failed to normalize output of the resulting dataframe.",
-            extra={"generated_code": result_code, "exception": str(e), "prompt": prompt},
-        )
-
-    result_df = result_df.dropna(axis=1, how="all")
-
-    return_code = 301
-    summary, summary_error = None, None
-    if summarize:
-        try:
-            tool_result = summarize_result(
-                llm,
-                result_code,
-                result_df,
-                query,
-                dynamic_schema,
-                example_values,
-                list(df.columns),
-                context_kind=context_kind,
-            )
-            if tool_result.is_success():
-                return_code = 301
-                summary = tool_result.result
-            else:
-                return_code = 302
-                summary_error = tool_result.result
-        except Exception as e:
-            ctx_manager.logger.exception(e)
-            summary = ""
-            summary_error = str(e)
-            return_code = 303
-
-    try:
-        result_df_str = format_result_df(result_df)
-    except Exception as e:
-        return ToolResult(
-            code=405,
-            result="Failed to format output of the resulting dataframe.",
-            extra={"generated_code": result_code, "exception": str(e), "prompt": prompt},
-        )
-
-    this_result = {
-        "result_code": result_code,
-        "result_df": result_df_str,
-        "result_df_markdown": result_df.to_markdown(index=False),
-        "summary": summary,
-        "summary_error": summary_error,
-    }
-    return ToolResult(
-        code=return_code, result=this_result, tool_name=generate_result_df.__name__, extra={"prompt": prompt}
-    )
-
-
-@mcp_flowcept.tool()
-def run_df_code(user_code: str, df):
-    """
-    Execute user-provided Python code on a DataFrame and format the result.
-
-    This tool safely executes Python code against a given DataFrame,
-    normalizes and formats the result, and returns it as part of a
-    ``ToolResult``. It is designed to let users run custom code snippets
-    for data analysis while capturing errors gracefully.
-
-    Parameters
-    ----------
-    user_code : str
-        A string of Python code intended to operate on the provided DataFrame.
-        The code must be valid and compatible with the execution environment.
-    df : pandas.DataFrame
-        The input DataFrame on which the code will be executed.
-
-    Returns
-    -------
-    ToolResult
-        - On success (code=301): a dictionary with keys:
-          - ``result_code`` : str, the original code snippet.
-          - ``result_df`` : str, the CSV-formatted result DataFrame.
-        - On failure (code=405): the error message indicating why execution failed.
-
-    Raises
-    ------
-    Exception
-        Errors during execution or normalization are caught and
-        converted into a ``ToolResult`` with code 405.
-
-    Notes
-    -----
-    - Columns that contain only ``NaN`` values are dropped from the result.
-    - If the result DataFrame is empty or not valid, an error is returned.
-    - The output DataFrame is always formatted as CSV text.
-
-    Examples
-    --------
-    Run a simple aggregation:
-
-    >>> import pandas as pd
-    >>> df = pd.DataFrame({"a": [1, 2, 3], "b": [10, 20, 30]})
-    >>> res = run_df_code("df[['a']].sum()", df)
-    >>> print(res.code)
-    301
-    >>> print(res.result["result_df"])
-    a
-    6
-
-    Handle an invalid code snippet:
-
-    >>> run_df_code("df.non_existing()", df)
-    ToolResult(code=405, result="Failed to run this as Python code: df.non_existing(). Got error ...")
-    """
-    try:
-        result_df = safe_execute(df, user_code)
-    except Exception as e:
-        return ToolResult(code=405, result=f"Failed to run this as Python code: {user_code}. Got error {e}")
-
-    try:
-        result_df = normalize_output(result_df)
-    except Exception as e:
-        return ToolResult(code=405, result=str(e))
-
-    result_df = result_df.dropna(axis=1, how="all")
-    result_df = format_result_df(result_df)
-
-    this_result = {
-        "result_code": user_code,
-        "result_df": result_df,
-    }
-    return ToolResult(code=301, result=this_result, tool_name=run_df_code.__name__)
-
-
-@mcp_flowcept.tool()
-def extract_or_fix_python_code(llm, raw_text, current_fields):
-    """
-    Extract or repair JSON code from raw text using an LLM.
-
-    This tool constructs a prompt with the given raw text and passes it
-    to the provided language model (LLM). The LLM is expected to either
-    extract valid JSON content or repair malformed JSON from the text.
-    The result is wrapped in a ``ToolResult`` object.
-
-    Parameters
-    ----------
-    llm : callable
-     A language model function or object that can be invoked with a
-     prompt string and returns a response (e.g., an LLM wrapper).
-    raw_text : str
-     The raw text containing JSON code or fragments that may need to
-     be extracted or fixed.
-
-    Returns
-    -------
-    ToolResult
-     A result object containing:
-     - ``code=201`` if the extraction/fix succeeded, with the LLM
-       output in ``result``.
-     - ``code=499`` if an exception occurred, with the error message
-       in ``result``.
-
-    Raises
-    ------
-    Exception
-     Any unhandled exception from the LLM call will be caught and
-     returned as part of the ``ToolResult``.
-
-    Examples
-    --------
-    >>> # Example with a mock LLM that just echoes back
-    >>> def mock_llm(prompt):
-    ...     return '{"a": 1, "b": 2}'
-    >>> res = extract_or_fix_json_code(mock_llm, "Here is some JSON: {a:1, b:2}")
-    >>> print(res)
-    ToolResult(code=201, result='{"a": 1, "b": 2}')
-
-    Example with an invalid call:
-
-    >>> def broken_llm(prompt):
-    ...     raise RuntimeError("LLM service unavailable")
-    >>> res = extract_or_fix_json_code(broken_llm, "{a:1}")
-    >>> print(res)
-    ToolResult(code=499, result='LLM service unavailable')
-    """
-    prompt = extract_or_fix_python_code_prompt(raw_text, current_fields)
-    try:
-        response = llm(prompt)
-        return ToolResult(code=201, result=response)
-    except Exception as e:
-        return ToolResult(code=499, result=str(e))
-
-
-@mcp_flowcept.tool()
-def extract_or_fix_json_code(llm, raw_text) -> ToolResult:
-    """
-    Extract or repair JSON code from raw text using a language model.
-
-    This function builds a prompt around the provided raw text and sends
-    it to the given language model (LLM). The LLM is expected to extract
-    valid JSON or attempt to fix malformed JSON structures. The outcome
-    is returned in a ``ToolResult`` object, with a success or error code.
-
-    Parameters
-    ----------
-    llm : Callable[[str], str]
-        A callable LLM function or wrapper that accepts a prompt string
-        and returns a string response.
-    raw_text : str
-        Input text that contains JSON code or fragments that may be
-        incomplete or malformed.
-
-    Returns
-    -------
-    ToolResult
-        A result object with:
-        - ``code=201`` and the LLM response in ``result`` if successful.
-        - ``code=499`` and the error message in ``result`` if an error occurs.
-
-    Examples
-    --------
-    Successful extraction/fix:
-
-    >>> def mock_llm(prompt: str) -> str:
-    ...     return '{"foo": "bar"}'
-    >>> extract_or_fix_json_code(mock_llm, "Broken JSON: {foo: bar}")
-    ToolResult(code=201, result='{"foo": "bar"}')
-
-    Error handling:
-
-    >>> def broken_llm(prompt: str) -> str:
-    ...     raise RuntimeError("LLM not available")
-    >>> extract_or_fix_json_code(broken_llm, "{foo: bar}")
-    ToolResult(code=499, result='LLM not available')
-    """
-    prompt = extract_or_fix_json_code_prompt(raw_text)
-    try:
-        response = llm(prompt)
-        return ToolResult(code=201, result=response)
-    except Exception as e:
-        return ToolResult(code=499, result=str(e))
-
-
-@mcp_flowcept.tool()
-def summarize_result(
-    llm, code, result, query: str, dynamic_schema, example_values, current_fields, context_kind="tasks"
-) -> ToolResult:
-    """
-    Summarize the pandas result with local reduction for large DataFrames.
-    - For wide DataFrames, selects top columns based on variance and uniqueness.
-    - For long DataFrames, truncates to preview rows.
-    - Constructs a detailed prompt for the LLM with original column context.
-    """
-    summarized_df = summarize_df(result, code)
-    prompt = dataframe_summarizer_context(
-        code, summarized_df, dynamic_schema, example_values, query, current_fields, context_kind=context_kind
-    )
-    try:
-        response = llm(prompt)
-        return ToolResult(code=201, result=response)
-    except Exception as e:
-        return ToolResult(code=400, result=str(e))
-
-
-@mcp_flowcept.tool()
-def save_df(df, schema, value_examples):
-    """
-    Save a DataFrame, its schema, and example values to temporary files.
-
-    This function writes the provided DataFrame, schema, and value
-    examples to the ``/tmp`` directory. The schema and value examples
-    are saved as JSON files, while the DataFrame is saved as a CSV
-    file. This can be useful for persisting the current state of an
-    agent's task data for later querying or debugging.
-
-    Parameters
-    ----------
-    df : pandas.DataFrame
-        The DataFrame to save.
-    schema : dict
-        A dictionary describing the schema of the DataFrame.
-    value_examples : dict
-        Example values associated with the DataFrame schema.
-
-    Returns
-    -------
-    ToolResult
-        An object with a status code and result message confirming
-        successful persistence of the data.
-
-    Notes
-    -----
-    Files are written to fixed locations in ``/tmp``:
-
-    - ``/tmp/current_tasks_schema.json`` — schema
-    - ``/tmp/value_examples.json`` — example values
-    - ``/tmp/current_agent_df.csv`` — DataFrame contents
-
-    Examples
-    --------
-    >>> import pandas as pd
-    >>> df = pd.DataFrame({"name": ["Alice", "Bob"], "score": [85, 92]})
-    >>> schema = {"fields": [{"name": "name", "type": "string"},
-    ...                      {"name": "score", "type": "integer"}]}
-    >>> examples = {"name": ["Alice"], "score": [85]}
-    >>> result = save_df(df, schema, examples)
-    >>> print(result)
-    ToolResult(code=201, result='Saved df and schema to /tmp directory')
-    """
-    with open("/tmp/current_tasks_schema.json", "w") as f:
-        json.dump(schema, f, indent=2)
-    with open("/tmp/value_examples.json", "w") as f:
-        json.dump(value_examples, f, indent=2)
-    df.to_csv("/tmp/current_agent_df.csv", index=False)
-    return ToolResult(code=201, result="Saved df and schema to /tmp directory")
-
-
-@mcp_flowcept.tool()
-def query_on_saved_df(query: str, dynamic_schema_path, value_examples_path, df_path):
-    """
-    Run a natural language query against a saved DataFrame with schema and value examples.
-
-    This function loads a previously saved DataFrame, dynamic schema,
-    and value examples from disk, then uses a language model (LLM) to
-    interpret the query and generate a new result DataFrame. The query
-    is executed through the LLM using the provided schema and examples
-    for better accuracy.
-
-    Parameters
-    ----------
-    query : str
-        Natural language query to execute against the DataFrame.
-    dynamic_schema_path : str
-        Path to a JSON file containing the schema definition used by the LLM.
-    value_examples_path : str
-        Path to a JSON file with example values to guide the LLM query.
-    df_path : str
-        Path to the saved DataFrame file.
-
-    Returns
-    -------
-    pandas.DataFrame
-        The DataFrame result generated by the LLM query.
-
-    Raises
-    ------
-    FileNotFoundError
-        If any of the provided paths (schema, examples, DataFrame) do not exist.
-    json.JSONDecodeError
-        If schema or examples JSON files cannot be parsed.
-    Exception
-        Propagates exceptions from the LLM query or DataFrame loading.
-
-    Examples
-    --------
-    Query a saved DataFrame of sales data:
-
-    >>> query = "Show me the total sales by region"
-    >>> result = query_on_saved_df(
-    ...     query,
-    ...     dynamic_schema_path="schemas/sales_schema.json",
-    ...     value_examples_path="schemas/sales_examples.json",
-    ...     df_path="data/sales.parquet"
-    ... )
-    >>> print(result.head())
-       region   total_sales
-    0   North         12345
-    1   South          9876
-    2    West          5432
-    """
-    df = load_saved_df(df_path)
-
-    with open(dynamic_schema_path) as f:
-        dynamic_schema = json.load(f)
-
-    with open(value_examples_path) as f:
-        value_examples = json.load(f)
-
-    llm = build_llm_model()
-    return generate_result_df(llm, query, dynamic_schema, value_examples, df, attempt_fix=False, summarize=False)
diff --git a/src/flowcept/agents/tools/workflow_query_tools.py b/src/flowcept/agents/tools/workflow_query_tools.py
deleted file mode 100644
index 584661a2..00000000
--- a/src/flowcept/agents/tools/workflow_query_tools.py
+++ /dev/null
@@ -1,117 +0,0 @@
-"""MCP tools for querying the active workflow message object."""
-
-from __future__ import annotations
-
-import json
-from typing import Any
-
-from flowcept.agents.agents_utils import ToolResult, build_llm_model
-from flowcept.agents.flowcept_ctx_manager import mcp_flowcept
-from flowcept.agents.prompts.workflow_query_prompts import (
-    EMPTY_WORKFLOW_MESSAGE,
-    generate_workflow_query_prompt,
-)
-
-MISSING_INFO = "info not available"
-
-
-def _resolve_path(value: Any, path: str) -> Any:
-    current = value
-    for part in path.split("."):
-        if isinstance(current, dict):
-            if part not in current:
-                raise KeyError(path)
-            current = current[part]
-        elif isinstance(current, list):
-            try:
-                current = current[int(part)]
-            except (ValueError, IndexError):
-                raise KeyError(path)
-        else:
-            raise KeyError(path)
-    return current
-
-
-def _parse_query_spec(query_spec: dict | str) -> dict:
-    if isinstance(query_spec, dict):
-        return query_spec
-    return json.loads(query_spec)
-
-
-def _format_answer(values: dict, missing: list[str], answer_style: str) -> str:
-    if not values and missing:
-        return MISSING_INFO
-    if answer_style == "summary":
-        return json.dumps({"values": values, "missing": missing}, indent=2, default=str)
-    if len(values) == 1 and not missing:
-        return str(next(iter(values.values())))
-    return json.dumps({"values": values, "missing": missing}, indent=2, default=str)
-
-
-@mcp_flowcept.tool()
-def execute_generated_workflow_query(query_spec: dict | str) -> ToolResult:
-    """
-    Execute an externally generated workflow query spec against workflow_msg_obj.
-
-    The spec is JSON with ``field_paths`` and optional ``missing`` /
-    ``answer_style`` fields. Missing values always return ``info not available``.
-    """
-    ctx = mcp_flowcept.get_context()
-    workflow_msg_obj = ctx.request_context.lifespan_context.workflow_msg_obj
-    if not workflow_msg_obj:
-        return ToolResult(code=404, result=EMPTY_WORKFLOW_MESSAGE)
-
-    try:
-        spec = _parse_query_spec(query_spec)
-    except Exception as e:
-        return ToolResult(code=405, result=f"Invalid workflow query spec: {e}")
-
-    field_paths = spec.get("field_paths") or []
-    missing = list(spec.get("missing") or [])
-    answer_style = spec.get("answer_style", "short")
-    values = {}
-
-    for path in field_paths:
-        try:
-            values[path] = _resolve_path(workflow_msg_obj, path)
-        except KeyError:
-            values[path] = MISSING_INFO
-
-    result = {
-        "answer": _format_answer(values, missing, answer_style),
-        "values": values,
-        "missing": missing,
-        "query_spec": spec,
-    }
-    return ToolResult(code=301, result=result, tool_name=execute_generated_workflow_query.__name__)
-
-
-@mcp_flowcept.tool()
-def run_workflow_query(query: str, llm=None) -> ToolResult:
-    """
-    Run a free-text query against the active workflow message object.
-
-    This mirrors the DataFrame query flow but asks the LLM to select workflow
-    message field paths instead of generating pandas code.
-    """
-    ctx = mcp_flowcept.get_context()
-    workflow_msg_obj = ctx.request_context.lifespan_context.workflow_msg_obj
-    if not workflow_msg_obj:
-        return ToolResult(code=404, result=EMPTY_WORKFLOW_MESSAGE)
-
-    if llm is None:
-        llm = build_llm_model()
-
-    prompt = generate_workflow_query_prompt(
-        query,
-        workflow_msg_obj,
-        ctx.request_context.lifespan_context.custom_guidance,
-    )
-    try:
-        query_spec = llm(prompt)
-    except Exception as e:
-        return ToolResult(code=400, result=str(e), extra=prompt)
-
-    result = execute_generated_workflow_query(query_spec)
-    result.extra = {"prompt": prompt}
-    return result
diff --git a/src/flowcept/cli.py b/src/flowcept/cli.py
index 0a1b526b..f659caa0 100644
--- a/src/flowcept/cli.py
+++ b/src/flowcept/cli.py
@@ -563,7 +563,7 @@ def get_task(task_id: str):
 
 def start_agent():  # TODO: start with gui
     """Start Flowcept agent."""
-    from flowcept.agents.flowcept_agent import main
+    from flowcept.agents.mcp.mcp_server import main
 
     main()
 
@@ -605,7 +605,7 @@ def agent_client(tool_name: str, kwargs: str = None):
             print(f"Could not parse kwargs as a valid JSON: {kwargs}")
             print(e)
     print("-----------------")
-    from flowcept.agents.agent_client import run_tool
+    from flowcept.agents.mcp.mcp_client import run_tool
 
     result = run_tool(tool_name, kwargs)[0]
 
@@ -660,7 +660,7 @@ def test_function(n: int) -> Dict[str, int]:
 
     if AGENT.get("enabled", False):
         print("Agent is enabled, so we are testing it too.")
-        from flowcept.agents.agent_client import run_tool
+        from flowcept.agents.mcp.mcp_client import run_tool
 
         try:
             print(run_tool("check_liveness"))
diff --git a/src/flowcept/commons/daos/docdb_dao/docdb_dao_base.py b/src/flowcept/commons/daos/docdb_dao/docdb_dao_base.py
index 71b66704..2d03b848 100644
--- a/src/flowcept/commons/daos/docdb_dao/docdb_dao_base.py
+++ b/src/flowcept/commons/daos/docdb_dao/docdb_dao_base.py
@@ -120,6 +120,11 @@ def insert_or_update_workflow(self, wf_obj: WorkflowObject):
         """
         raise NotImplementedError
 
+    @abstractmethod
+    def save_workflow_domain_data_schema(self, workflow_id: str, fields: Dict):
+        """Update selected workflow fields without replacing the full document."""
+        raise NotImplementedError
+
     @abstractmethod
     def insert_or_update_agent(self, agent_obj: AgentObject):
         """Insert or update an agent object.
@@ -136,6 +141,11 @@ def insert_or_update_agent(self, agent_obj: AgentObject):
         """
         raise NotImplementedError
 
+    @abstractmethod
+    def liveness_test(self) -> bool:
+        """Return True if the backing store is reachable and accepting queries."""
+        raise NotImplementedError
+
     @abstractmethod
     def delete_agents_with_filter(self, filter) -> bool:
         """Delete agent documents that match the filter."""
@@ -392,39 +402,26 @@ def dump_tasks_to_file_recursive(self, workflow_id, output_file="tasks.parquet",
     @abstractmethod
     def save_or_update_object(
         self,
+        blob_obj,
         object,
-        object_id,
-        task_id,
-        workflow_id,
-        object_type,
-        custom_metadata,
-        save_data_in_collection,
-        pickle_,
+        save_data_in_collection=False,
+        pickle_=False,
         control_version=False,
-        tags=None,
     ):
-        """Save an object with associated metadata.
+        """Save an object with its BlobObject metadata.
 
         Parameters
         ----------
+        blob_obj : BlobObject
+            Metadata for the object. ``object_id`` is generated when ``None``.
         object : Any
-            The object to save.
-        object_id : str
-            Unique identifier for the object.
-        task_id : str
-            Task ID associated with the object.
-        workflow_id : str
-            Workflow ID associated with the object.
-        object_type : str
-            Type of the object.
-        custom_metadata : dict
-            Custom metadata to associate with the object.
-        save_data_in_collection : bool
-            Whether to save the object in a database collection.
-        pickle_ : bool
-            Whether to serialize the object using pickle.
-        tags : list of str, optional
-            Labels to associate with the object.
+            The binary payload to persist.
+        save_data_in_collection : bool, optional
+            Whether to store bytes in-document rather than GridFS.
+        pickle_ : bool, optional
+            Whether to serialize the payload with pickle before storing.
+        control_version : bool, optional
+            If ``True``, enable append-only history semantics.
 
         Raises
         ------
@@ -481,3 +478,43 @@ def get_file_data(self, file_id):
             This method must be implemented by subclasses.
         """
         raise NotImplementedError
+
+    @abstractmethod
+    def task_summary(self, filter: Dict) -> Dict:
+        """Return status counts, per-activity stats, and time range for tasks matching filter."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def derive_campaigns(self) -> List[Dict]:
+        """Derive campaign summaries by grouping workflows and tasks by campaign_id."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def derive_agents(self, filter: Dict = None) -> List[Dict]:
+        """Derive agent summaries by joining stored agents with task provenance."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def telemetry_timeseries(
+        self, filter: Dict, fields: List, x_field: str = "started_at", limit: int = 1000
+    ) -> List[Dict]:
+        """Extract plottable rows of dot-notated fields from tasks."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def resolve_chart_data(self, data: Dict, context: Dict = None) -> Dict:
+        """Resolve a declarative chart spec into plottable rows.
+
+        Parameters
+        ----------
+        data : dict
+            Chart spec with keys: source, filter, group_by, metrics, x, y, sort, limit.
+        context : dict, optional
+            Dashboard-level filter ANDed into the card filter.
+
+        Returns
+        -------
+        dict
+            ``{"rows": [...], "count": int}``.
+        """
+        raise NotImplementedError
diff --git a/src/flowcept/commons/daos/docdb_dao/docdb_dao_utils.py b/src/flowcept/commons/daos/docdb_dao/docdb_dao_utils.py
new file mode 100644
index 00000000..6d930e29
--- /dev/null
+++ b/src/flowcept/commons/daos/docdb_dao/docdb_dao_utils.py
@@ -0,0 +1,150 @@
+"""Shared pure-utility helpers for DocumentDAO implementations.
+
+These helpers are used by both MongoDBDAO and LMDBDAO and carry no
+dependency on any web-framework or schema layer.
+"""
+
+from __future__ import annotations
+
+from collections import defaultdict
+from typing import Any, Dict, List, Optional
+
+
+from flowcept.commons.utils import to_epoch  # re-exported; defined in commons/utils.py
+
+ALLOWED_FILTER_OPERATORS = {
+    "$and",
+    "$or",
+    "$nor",
+    "$not",
+    "$exists",
+    "$eq",
+    "$ne",
+    "$gt",
+    "$gte",
+    "$lt",
+    "$lte",
+    "$in",
+    "$nin",
+    "$regex",
+}
+
+
+def validate_filter(filter_doc: Optional[Dict[str, Any]]) -> None:
+    """Validate a Mongo-style filter doc against the safe-operator allowlist.
+
+    Raises ValueError for any unsupported ``$`` operator or a logical operator
+    (``$and``, ``$or``, ``$nor``) whose value is not a list.
+    """
+
+    def _walk(value: Any) -> None:
+        if isinstance(value, dict):
+            for key, item in value.items():
+                if key.startswith("$"):
+                    if key not in ALLOWED_FILTER_OPERATORS:
+                        raise ValueError(f"Unsupported filter operator: {key}")
+                    if key in {"$and", "$or", "$nor"} and not isinstance(item, list):
+                        raise ValueError(f"{key} must be a list.")
+                _walk(item)
+        elif isinstance(value, list):
+            for item in value:
+                _walk(item)
+
+    _walk(filter_doc or {})
+
+
+def get_nested(item: Dict[str, Any], field: str) -> Any:
+    """Read a dot-notated field value from a document."""
+    current = item
+    for part in field.split("."):
+        if not isinstance(current, dict):
+            return None
+        current = current.get(part)
+    return current
+
+
+def _duration(doc: Dict[str, Any]) -> Optional[float]:
+    started, ended = to_epoch(doc.get("started_at")), to_epoch(doc.get("ended_at"))
+    if started is not None and ended is not None:
+        return ended - started
+    return None
+
+
+def _metric_key(metric: Dict[str, Any]) -> str:
+    """Return the canonical output key for a metric spec dict."""
+    field = metric.get("field", "")
+    agg = metric.get("agg", "count")
+    return f"{agg}_{field}" if field else agg
+
+
+def _merge_context_filter(card_filter: Dict[str, Any], context: Optional[Dict[str, Any]]) -> Dict[str, Any]:
+    """AND a card-level filter with a dashboard-level context filter."""
+    if not context:
+        return dict(card_filter)
+    if not card_filter:
+        return dict(context)
+    return {"$and": [context, card_filter]}
+
+
+def _merge_summary_rows(rows: List[Dict[str, Any]]) -> Dict[str, Any]:
+    """Combine per-(activity, status) rows into the task-summary response shape."""
+    status_counts: Dict[str, int] = defaultdict(int)
+    activities: Dict[str, Dict[str, Any]] = {}
+    total = 0
+    min_started, max_ended = None, None
+
+    for row in rows:
+        count = row.get("count") or 0
+        total += count
+        status = row.get("status") or "UNKNOWN"
+        status_counts[status] += count
+
+        activity = activities.setdefault(
+            str(row.get("activity_id")),
+            {
+                "activity_id": row.get("activity_id"),
+                "count": 0,
+                "status_counts": defaultdict(int),
+                "avg_duration": None,
+                "min_duration": None,
+                "max_duration": None,
+                "sum_duration": None,
+                "_weighted_sum": 0.0,
+                "_weighted_count": 0,
+            },
+        )
+        activity["count"] += count
+        activity["status_counts"][status] += count
+        for bound, op in (("min_duration", min), ("max_duration", max)):
+            if row.get(bound) is not None:
+                current = activity[bound]
+                activity[bound] = row[bound] if current is None else op(current, row[bound])
+        if row.get("sum_duration") is not None:
+            activity["sum_duration"] = (activity["sum_duration"] or 0) + row["sum_duration"]
+        if row.get("avg_duration") is not None:
+            activity["_weighted_sum"] += row["avg_duration"] * count
+            activity["_weighted_count"] += count
+
+        if row.get("min_started_at") is not None:
+            val = to_epoch(row["min_started_at"])
+            min_started = val if min_started is None else min(min_started, val)
+        if row.get("max_ended_at") is not None:
+            val = to_epoch(row["max_ended_at"])
+            max_ended = val if max_ended is None else max(max_ended, val)
+
+    activity_stats = []
+    for activity in activities.values():
+        if activity.pop("_weighted_count"):
+            activity["avg_duration"] = activity.pop("_weighted_sum") / activity["count"]
+        else:
+            activity.pop("_weighted_sum")
+        activity["status_counts"] = dict(activity["status_counts"])
+        activity_stats.append(activity)
+    activity_stats.sort(key=lambda a: str(a["activity_id"]))
+
+    return {
+        "count": total,
+        "status_counts": dict(status_counts),
+        "activity_stats": activity_stats,
+        "time_range": {"min_started_at": min_started, "max_ended_at": max_ended},
+    }
diff --git a/src/flowcept/commons/daos/docdb_dao/lmdb_dao.py b/src/flowcept/commons/daos/docdb_dao/lmdb_dao.py
index 85705946..c0b69527 100644
--- a/src/flowcept/commons/daos/docdb_dao/lmdb_dao.py
+++ b/src/flowcept/commons/daos/docdb_dao/lmdb_dao.py
@@ -39,12 +39,13 @@ def _open(self):
         path = LMDB_SETTINGS.get("path", "flowcept_lmdb")
         handle = LMDBDAO._shared_handles.get(path)
         if handle is None:
-            env = lmdb.open(path, map_size=10**12, max_dbs=4)
+            env = lmdb.open(path, map_size=10**12, max_dbs=5)
             handle = {
                 "env": env,
                 "tasks_db": env.open_db(b"tasks"),
                 "workflows_db": env.open_db(b"workflows"),
                 "agents_db": env.open_db(b"agents"),
+                "dashboards_db": env.open_db(b"dashboards"),
                 "ref_count": 0,
             }
             LMDBDAO._shared_handles[path] = handle
@@ -55,6 +56,7 @@ def _open(self):
         self._tasks_db = handle["tasks_db"]
         self._workflows_db = handle["workflows_db"]
         self._agents_db = handle["agents_db"]
+        self._dashboards_db = handle["dashboards_db"]
         self._initialized = True
         self._is_closed = False
 
@@ -136,6 +138,20 @@ def insert_or_update_workflow(self, wf_obj: WorkflowObject):
             self.logger.exception(e)
             return False
 
+    def save_workflow_domain_data_schema(self, workflow_id: str, fields: Dict):
+        """Update selected workflow fields without replacing the full document."""
+        try:
+            with self._env.begin(write=True, db=self._workflows_db) as txn:
+                key = workflow_id.encode()
+                existing = txn.get(key)
+                doc = json.loads(existing.decode()) if existing else {"workflow_id": workflow_id, "type": "workflow"}
+                doc.update(fields)
+                txn.put(key, json.dumps(doc).encode())
+            return True
+        except Exception as e:
+            self.logger.exception(e)
+            return False
+
     def insert_or_update_agent(self, agent_obj: AgentObject):
         """Insert or update an agent document.
 
@@ -160,6 +176,21 @@ def insert_or_update_agent(self, agent_obj: AgentObject):
             self.logger.exception(e)
             return False
 
+    def liveness_test(self) -> bool:
+        """Return True when LMDB is enabled and the environment is open."""
+        from flowcept.configs import LMDB_ENABLED
+
+        if not LMDB_ENABLED:
+            self.logger.warning("LMDB liveness check: LMDB_ENABLED is False — store is disabled.")
+            return False
+        try:
+            with self._env.begin():
+                pass
+            return True
+        except Exception as e:
+            self.logger.error(f"LMDB liveness check failed: {e}")
+            return False
+
     def delete_task_keys(self, key_name, keys_list: List[str]) -> bool:
         """Delete task documents by a key value list.
 
@@ -228,61 +259,43 @@ def count_workflows(self) -> int:
 
     @staticmethod
     def _match_filter(entry, filter):
-        """
-        Check if an entry matches the filter criteria.
+        """Check if an entry matches a Mongo-style filter dict.
 
-        Parameters
-        ----------
-        entry : dict
-            The data entry to check.
-        filter : dict
-            The filter criteria.
-
-        Returns
-        -------
-        bool
-            True if the entry matches the filter, otherwise False.
+        Supports: ``$and``, ``$or``, ``$eq``, ``$ne``, ``$gt``, ``$gte``,
+        ``$lt``, ``$lte``, ``$in``, ``$nin``, and plain equality.
         """
+        from flowcept.commons.daos.docdb_dao.docdb_dao_utils import ALLOWED_FILTER_OPERATORS
+
+        _field_ops = {
+            "$eq": lambda v, o: v == o,
+            "$ne": lambda v, o: v != o,
+            "$gt": lambda v, o: v is not None and v > o,
+            "$gte": lambda v, o: v is not None and v >= o,
+            "$lt": lambda v, o: v is not None and v < o,
+            "$lte": lambda v, o: v is not None and v <= o,
+            "$in": lambda v, o: v in o,
+            "$nin": lambda v, o: v not in o,
+        }
+
         if not filter:
             return True
 
         for key, value in filter.items():
             if key == "$or":
-                if not isinstance(value, list) or not any(LMDBDAO._match_filter(entry, clause) for clause in value):
+                if not any(LMDBDAO._match_filter(entry, clause) for clause in value):
                     return False
             elif key == "$and":
-                if not isinstance(value, list) or not all(LMDBDAO._match_filter(entry, clause) for clause in value):
+                if not all(LMDBDAO._match_filter(entry, clause) for clause in value):
                     return False
+            elif key.startswith("$"):
+                if key not in ALLOWED_FILTER_OPERATORS:
+                    raise ValueError(f"Unsupported filter operator: {key}")
             elif isinstance(value, dict):
                 entry_val = entry.get(key)
                 for op, op_val in value.items():
-                    if op == "$in":
-                        if not isinstance(op_val, (list, set, tuple)) or entry_val not in op_val:
-                            return False
-                    elif op == "$nin":
-                        if not isinstance(op_val, (list, set, tuple)) or entry_val in op_val:
-                            return False
-                    elif op == "$eq":
-                        if entry_val != op_val:
-                            return False
-                    elif op == "$ne":
-                        if entry_val == op_val:
-                            return False
-                    elif op == "$gt":
-                        if entry_val is None or entry_val <= op_val:
-                            return False
-                    elif op == "$gte":
-                        if entry_val is None or entry_val < op_val:
-                            return False
-                    elif op == "$lt":
-                        if entry_val is None or entry_val >= op_val:
-                            return False
-                    elif op == "$lte":
-                        if entry_val is None or entry_val > op_val:
-                            return False
-                    else:
-                        if entry_val != value:
-                            return False
+                    fn = _field_ops.get(op)
+                    if fn is None or not fn(entry_val, op_val):
+                        return False
             else:
                 if entry.get(key) != value:
                     return False
@@ -465,6 +478,432 @@ def agent_query(
             remove_json_unserializables=remove_json_unserializables,
         )
 
+    def save_dashboard(self, dashboard: Dict) -> bool:
+        """Insert or replace a dashboard document.
+
+        Parameters
+        ----------
+        dashboard : dict
+            Dashboard document; must contain ``dashboard_id``.
+
+        Returns
+        -------
+        bool
+            True on success.
+        """
+        if self._is_closed:
+            self._open()
+        try:
+            with self._env.begin(write=True, db=self._dashboards_db) as txn:
+                key = dashboard["dashboard_id"].encode()
+                txn.put(key, json.dumps(dashboard).encode())
+            return True
+        except Exception as e:
+            self.logger.exception(e)
+            return False
+
+    def get_dashboard(self, dashboard_id: str) -> Dict:
+        """Get a dashboard document by id.
+
+        Parameters
+        ----------
+        dashboard_id : str
+            Dashboard identifier.
+
+        Returns
+        -------
+        dict or None
+            The dashboard document, or None when not found.
+        """
+        if self._is_closed:
+            self._open()
+        try:
+            with self._env.begin(db=self._dashboards_db) as txn:
+                value = txn.get(dashboard_id.encode())
+                return json.loads(value.decode()) if value else None
+        except Exception as e:
+            self.logger.exception(e)
+            return None
+
+    def list_dashboards(self, filter: Dict = None) -> List[Dict]:
+        """List dashboard documents, optionally filtered.
+
+        Parameters
+        ----------
+        filter : dict, optional
+            Key/value pairs to match against stored documents (equality only).
+
+        Returns
+        -------
+        list of dict
+            Matching dashboard documents.
+        """
+        if self._is_closed:
+            self._open()
+        try:
+            results = []
+            with self._env.begin(db=self._dashboards_db) as txn:
+                cursor = txn.cursor()
+                for _, value in cursor:
+                    doc = json.loads(value.decode())
+                    if filter is None or all(doc.get(k) == v for k, v in filter.items()):
+                        results.append(doc)
+            return results
+        except Exception as e:
+            self.logger.exception(e)
+            return []
+
+    def delete_dashboard(self, dashboard_id: str) -> bool:
+        """Delete a dashboard document by id.
+
+        Parameters
+        ----------
+        dashboard_id : str
+            Dashboard identifier.
+
+        Returns
+        -------
+        bool
+            True when a document was deleted, False otherwise.
+        """
+        if self._is_closed:
+            self._open()
+        try:
+            with self._env.begin(write=True, db=self._dashboards_db) as txn:
+                return txn.delete(dashboard_id.encode())
+        except Exception as e:
+            self.logger.exception(e)
+            return False
+
+    def task_summary(self, filter: Dict) -> Dict:
+        """Summarize tasks via in-process aggregation (LMDB path).
+
+        Returns status counts, per-activity stats, and time range for tasks matching filter.
+        """
+        from flowcept.commons.daos.docdb_dao.docdb_dao_utils import _merge_summary_rows, _duration
+
+        docs = (
+            self.task_query(
+                filter=filter,
+                projection=["activity_id", "status", "started_at", "ended_at"],
+            )
+            or []
+        )
+        groups: Dict = {}
+        for doc in docs:
+            key = (doc.get("activity_id"), doc.get("status"))
+            group = groups.setdefault(
+                key,
+                {
+                    "activity_id": key[0],
+                    "status": key[1],
+                    "count": 0,
+                    "durations": [],
+                    "min_started_at": None,
+                    "max_ended_at": None,
+                },
+            )
+            group["count"] += 1
+            dur = _duration(doc)
+            if dur is not None:
+                group["durations"].append(dur)
+            started, ended = doc.get("started_at"), doc.get("ended_at")
+            if isinstance(started, (int, float)):
+                current = group["min_started_at"]
+                group["min_started_at"] = started if current is None else min(current, started)
+            if isinstance(ended, (int, float)):
+                current = group["max_ended_at"]
+                group["max_ended_at"] = ended if current is None else max(current, ended)
+        rows = []
+        for group in groups.values():
+            durations = group.pop("durations")
+            group["avg_duration"] = sum(durations) / len(durations) if durations else None
+            group["min_duration"] = min(durations) if durations else None
+            group["max_duration"] = max(durations) if durations else None
+            group["sum_duration"] = sum(durations) if durations else None
+            rows.append(group)
+        return _merge_summary_rows(rows)
+
+    def derive_campaigns(self, campaign_id: str = None) -> List[Dict]:
+        """Derive campaign summaries via in-process aggregation (LMDB path)."""
+        from flowcept.commons.daos.docdb_dao.docdb_dao_utils import to_epoch
+
+        campaigns: Dict = {}
+
+        def _campaign(cid):
+            return campaigns.setdefault(
+                cid,
+                {
+                    "campaign_id": cid,
+                    "workflow_count": 0,
+                    "task_count": 0,
+                    "users": set(),
+                    "workflow_names": set(),
+                    "first_ts": None,
+                    "last_ts": None,
+                },
+            )
+
+        def _expand(record, *values):
+            for raw in values:
+                val = to_epoch(raw)
+                if val is None:
+                    continue
+                record["first_ts"] = val if record["first_ts"] is None else min(record["first_ts"], val)
+                record["last_ts"] = val if record["last_ts"] is None else max(record["last_ts"], val)
+
+        wf_filter = {"campaign_id": {"$exists": True, "$ne": None}}
+        if campaign_id is not None:
+            wf_filter["campaign_id"] = campaign_id
+        for doc in self.workflow_query(filter=wf_filter) or []:
+            if not doc.get("campaign_id"):
+                continue
+            record = _campaign(doc["campaign_id"])
+            record["workflow_count"] += 1
+            if doc.get("user"):
+                record["users"].add(doc["user"])
+            if doc.get("name"):
+                record["workflow_names"].add(doc["name"])
+            _expand(record, doc.get("utc_timestamp"))
+
+        for doc in self.task_query(filter=wf_filter, projection=["campaign_id", "started_at", "ended_at"]) or []:
+            if not doc.get("campaign_id"):
+                continue
+            record = _campaign(doc["campaign_id"])
+            record["task_count"] += 1
+            _expand(record, doc.get("started_at"), doc.get("ended_at"))
+
+        results = []
+        for record in campaigns.values():
+            record["users"] = sorted(record["users"])
+            record["workflow_names"] = sorted(record["workflow_names"])
+            results.append(record)
+        results.sort(
+            key=lambda r: (1, r["last_ts"]) if r["last_ts"] is not None else (0, float("-inf")),
+            reverse=True,
+        )
+        return results
+
+    def derive_agents(self, filter: Dict = None) -> List[Dict]:
+        """Derive agent summaries via in-process aggregation (LMDB path)."""
+
+        def _ts(val):
+            if val is None:
+                return None
+            if isinstance(val, (int, float)):
+                return float(val)
+            from datetime import datetime as _dt
+
+            if isinstance(val, _dt):
+                return val.timestamp()
+            if isinstance(val, str):
+                try:
+                    return _dt.fromisoformat(val.replace("Z", "+00:00")).timestamp()
+                except Exception:
+                    return None
+            return None
+
+        try:
+            stored = self.agent_query(filter=filter or {}) or []
+        except Exception as e:
+            self.logger.error(f"Error querying stored agents: {e}")
+            stored = []
+        stored = [a for a in stored if a.get("agent_id") not in ("train_agent_id", "orchestrator_agent_id")]
+        if not stored:
+            return []
+
+        agent_ids = [a["agent_id"] for a in stored if "agent_id" in a]
+        docs = (
+            self.task_query(
+                filter={"agent_id": {"$in": agent_ids}},
+                projection=[
+                    "agent_id",
+                    "activity_id",
+                    "source_agent_id",
+                    "campaign_id",
+                    "workflow_id",
+                    "registered_at",
+                ],
+            )
+            or []
+        )
+
+        stats_map: Dict = {}
+        for doc in docs:
+            agent_id = doc.get("agent_id")
+            if not agent_id:
+                continue
+            record = stats_map.setdefault(
+                agent_id,
+                {
+                    "task_count": 0,
+                    "activities": set(),
+                    "source_agent_ids": set(),
+                    "campaign_ids": set(),
+                    "workflow_ids": set(),
+                    "last_active": None,
+                },
+            )
+            record["task_count"] += 1
+            for key, field in (
+                ("activities", "activity_id"),
+                ("source_agent_ids", "source_agent_id"),
+                ("campaign_ids", "campaign_id"),
+                ("workflow_ids", "workflow_id"),
+            ):
+                if doc.get(field):
+                    record[key].add(doc[field])
+            ts = _ts(doc.get("registered_at"))
+            if ts is not None:
+                current = record["last_active"]
+                record["last_active"] = ts if current is None else max(current, ts)
+        for record in stats_map.values():
+            for key in ("activities", "source_agent_ids", "campaign_ids", "workflow_ids"):
+                record[key] = sorted(record[key])
+
+        agents = []
+        for sa in stored:
+            agent_id = sa["agent_id"]
+            stat = stats_map.get(
+                agent_id,
+                {
+                    "task_count": 0,
+                    "activities": [],
+                    "source_agent_ids": [],
+                    "campaign_ids": [],
+                    "workflow_ids": [],
+                    "last_active": None,
+                },
+            )
+            if stat["task_count"] == 0:
+                continue
+            agents.append(
+                {
+                    "agent_id": agent_id,
+                    "task_count": stat["task_count"],
+                    "activities": stat["activities"],
+                    "source_agent_ids": stat["source_agent_ids"],
+                    "campaign_ids": stat["campaign_ids"],
+                    "workflow_ids": stat["workflow_ids"],
+                    "last_active": stat["last_active"],
+                    "name": sa.get("name"),
+                    "workflow_id": sa.get("workflow_id"),
+                    "registered_at": _ts(sa.get("registered_at")),
+                }
+            )
+        agents.sort(
+            key=lambda a: (1, a["registered_at"]) if a["registered_at"] is not None else (0, float("-inf")),
+            reverse=True,
+        )
+        return agents
+
+    def telemetry_timeseries(
+        self, filter: Dict, fields: List, x_field: str = "started_at", limit: int = 1000
+    ) -> List[Dict]:
+        """Extract plottable rows of dot-notated fields from tasks (LMDB path)."""
+        from flowcept.commons.daos.docdb_dao.docdb_dao_utils import get_nested
+
+        top_level = sorted({f.split(".")[0] for f in fields} | {x_field.split(".")[0]})
+        docs = (
+            self.task_query(
+                filter=filter,
+                projection=["task_id", "activity_id"] + top_level,
+                limit=limit,
+            )
+            or []
+        )
+        rows = []
+        for doc in docs:
+            row = {
+                x_field: get_nested(doc, x_field),
+                "task_id": doc.get("task_id"),
+                "activity_id": doc.get("activity_id"),
+            }  # noqa: E501
+            row.update({f: get_nested(doc, f) for f in fields})
+            rows.append(row)
+        rows.sort(key=lambda r: (r[x_field] is None, r[x_field]))
+        return rows
+
+    def resolve_chart_data(self, data: Dict, context: Dict = None) -> Dict:
+        """Resolve a declarative chart spec into plottable rows (LMDB path)."""
+        from collections import defaultdict
+
+        from flowcept.commons.daos.docdb_dao.docdb_dao_utils import (
+            _merge_context_filter,
+            _metric_key,
+            get_nested,
+            to_epoch,
+        )
+
+        card_filter = data.get("filter") or {}
+        query_filter = _merge_context_filter(card_filter, context)
+        source = data.get("source", "tasks")
+        limit = data.get("limit") or 1000
+        group_by = data.get("group_by")
+        metrics = data.get("metrics") or []
+        x_field = data.get("x")
+        y_fields = data.get("y") or []
+
+        if source == "collection_sizes":
+            # LMDB has no bsonSize equivalent; return empty.
+            return {"rows": [], "count": 0}
+
+        if group_by or metrics:
+            metrics = metrics or [{"field": "", "agg": "count"}]
+            has_elapsed = any(m.get("field") == "elapsed" for m in metrics)
+            fields = sorted({m["field"] for m in metrics if m.get("field") and m["field"] != "elapsed"})
+            elapsed_fields = ["started_at", "ended_at"] if has_elapsed else []
+            top_level = sorted(
+                {f.split(".")[0] for f in fields}
+                | ({group_by.split(".")[0]} if group_by else set())
+                | set(elapsed_fields)
+            )
+            docs = self.query(collection=source, filter=query_filter, projection=top_level or None) or []
+            grouped: Dict = defaultdict(list)
+            for doc in docs:
+                grouped[get_nested(doc, group_by) if group_by else None].append(doc)
+            out = []
+            for key, group_docs in grouped.items():
+                record = {group_by or "group": key}
+                for metric in metrics:
+                    field = metric.get("field", "")
+                    agg = metric.get("agg", "count")
+                    if field == "elapsed":
+                        values = []
+                        for d in group_docs:
+                            s, e = to_epoch(d.get("started_at")), to_epoch(d.get("ended_at"))
+                            if s is not None and e is not None:
+                                values.append(e - s)
+                    else:
+                        values = [v for v in (get_nested(d, field) for d in group_docs) if isinstance(v, (int, float))]
+                    mk = _metric_key(metric)
+                    if agg == "count":
+                        record[mk] = len(group_docs)
+                    elif not values:
+                        record[mk] = None
+                    elif agg == "avg":
+                        record[mk] = sum(values) / len(values)
+                    elif agg == "sum":
+                        record[mk] = sum(values)
+                    elif agg == "min":
+                        record[mk] = min(values)
+                    elif agg == "max":
+                        record[mk] = max(values)
+                out.append(record)
+            out.sort(key=lambda r: str(r.get(group_by or "group")))
+            rows = out[:limit]
+            return {"rows": rows, "count": len(rows)}
+
+        if x_field and y_fields:
+            rows = self.telemetry_timeseries(query_filter, fields=y_fields, x_field=x_field, limit=limit)
+            return {"rows": rows[:limit], "count": len(rows[:limit])}
+
+        sort_raw = data.get("sort")
+        sort = None if not sort_raw else [(s["field"], s["order"]) for s in sort_raw]
+        rows = self.query(collection=source, filter=query_filter, limit=limit, sort=sort) or []
+        rows = rows[:limit]
+        return {"rows": rows, "count": len(rows)}
+
     def close(self):
         """Close lmdb."""
         if getattr(self, "_initialized"):
@@ -518,16 +957,11 @@ def dump_to_file(self, collection, filter, output_file, export_format, should_zi
 
     def save_or_update_object(
         self,
+        blob_obj,
         object,
-        object_id,
-        task_id,
-        workflow_id,
-        object_type,
-        custom_metadata,
-        save_data_in_collection,
-        pickle_,
+        save_data_in_collection=False,
+        pickle_=False,
         control_version=False,
-        tags=None,
     ):
         """Save object."""
         raise NotImplementedError
diff --git a/src/flowcept/commons/daos/docdb_dao/mongodb_dao.py b/src/flowcept/commons/daos/docdb_dao/mongodb_dao.py
index 920829e5..75f1cd8b 100644
--- a/src/flowcept/commons/daos/docdb_dao/mongodb_dao.py
+++ b/src/flowcept/commons/daos/docdb_dao/mongodb_dao.py
@@ -6,7 +6,6 @@
 import io
 import json
 from uuid import uuid4
-from datetime import datetime, timezone
 
 import pickle
 import zipfile
@@ -580,11 +579,6 @@ def delete_campaign_data(self, campaign_id: str) -> dict:
             "agents": agents_deleted,
         }
 
-    @staticmethod
-    def _utc_now():
-        """Get timezone-aware UTC timestamp."""
-        return datetime.now(timezone.utc)
-
     @staticmethod
     def _payload_to_bytes(payload):
         """Convert supported payload types to bytes for hashing/size metadata."""
@@ -758,6 +752,22 @@ def insert_or_update_workflow(self, workflow_obj: WorkflowObject) -> bool:
             self.logger.exception(e)
             return False
 
+    def save_workflow_domain_data_schema(self, workflow_id: str, fields: Dict) -> bool:
+        """Update selected workflow fields without replacing the full document."""
+        if workflow_id is None:
+            self.logger.exception("The workflow identifier cannot be none.")
+            return False
+        try:
+            result = self._wfs_collection.update_one(
+                {WorkflowObject.workflow_id_field(): workflow_id},
+                {"$set": fields},
+                upsert=True,
+            )
+            return result.matched_count > 0 or result.upserted_id is not None
+        except Exception as e:
+            self.logger.exception(e)
+            return False
+
     def insert_or_update_agent(self, agent_obj: AgentObject) -> bool:
         """Insert or update agent."""
         _dict = agent_obj.to_dict().copy()
@@ -887,27 +897,25 @@ def liveness_test(self) -> bool:
 
     def save_or_update_object(
         self,
+        blob_obj,
         object,
-        object_id=None,
-        task_id=None,
-        workflow_id=None,
-        object_type=None,
-        custom_metadata=None,
         save_data_in_collection=False,
         pickle_=False,
         control_version=False,
-        tags=None,
     ):
         """Save an object."""
-        if object_id is None:
-            object_id = str(uuid4())
-        now = MongoDBDAO._utc_now()
+        from time import time
         from flowcept.configs import FLOWCEPT_USER
 
-        actor = FLOWCEPT_USER
+        if blob_obj.object_id is None:
+            blob_obj.object_id = str(uuid4())
+        now = time()
+        if blob_obj.created_at is None:
+            blob_obj.created_at = now
+        blob_obj.updated_at = now
 
         obj_doc = {
-            "object_id": object_id,
+            "object_id": blob_obj.object_id,
             **self._build_blob_storage_doc(
                 object_payload=object,
                 save_data_in_collection=save_data_in_collection,
@@ -915,16 +923,16 @@ def save_or_update_object(
             ),
         }
 
-        if task_id is not None:
-            obj_doc["task_id"] = task_id
-        if workflow_id is not None:
-            obj_doc["workflow_id"] = workflow_id
-        if object_type is not None:
-            obj_doc["object_type"] = object_type
-        if custom_metadata is not None:
-            obj_doc["custom_metadata"] = custom_metadata
-        if tags is not None:
-            obj_doc["tags"] = list(tags)
+        if blob_obj.task_id is not None:
+            obj_doc["task_id"] = blob_obj.task_id
+        if blob_obj.workflow_id is not None:
+            obj_doc["workflow_id"] = blob_obj.workflow_id
+        if blob_obj.object_type is not None:
+            obj_doc["object_type"] = blob_obj.object_type
+        if blob_obj.custom_metadata is not None:
+            obj_doc["custom_metadata"] = blob_obj.custom_metadata
+        if blob_obj.tags is not None:
+            obj_doc["tags"] = list(blob_obj.tags)
 
         if not control_version:
             update_query = [
@@ -932,32 +940,35 @@ def save_or_update_object(
                     "$set": {
                         **obj_doc,
                         "version": {"$add": [{"$ifNull": ["$version", -1]}, 1]},
+                        "created_at": {"$ifNull": ["$created_at", blob_obj.created_at]},
+                        "updated_at": blob_obj.updated_at,
                     }
                 }
             ]
             self._obj_collection.update_one(
-                {"object_id": object_id},
+                {"object_id": blob_obj.object_id},
                 update_query,
                 upsert=True,
             )
-            return object_id
+            return blob_obj.object_id
 
+        actor = FLOWCEPT_USER
         max_attempts = 5
         for attempt in range(max_attempts):
-            latest_doc = self._obj_collection.find_one({"object_id": object_id})
+            latest_doc = self._obj_collection.find_one({"object_id": blob_obj.object_id})
             if latest_doc is None:
                 insert_doc = {
                     **obj_doc,
                     "version": 0,
                     "prev_version": None,
-                    "created_at": now,
+                    "created_at": blob_obj.created_at,
                     "created_by": actor,
-                    "updated_at": now,
+                    "updated_at": blob_obj.updated_at,
                     "updated_by": actor,
                 }
                 try:
                     self._obj_collection.insert_one(insert_doc)
-                    return object_id
+                    return blob_obj.object_id
                 except Exception:
                     if attempt == max_attempts - 1:
                         raise
@@ -969,20 +980,20 @@ def save_or_update_object(
                 **obj_doc,
                 "version": expected_version + 1,
                 "prev_version": expected_version,
-                "created_at": latest_doc.get("created_at", now),
+                "created_at": latest_doc.get("created_at", blob_obj.created_at),
                 "created_by": latest_doc.get("created_by", actor),
-                "updated_at": now,
+                "updated_at": blob_obj.updated_at,
                 "updated_by": actor,
             }
             try:
                 matched_count = self._update_with_optional_transaction(
-                    object_id=object_id,
+                    object_id=blob_obj.object_id,
                     expected_version=expected_version,
                     latest_doc=latest_doc,
                     update_doc=update_doc,
                 )
                 if matched_count == 1:
-                    return object_id
+                    return blob_obj.object_id
                 # CAS failed; remove potential duplicate history append on next trial by ignoring dup insert.
                 sleep(0.02 * (attempt + 1))
             except Exception as e:
@@ -992,7 +1003,7 @@ def save_or_update_object(
                 sleep(0.02 * (attempt + 1))
                 continue
 
-        raise ValueError(f"Could not update object_id={object_id} due to repeated concurrent CAS failures.")
+        raise ValueError(f"Could not update object_id={blob_obj.object_id} due to repeated concurrent CAS failures.")
 
     def update_object_metadata(
         self,
@@ -1008,10 +1019,11 @@ def update_object_metadata(
         if object_id is None:
             raise ValueError("object_id must not be None.")
 
+        from time import time
         from flowcept.configs import FLOWCEPT_USER
 
         actor = FLOWCEPT_USER
-        now = MongoDBDAO._utc_now()
+        now = time()
         set_fields = {}
 
         if custom_metadata is not None:
@@ -1820,3 +1832,336 @@ def get_node_positions(self, workflow_id: str, graph_type: str) -> Dict:
         except Exception as e:
             self.logger.exception(e)
             return {}
+
+    def task_summary(self, filter: Dict) -> Dict:
+        """Summarize tasks via Mongo aggregation pipeline.
+
+        Returns status counts, per-activity stats, and time range for tasks matching filter.
+        """
+        from flowcept.commons.daos.docdb_dao.docdb_dao_utils import _merge_summary_rows
+
+        match = [{"$match": filter}] if filter else []
+        rows = (
+            self.raw_pipeline(
+                match
+                + [
+                    {
+                        "$group": {
+                            "_id": {"activity_id": "$activity_id", "status": "$status"},
+                            "count": {"$sum": 1},
+                            "avg_duration": {"$avg": {"$subtract": ["$ended_at", "$started_at"]}},
+                            "min_duration": {"$min": {"$subtract": ["$ended_at", "$started_at"]}},
+                            "max_duration": {"$max": {"$subtract": ["$ended_at", "$started_at"]}},
+                            "sum_duration": {"$sum": {"$subtract": ["$ended_at", "$started_at"]}},
+                            "min_started_at": {"$min": "$started_at"},
+                            "max_ended_at": {"$max": "$ended_at"},
+                        }
+                    }
+                ],
+                collection="tasks",
+            )
+            or []
+        )
+        return _merge_summary_rows(
+            [
+                {
+                    "activity_id": row["_id"].get("activity_id"),
+                    "status": row["_id"].get("status"),
+                    **{k: row.get(k) for k in row if k != "_id"},
+                }
+                for row in rows
+            ]
+        )
+
+    def derive_campaigns(self, campaign_id: str = None) -> List[Dict]:
+        """Derive campaign summaries by grouping workflows and tasks by campaign_id.
+
+        Parameters
+        ----------
+        campaign_id : str, optional
+            When provided, only the matching campaign is returned.
+        """
+        from flowcept.commons.daos.docdb_dao.docdb_dao_utils import to_epoch
+
+        campaigns: Dict = {}
+
+        def _campaign(cid):
+            return campaigns.setdefault(
+                cid,
+                {
+                    "campaign_id": cid,
+                    "workflow_count": 0,
+                    "task_count": 0,
+                    "users": set(),
+                    "workflow_names": set(),
+                    "first_ts": None,
+                    "last_ts": None,
+                },
+            )
+
+        def _expand(record, *values):
+            for raw in values:
+                val = to_epoch(raw)
+                if val is None:
+                    continue
+                record["first_ts"] = val if record["first_ts"] is None else min(record["first_ts"], val)
+                record["last_ts"] = val if record["last_ts"] is None else max(record["last_ts"], val)
+
+        _base_match: Dict = {"campaign_id": {"$exists": True, "$ne": None}}
+        if campaign_id:
+            _base_match["campaign_id"] = campaign_id
+
+        wf_rows = (
+            self.raw_pipeline(
+                [
+                    {"$match": _base_match},
+                    {
+                        "$group": {
+                            "_id": "$campaign_id",
+                            "workflow_count": {"$sum": 1},
+                            "users": {"$addToSet": "$user"},
+                            "workflow_names": {"$addToSet": "$name"},
+                            "first_ts": {"$min": "$utc_timestamp"},
+                            "last_ts": {"$max": "$utc_timestamp"},
+                        }
+                    },
+                ],
+                collection="workflows",
+            )
+            or []
+        )
+
+        task_rows = (
+            self.raw_pipeline(
+                [
+                    {"$match": _base_match},
+                    {
+                        "$group": {
+                            "_id": "$campaign_id",
+                            "task_count": {"$sum": 1},
+                            "first_ts": {"$min": "$started_at"},
+                            "last_ts": {"$max": "$ended_at"},
+                        }
+                    },
+                ],
+                collection="tasks",
+            )
+            or []
+        )
+
+        for row in wf_rows:
+            record = _campaign(row["_id"])
+            record["workflow_count"] = row.get("workflow_count", 0)
+            record["users"].update(u for u in row.get("users", []) if u)
+            record["workflow_names"].update(n for n in row.get("workflow_names", []) if n)
+            _expand(record, row.get("first_ts"), row.get("last_ts"))
+        for row in task_rows:
+            record = _campaign(row["_id"])
+            record["task_count"] = row.get("task_count", 0)
+            _expand(record, row.get("first_ts"), row.get("last_ts"))
+
+        results = []
+        for record in campaigns.values():
+            record["users"] = sorted(record["users"])
+            record["workflow_names"] = sorted(record["workflow_names"])
+            results.append(record)
+        results.sort(
+            key=lambda r: (1, r["last_ts"]) if r["last_ts"] is not None else (0, float("-inf")),
+            reverse=True,
+        )
+        return results
+
+    def derive_agents(self, filter: Dict = None) -> List[Dict]:
+        """Derive agent summaries by joining stored agents with task provenance."""
+
+        def _ts(val):
+            if val is None:
+                return None
+            if isinstance(val, (int, float)):
+                return float(val)
+            from datetime import datetime as _dt
+
+            if isinstance(val, _dt):
+                return val.timestamp()
+            if isinstance(val, str):
+                try:
+                    return _dt.fromisoformat(val.replace("Z", "+00:00")).timestamp()
+                except Exception:
+                    return None
+            return None
+
+        try:
+            stored = self.agent_query(filter=filter or {}) or []
+        except Exception as e:
+            self.logger.error(f"Error querying stored agents: {e}")
+            stored = []
+        stored = [a for a in stored if a.get("agent_id") not in ("train_agent_id", "orchestrator_agent_id")]
+        if not stored:
+            return []
+
+        agent_ids = [a["agent_id"] for a in stored if "agent_id" in a]
+        rows = (
+            self.raw_pipeline(
+                [
+                    {"$match": {"agent_id": {"$in": agent_ids}}},
+                    {
+                        "$group": {
+                            "_id": "$agent_id",
+                            "task_count": {"$sum": 1},
+                            "activities": {"$addToSet": "$activity_id"},
+                            "source_agent_ids": {"$addToSet": "$source_agent_id"},
+                            "campaign_ids": {"$addToSet": "$campaign_id"},
+                            "workflow_ids": {"$addToSet": "$workflow_id"},
+                            "last_active": {"$max": "$registered_at"},
+                        }
+                    },
+                ],
+                collection="tasks",
+            )
+            or []
+        )
+
+        stats_map = {
+            row["_id"]: {
+                "task_count": row.get("task_count", 0),
+                "activities": sorted(a for a in row.get("activities", []) if a),
+                "source_agent_ids": sorted(s for s in row.get("source_agent_ids", []) if s),
+                "campaign_ids": sorted(c for c in row.get("campaign_ids", []) if c),
+                "workflow_ids": sorted(w for w in row.get("workflow_ids", []) if w),
+                "last_active": _ts(row.get("last_active")),
+            }
+            for row in rows
+        }
+
+        agents = []
+        for sa in stored:
+            agent_id = sa["agent_id"]
+            stat = stats_map.get(
+                agent_id,
+                {
+                    "task_count": 0,
+                    "activities": [],
+                    "source_agent_ids": [],
+                    "campaign_ids": [],
+                    "workflow_ids": [],
+                    "last_active": None,
+                },
+            )
+            if stat["task_count"] == 0:
+                continue
+            agents.append(
+                {
+                    "agent_id": agent_id,
+                    "task_count": stat["task_count"],
+                    "activities": stat["activities"],
+                    "source_agent_ids": stat["source_agent_ids"],
+                    "campaign_ids": stat["campaign_ids"],
+                    "workflow_ids": stat["workflow_ids"],
+                    "last_active": stat["last_active"],
+                    "name": sa.get("name"),
+                    "workflow_id": sa.get("workflow_id"),
+                    "registered_at": _ts(sa.get("registered_at")),
+                }
+            )
+        agents.sort(
+            key=lambda a: (1, a["registered_at"]) if a["registered_at"] is not None else (0, float("-inf")),
+            reverse=True,
+        )
+        return agents
+
+    def telemetry_timeseries(
+        self, filter: Dict, fields: List, x_field: str = "started_at", limit: int = 1000
+    ) -> List[Dict]:
+        """Extract plottable rows of dot-notated fields from tasks."""
+        from flowcept.commons.daos.docdb_dao.docdb_dao_utils import get_nested
+
+        top_level = sorted({f.split(".")[0] for f in fields} | {x_field.split(".")[0]})
+        docs = (
+            self.task_query(
+                filter=filter,
+                projection=["task_id", "activity_id"] + top_level,
+                limit=limit,
+            )
+            or []
+        )
+        rows = []
+        for doc in docs:
+            row = {
+                x_field: get_nested(doc, x_field),
+                "task_id": doc.get("task_id"),
+                "activity_id": doc.get("activity_id"),
+            }  # noqa: E501
+            row.update({f: get_nested(doc, f) for f in fields})
+            rows.append(row)
+        rows.sort(key=lambda r: (r[x_field] is None, r[x_field]))
+        return rows
+
+    def resolve_chart_data(self, data: Dict, context: Dict = None) -> Dict:
+        """Resolve a declarative chart spec into plottable rows (Mongo implementation)."""
+        from flowcept.commons.daos.docdb_dao.docdb_dao_utils import (
+            _merge_context_filter,
+            _metric_key,
+        )
+
+        card_filter = data.get("filter") or {}
+        query_filter = _merge_context_filter(card_filter, context)
+        source = data.get("source", "tasks")
+        limit = data.get("limit") or 1000
+        group_by = data.get("group_by")
+        metrics = data.get("metrics") or []
+        x_field = data.get("x")
+        y_fields = data.get("y") or []
+
+        if source == "collection_sizes":
+            rows = []
+            for collection in ("tasks", "objects", "workflows"):
+                try:
+                    result = self.raw_pipeline(
+                        ([{"$match": query_filter}] if query_filter else [])
+                        + [{"$group": {"_id": None, "bytes": {"$sum": {"$bsonSize": "$$ROOT"}}}}],
+                        collection=collection,
+                    )
+                    bytes_val = result[0]["bytes"] if result else 0
+                except Exception:
+                    bytes_val = 0
+                rows.append({"collection": collection, "sum_bytes": bytes_val})
+            return {"rows": rows, "count": len(rows)}
+
+        if group_by or metrics:
+            metrics = metrics or [{"field": "", "agg": "count"}]
+            has_elapsed = any(m.get("field") == "elapsed" for m in metrics)
+            if source in ("tasks", "workflows", "objects") and not has_elapsed:
+                group_id = f"${group_by}" if group_by else None
+                group_stage: Dict = {"_id": group_id}
+                mongo_key_map: Dict = {}
+                for metric in metrics:
+                    canonical = _metric_key(metric)
+                    mongo_key = canonical.replace(".", "_")
+                    mongo_key_map[mongo_key] = canonical
+                    if metric.get("agg") == "count":
+                        group_stage[mongo_key] = {"$sum": 1}
+                    else:
+                        group_stage[mongo_key] = {f"${metric['agg']}": f"${metric['field']}"}
+                pipeline = ([{"$match": query_filter}] if query_filter else []) + [{"$group": group_stage}]
+                raw = self.raw_pipeline(pipeline, collection=source) or []
+                out = []
+                for row in raw:
+                    record = {group_by or "group": row.pop("_id")}
+                    for mk, canonical in mongo_key_map.items():
+                        if mk in row:
+                            record[canonical] = row.pop(mk)
+                    record.update(row)
+                    out.append(record)
+                out.sort(key=lambda r: str(r.get(group_by or "group")))
+                rows = out[:limit]
+                return {"rows": rows, "count": len(rows)}
+
+        if x_field and y_fields:
+            rows = self.telemetry_timeseries(query_filter, fields=y_fields, x_field=x_field, limit=limit)
+            return {"rows": rows[:limit], "count": len(rows[:limit])}
+
+        sort_raw = data.get("sort")
+        sort = None if not sort_raw else [(s["field"], s["order"]) for s in sort_raw]
+        rows = self.query(collection=source, filter=query_filter, limit=limit, sort=sort) or []
+        rows = rows[:limit]
+        return {"rows": rows, "count": len(rows)}
diff --git a/src/flowcept/commons/daos/mq_dao/mq_dao_base.py b/src/flowcept/commons/daos/mq_dao/mq_dao_base.py
index 3d952523..44159beb 100644
--- a/src/flowcept/commons/daos/mq_dao/mq_dao_base.py
+++ b/src/flowcept/commons/daos/mq_dao/mq_dao_base.py
@@ -54,6 +54,10 @@ def build(*args, **kwargs) -> "MQDao":
             from flowcept.commons.daos.mq_dao.mq_dao_mofka import MQDaoMofka
 
             return MQDaoMofka(*args, **kwargs)
+        elif MQ_TYPE == "rabbitmq":
+            from flowcept.commons.daos.mq_dao.mq_dao_rabbitmq import MQDaoRabbitMQ
+
+            return MQDaoRabbitMQ(*args, **kwargs)
         else:
             raise NotImplementedError
 
diff --git a/src/flowcept/commons/daos/mq_dao/mq_dao_rabbitmq.py b/src/flowcept/commons/daos/mq_dao/mq_dao_rabbitmq.py
new file mode 100644
index 00000000..583cad98
--- /dev/null
+++ b/src/flowcept/commons/daos/mq_dao/mq_dao_rabbitmq.py
@@ -0,0 +1,196 @@
+"""MQ RabbitMQ (AMQP) module using pika."""
+
+from time import time
+from typing import Callable
+
+import msgpack
+import pika
+
+from flowcept.commons.daos.mq_dao.mq_dao_base import MQDao
+from flowcept.configs import MQ_CHANNEL, MQ_HOST, MQ_PORT, MQ_PASSWORD, MQ_USERNAME, MQ_VHOST
+
+
+class MQDaoRabbitMQ(MQDao):
+    """MQ DAO backed by RabbitMQ via AMQP (pika).
+
+    Uses a **fanout exchange** named after :data:`MQ_CHANNEL` so every
+    subscribed consumer receives every published message — the same
+    pub/sub semantic used by the Redis and Kafka backends.
+
+    A separate connection is maintained for publishing and subscribing so
+    the two roles never share a single pika channel.
+    """
+
+    def __init__(self, adapter_settings=None):
+        super().__init__(adapter_settings)
+        credentials = pika.PlainCredentials(
+            MQ_USERNAME or "guest",
+            MQ_PASSWORD or "guest",
+        )
+        self._conn_params = pika.ConnectionParameters(
+            host=MQ_HOST,
+            port=MQ_PORT,
+            virtual_host=MQ_VHOST,
+            credentials=credentials,
+            heartbeat=60,
+            blocked_connection_timeout=300,
+        )
+        self._pub_connection = None
+        self._pub_channel = None
+        self._sub_connection = None
+        self._sub_channel = None
+        self._queue_name = None
+        self._connect_producer()
+
+    # ------------------------------------------------------------------
+    # Producer helpers
+    # ------------------------------------------------------------------
+
+    def _connect_producer(self):
+        """Open a fresh producer connection and declare the fanout exchange."""
+        self._pub_connection = pika.BlockingConnection(self._conn_params)
+        self._pub_channel = self._pub_connection.channel()
+        self._pub_channel.exchange_declare(exchange=MQ_CHANNEL, exchange_type="fanout", durable=True)
+
+    def _ensure_producer(self):
+        """Re-connect the producer if the connection is closed or unhealthy."""
+        try:
+            if self._pub_connection and self._pub_connection.is_open:
+                # Non-blocking I/O pass — keeps heartbeats alive.
+                self._pub_connection.process_data_events(time_limit=0)
+                return
+        except Exception:
+            pass
+        self._connect_producer()
+
+    # ------------------------------------------------------------------
+    # MQDao interface
+    # ------------------------------------------------------------------
+
+    def subscribe(self):
+        """Open a consumer connection, declare an exclusive auto-delete queue, and bind it."""
+        self._sub_connection = pika.BlockingConnection(self._conn_params)
+        self._sub_channel = self._sub_connection.channel()
+        self._sub_channel.exchange_declare(exchange=MQ_CHANNEL, exchange_type="fanout", durable=True)
+        result = self._sub_channel.queue_declare(queue="", exclusive=True)
+        self._queue_name = result.method.queue
+        self._sub_channel.queue_bind(exchange=MQ_CHANNEL, queue=self._queue_name)
+
+    def unsubscribe(self):
+        """Cancel the consumer and close the subscription connection."""
+        try:
+            if self._sub_channel and self._sub_channel.is_open:
+                self._sub_channel.cancel()
+        except Exception:
+            pass
+        try:
+            if self._sub_connection and self._sub_connection.is_open:
+                self._sub_connection.close()
+        except Exception:
+            pass
+        self._sub_channel = None
+        self._sub_connection = None
+        self._queue_name = None
+
+    def message_listener(self, message_handler: Callable):
+        """Consume messages from the bound queue and forward them to *message_handler*.
+
+        Exits when *message_handler* returns ``False`` (or raises).
+        Always calls :meth:`unsubscribe` on exit.
+        """
+        try:
+            for method_frame, _props, body in self._sub_channel.consume(
+                self._queue_name,
+                auto_ack=False,
+                inactivity_timeout=1,
+            ):
+                if method_frame is None:
+                    # Heartbeat tick — no message delivered; keep looping.
+                    continue
+                try:
+                    msg_obj = msgpack.loads(body, strict_map_key=False)
+                    keep_going = message_handler(msg_obj)
+                    self._sub_channel.basic_ack(method_frame.delivery_tag)
+                    if not keep_going:
+                        break
+                except Exception as e:
+                    self.logger.error("Failed to process RabbitMQ message.")
+                    self.logger.exception(e)
+                    self._sub_channel.basic_nack(method_frame.delivery_tag, requeue=False)
+        except Exception as e:
+            self.logger.exception(e)
+        finally:
+            self.unsubscribe()
+
+    def send_message(self, message: dict, channel=MQ_CHANNEL, serializer=msgpack.dumps):
+        """Publish a single message to the fanout exchange."""
+        self._ensure_producer()
+        self._pub_channel.basic_publish(
+            exchange=channel,
+            routing_key="",
+            body=serializer(message),
+        )
+
+    def _send_message_timed(self, message: dict, channel=MQ_CHANNEL, serializer=msgpack.dumps):
+        """Timed variant of :meth:`send_message`."""
+        t1 = time()
+        self.send_message(message, channel, serializer)
+        t2 = time()
+        self._flush_events.append(["single", t1, t2, t2 - t1, len(str(message).encode())])
+
+    def _bulk_publish(self, buffer, channel=MQ_CHANNEL, serializer=msgpack.dumps):
+        """Publish all messages in *buffer* to the fanout exchange."""
+        self._ensure_producer()
+        for message in buffer:
+            try:
+                self._pub_channel.basic_publish(
+                    exchange=channel,
+                    routing_key="",
+                    body=serializer(message),
+                )
+            except Exception as e:
+                self.logger.exception(e)
+                self.logger.error(f"Message could not be flushed: {message}")
+        self.logger.debug(f"Flushed {len(buffer)} msgs to MQ!")
+
+    def _bulk_publish_timed(self, buffer, channel=MQ_CHANNEL, serializer=msgpack.dumps):
+        """Timed variant of :meth:`_bulk_publish`."""
+        total = 0
+        self._ensure_producer()
+        t1 = time()
+        for message in buffer:
+            try:
+                total += len(str(message).encode())
+                self._pub_channel.basic_publish(
+                    exchange=channel,
+                    routing_key="",
+                    body=serializer(message),
+                )
+            except Exception as e:
+                self.logger.exception(e)
+                self.logger.error(f"Message could not be flushed: {message}")
+        t2 = time()
+        self._flush_events.append(["bulk", t1, t2, t2 - t1, total])
+        self.logger.debug(f"Flushed {len(buffer)} msgs to MQ!")
+
+    def liveness_test(self) -> bool:
+        """Return True if the RabbitMQ broker is reachable."""
+        try:
+            conn = pika.BlockingConnection(
+                pika.ConnectionParameters(
+                    host=MQ_HOST,
+                    port=MQ_PORT,
+                    virtual_host=MQ_VHOST,
+                    credentials=pika.PlainCredentials(
+                        MQ_USERNAME or "guest",
+                        MQ_PASSWORD or "guest",
+                    ),
+                    heartbeat=10,
+                )
+            )
+            alive = conn.is_open
+            conn.close()
+            return alive
+        except Exception as e:
+            self.logger.exception(e)
+            return False
diff --git a/src/flowcept/commons/flowcept_dataclasses/agent_object.py b/src/flowcept/commons/flowcept_dataclasses/agent_object.py
index 367ab6ff..e7b1dca6 100644
--- a/src/flowcept/commons/flowcept_dataclasses/agent_object.py
+++ b/src/flowcept/commons/flowcept_dataclasses/agent_object.py
@@ -5,7 +5,7 @@
 from omegaconf import OmegaConf, DictConfig
 
 from flowcept.commons.utils import get_utc_now
-from flowcept.commons.sanitization import sanitize_json_like
+from flowcept.commons.utils import sanitize_json_like
 from flowcept.configs import (
     EXTRA_METADATA,
 )
diff --git a/src/flowcept/commons/flowcept_dataclasses/blob_object.py b/src/flowcept/commons/flowcept_dataclasses/blob_object.py
index d9c9f295..d7627836 100644
--- a/src/flowcept/commons/flowcept_dataclasses/blob_object.py
+++ b/src/flowcept/commons/flowcept_dataclasses/blob_object.py
@@ -31,6 +31,12 @@ class BlobObject:
     version: int = 0
     """Monotonic version of this blob object. Starts at ``0`` and increments on updates."""
 
+    created_at: float = None
+    """Epoch timestamp when the object was first persisted."""
+
+    updated_at: float = None
+    """Epoch timestamp when the object was last persisted or updated."""
+
     def __init__(
         self,
         object_id=None,
@@ -40,6 +46,8 @@ def __init__(
         custom_metadata=None,
         tags=None,
         version: int = 0,
+        created_at: float = None,
+        updated_at: float = None,
     ):
         self.object_id = object_id
         self.task_id = task_id
@@ -48,6 +56,8 @@ def __init__(
         self.custom_metadata = custom_metadata
         self.tags = tags
         self.version = 0 if version is None else int(version)
+        self.created_at = created_at
+        self.updated_at = updated_at
 
     @staticmethod
     def object_id_field():
@@ -84,7 +94,9 @@ def __repr__(self):
             f"object_type={repr(self.object_type)}, "
             f"custom_metadata={repr(self.custom_metadata)}, "
             f"tags={repr(self.tags)}, "
-            f"version={repr(self.version)})"
+            f"version={repr(self.version)}, "
+            f"created_at={repr(self.created_at)}, "
+            f"updated_at={repr(self.updated_at)})"
         )
 
     def __str__(self):
diff --git a/src/flowcept/commons/flowcept_dataclasses/task_object.py b/src/flowcept/commons/flowcept_dataclasses/task_object.py
index 21dbc295..6e830ed4 100644
--- a/src/flowcept/commons/flowcept_dataclasses/task_object.py
+++ b/src/flowcept/commons/flowcept_dataclasses/task_object.py
@@ -26,7 +26,24 @@ class TaskObject:
     """Constant type label for this object ("task")."""
 
     subtype: AnyStr = None
-    """Optional subtype of the task (e.g., iteration, ML step, custom)."""
+    """Optional subtype of the task for domain or framework-level classification.
+
+    For general ML workflows use :class:`~flowcept.commons.vocabulary.ML_Types`
+    (e.g., ``"ml_workflow"``, ``"learning"``).
+
+    For agentic AI provenance (PROV-AGENT model, arXiv:2508.02866) use
+    :class:`~flowcept.commons.vocabulary.PROV_AGENT`:
+
+    - ``"ai_model_invocation"`` (:attr:`~flowcept.commons.vocabulary.PROV_AGENT.AI_MODEL_INVOCATION`) —
+      a single LLM prompt→response call.  Captured automatically by
+      :class:`~flowcept.instrumentation.flowcept_agent_task.FlowceptLLM`.
+    - ``"agent_tool"`` (:attr:`~flowcept.commons.vocabulary.PROV_AGENT.AGENT_TOOL`) —
+      a tool execution by an AI agent.  Captured automatically by the
+      :func:`~flowcept.instrumentation.flowcept_agent_task.agent_flowcept_task` decorator.
+
+    Custom values such as ``"iteration"`` or ``"ml_step"`` are also allowed for
+    domain-specific tagging.
+    """
 
     task_id: AnyStr = None
     """Unique identifier of the task."""
diff --git a/src/flowcept/commons/flowcept_dataclasses/workflow_object.py b/src/flowcept/commons/flowcept_dataclasses/workflow_object.py
index b203175f..4e0f0098 100644
--- a/src/flowcept/commons/flowcept_dataclasses/workflow_object.py
+++ b/src/flowcept/commons/flowcept_dataclasses/workflow_object.py
@@ -4,10 +4,11 @@
 import msgpack
 from omegaconf import OmegaConf, DictConfig
 
+from flowcept.commons.vocabulary import Status
 from flowcept.version import __version__
 from flowcept.commons.utils import get_utc_now, get_git_info
 from flowcept.commons.flowcept_logger import FlowceptLogger
-from flowcept.commons.sanitization import sanitize_json_like
+from flowcept.commons.utils import sanitize_json_like
 from flowcept.configs import (
     settings,
     SYS_NAME,
@@ -69,6 +70,9 @@ class WorkflowObject:
     custom_metadata: Dict = None
     """User-defined metadata dictionary with additional annotations."""
 
+    workflow_domain_data_schema: Dict = None
+    """Workflow-scoped observed task schema snapshot. Mainly used by Flowcept Agent queries."""
+
     environment_id: str = None
     """Identifier for the runtime environment (e.g., conda env, container)."""
 
@@ -79,6 +83,7 @@ class WorkflowObject:
     """Optional free-form metadata for extensions not covered by other fields."""
 
     agent_id: AnyStr = None
+    """Identifier of the agent associated with this workflow, if any."""
 
     used: Dict = None
     """Inputs consumed by the workflow (datasets, arguments, or configuration values)."""
@@ -92,12 +97,20 @@ class WorkflowObject:
     subtype: AnyStr = None
     """Optional subtype of the workflow (e.g., data_prep_workflow, ml_workflow)."""
 
+    started_at: float = None
+    """Timestamp when the workflow execution started."""
+
+    ended_at: float = None
+    """Timestamp when the workflow execution ended."""
+
+    status: Status = None
+    """Execution status of the workflow (e.g., FINISHED, ERROR)."""
+
     def __init__(self, workflow_id=None, name=None, used=None, generated=None):
         self.workflow_id = workflow_id
         self.name = name
         self.used = used
         self.generated = generated
-        self.utc_timestamp = get_utc_now()
 
     @staticmethod
     def workflow_id_field():
@@ -109,9 +122,15 @@ def from_dict(dict_obj: Dict) -> "WorkflowObject":
         """Convert from dictionary."""
         wf_obj = WorkflowObject()
         for k, v in dict_obj.items():
+            if k == "status" and isinstance(v, str):
+                v = Status(v)
             setattr(wf_obj, k, v)
         return wf_obj
 
+    def workflow_is_finished(self) -> bool:
+        """Return True when this workflow has completed."""
+        return self.status in {Status.FINISHED, Status.ERROR}
+
     def to_dict(self):
         """Convert to dictionary."""
         result_dict = {}
@@ -185,13 +204,13 @@ def __repr__(self):
             f"machine_info={repr(self.machine_info)}, "
             f"flowcept_settings={repr(self.flowcept_settings)}, "
             f"flowcept_version={repr(self.flowcept_version)}, "
-            f"utc_timestamp={repr(self.utc_timestamp)}, "
             f"user={repr(self.user)}, "
             f"campaign_id={repr(self.campaign_id)}, "
             f"adapter_id={repr(self.adapter_id)}, "
             f"interceptor_ids={repr(self.interceptor_ids)}, "
             f"name={repr(self.name)}, "
             f"workflow_description={repr(self.workflow_description)}, "
+            f"workflow_domain_data_schema={repr(self.workflow_domain_data_schema)}, "
             f"used={repr(self.used)}, "
             f"generated={repr(self.generated)}, "
             f"custom_metadata={repr(self.custom_metadata)})"
diff --git a/src/flowcept/commons/query_utils.py b/src/flowcept/commons/query_utils.py
deleted file mode 100644
index dc58f1db..00000000
--- a/src/flowcept/commons/query_utils.py
+++ /dev/null
@@ -1,73 +0,0 @@
-"""Query utilities."""
-
-import numbers
-from datetime import timedelta
-from typing import List, Dict
-
-import pandas as pd
-
-from flowcept.commons.vocabulary import Status
-
-
-def get_doc_status(row):
-    """Get document status."""
-    if row.get("status"):
-        return row.get("status")
-    elif row.get("finished"):
-        return Status.FINISHED.name
-    elif row.get("error"):
-        return Status.ERROR.name
-    elif row.get("running"):
-        return Status.RUNNING.name
-    elif row.get("submitted"):
-        return Status.SUBMITTED.name
-    else:
-        return Status.UNKNOWN.name
-
-
-def to_datetime(logger, df, column_name, _shift_hours=0):
-    """Convert to datetime."""
-    if column_name in df.columns:
-        try:
-            df[column_name] = pd.to_datetime(df[column_name], unit="s") + timedelta(hours=_shift_hours)
-        except Exception as _e:
-            logger.info(_e)
-
-
-def _calc_telemetry_diff_for_row(start, end):
-    if isinstance(start, numbers.Number):
-        return end - start
-    elif type(start) is dict:
-        diff_dict = {}
-        for key in start:
-            diff_dict[key] = _calc_telemetry_diff_for_row(start[key], end[key])
-        return diff_dict
-
-    elif type(start) is list:
-        diff_list = []
-        for i in range(0, len(start)):
-            diff_list.append(_calc_telemetry_diff_for_row(start[i], end[i]))
-        return diff_list
-    elif type(start) is str:
-        return start
-    else:
-        raise Exception("This is unexpected", start, end, type(start), type(end))
-
-
-def calculate_telemetry_diff_for_docs(docs: List[Dict]):
-    """Calculate telemetry difference."""
-    new_docs = []
-    for doc in docs:
-        new_doc = doc.copy()
-        telemetry_start = new_doc.get("telemetry_at_start")
-        telemetry_end = new_doc.get("telemetry_at_end")
-        if telemetry_start is None or telemetry_end is None:
-            new_docs.append(new_doc)
-            continue
-        new_telemetry = dict()
-        for key in telemetry_start:
-            new_telemetry[key] = _calc_telemetry_diff_for_row(telemetry_start[key], telemetry_end[key])
-        new_doc["telemetry_diff"] = new_telemetry
-        new_docs.append(new_doc)
-
-    return new_docs
diff --git a/src/flowcept/commons/sanitization.py b/src/flowcept/commons/sanitization.py
deleted file mode 100644
index f052d427..00000000
--- a/src/flowcept/commons/sanitization.py
+++ /dev/null
@@ -1,34 +0,0 @@
-"""Sanitization helpers for JSON-like provenance data."""
-
-from __future__ import annotations
-
-import re
-from typing import Any, Dict
-
-SENSITIVE_KEY_PATTERNS = ("api_key", "access_key", "token", "secret", "password", "passwd", "credentials")
-SENSITIVE_VALUE_PATTERN = re.compile(r"\bsk-[A-Za-z0-9_-]+")
-
-
-def _redact_key_value(key: str, value: Any) -> Any:
-    key_l = key.lower()
-    if any(pat in key_l for pat in SENSITIVE_KEY_PATTERNS):
-        return "REDACTED"
-    if isinstance(value, str) and SENSITIVE_VALUE_PATTERN.search(value):
-        return "REDACTED"
-    return value
-
-
-def sanitize_json_like(value: Any) -> Any:
-    """Recursively sanitize dict/list structures."""
-    if isinstance(value, dict):
-        out: Dict[str, Any] = {}
-        for k, v in value.items():
-            out[str(k)] = sanitize_json_like(_redact_key_value(str(k), v))
-        return out
-    if isinstance(value, list):
-        return [sanitize_json_like(v) for v in value]
-    if isinstance(value, tuple):
-        return [sanitize_json_like(v) for v in value]
-    if isinstance(value, str) and SENSITIVE_VALUE_PATTERN.search(value):
-        return "REDACTED"
-    return value
diff --git a/src/flowcept/commons/task_data_preprocess.py b/src/flowcept/commons/task_data_preprocess.py
index 94ac90cf..283c964b 100644
--- a/src/flowcept/commons/task_data_preprocess.py
+++ b/src/flowcept/commons/task_data_preprocess.py
@@ -5,6 +5,111 @@
 from typing import Any
 
 
+class CpuSummary:
+    """CPU resource delta between task start and end.
+
+    Present in telemetry_summary only when CPU telemetry was captured.
+    All values are differences (end - start).
+    """
+
+    percent_all_diff: float = None
+    """Difference in overall CPU utilization percentage across all cores."""
+
+    user_time_diff: float = None
+    """Difference in average per-core CPU user-mode time (seconds)."""
+
+    system_time_diff: float = None
+    """Difference in CPU kernel (system) time (seconds)."""
+
+    idle_time_diff: float = None
+    """Difference in CPU idle time (seconds)."""
+
+
+class MemorySummary:
+    """Memory resource delta between task start and end.
+
+    Present in telemetry_summary only when memory telemetry was captured.
+    All values are differences (end - start).
+    """
+
+    used_mem_diff: float = None
+    """Difference in virtual memory used (bytes)."""
+
+    percent_diff: float = None
+    """Difference in virtual memory utilization percentage."""
+
+    swap_used_diff: float = None
+    """Difference in swap memory used (bytes)."""
+
+
+class DiskSummary:
+    """Disk I/O delta between task start and end.
+
+    Present in telemetry_summary only when disk telemetry was captured.
+    All values are differences (end - start).
+    """
+
+    read_bytes_diff: float = None
+    """Difference in total bytes read from disk."""
+
+    write_bytes_diff: float = None
+    """Difference in total bytes written to disk."""
+
+    read_count_diff: float = None
+    """Difference in number of disk read operations."""
+
+    write_count_diff: float = None
+    """Difference in number of disk write operations."""
+
+
+class NetworkSummary:
+    """Network I/O delta between task start and end.
+
+    Present in telemetry_summary only when network telemetry was captured.
+    All values are differences (end - start).
+    """
+
+    bytes_sent_diff: float = None
+    """Difference in bytes sent over the network."""
+
+    bytes_recv_diff: float = None
+    """Difference in bytes received over the network."""
+
+    packets_sent_diff: float = None
+    """Difference in number of network packets sent."""
+
+    packets_recv_diff: float = None
+    """Difference in number of network packets received."""
+
+
+class TelemetrySummary:
+    """Schema authority for the telemetry_summary field produced by summarize_telemetry().
+
+    This class is NOT instantiated at runtime. It exists solely to document
+    the fixed output schema of summarize_telemetry() so that static_schema_builder.py
+    can build accurate prompt context at MCP server startup.
+
+    Each sub-field (cpu, memory, disk, network) is present only when the
+    corresponding telemetry section was captured for that task and hardware.
+    GPU telemetry is not yet summarized (TODO).
+    """
+
+    duration_sec: float = None
+    """Task wall-clock duration in seconds (ended_at - started_at)."""
+
+    cpu: CpuSummary = None
+    """CPU usage deltas. Present only when CPU telemetry was captured."""
+
+    memory: MemorySummary = None
+    """Memory usage deltas. Present only when memory telemetry was captured."""
+
+    disk: DiskSummary = None
+    """Disk I/O deltas. Present only when disk telemetry was captured."""
+
+    network: NetworkSummary = None
+    """Network I/O deltas. Present only when network telemetry was captured."""
+
+
 def summarize_telemetry(task: Dict, logger) -> Dict:
     """
     Extract and compute the telemetry summary for a task based on start and end telemetry snapshots.
diff --git a/src/flowcept/commons/utils.py b/src/flowcept/commons/utils.py
index 376f256b..9a28fd5b 100644
--- a/src/flowcept/commons/utils.py
+++ b/src/flowcept/commons/utils.py
@@ -1,17 +1,24 @@
 """Utilities."""
 
 import argparse
+import base64
+import re
 import threading
 from datetime import datetime, timedelta, timezone
 import json
 from time import time, sleep
-from typing import Callable, List, Dict
+from typing import Any, Callable, List, Dict
 import os
 import platform
 import subprocess
 import types
 import numpy as np
 
+try:
+    from bson import ObjectId as _ObjectId
+except Exception:
+    _ObjectId = None
+
 from flowcept import configs
 from flowcept.commons.flowcept_dataclasses.task_object import TaskObject
 from flowcept.commons.flowcept_logger import FlowceptLogger
@@ -19,6 +26,30 @@
 from flowcept.commons.vocabulary import Status
 
 
+def to_epoch(value):
+    """Normalize a timestamp to epoch seconds.
+
+    Accepts float/int epoch-sec or epoch-ms, ISO string, or datetime object.
+    Returns None if the value cannot be interpreted as a timestamp.
+    """
+    if value is None:
+        return None
+    if isinstance(value, (int, float)):
+        return value / 1000.0 if value >= 1e12 else float(value)
+    if isinstance(value, str):
+        try:
+            dt = datetime.fromisoformat(value.replace("Z", "+00:00"))
+            return dt.replace(tzinfo=timezone.utc).timestamp() if dt.tzinfo is None else dt.timestamp()
+        except ValueError:
+            return None
+    try:
+        if isinstance(value, datetime):
+            return value.replace(tzinfo=timezone.utc).timestamp() if value.tzinfo is None else value.timestamp()
+    except Exception:
+        pass
+    return None
+
+
 def get_utc_now() -> float:
     """Get current UTC time as a timestamp (seconds since epoch)."""
     now = datetime.now(timezone.utc)
@@ -364,3 +395,80 @@ def __init__(self, fget):
 
     def __get__(self, instance, owner):
         return self.fget(owner)
+
+
+# ---------------------------------------------------------------------------
+# Sanitization helpers
+# ---------------------------------------------------------------------------
+
+_SENSITIVE_KEY_PATTERNS = ("api_key", "access_key", "token", "secret", "password", "passwd", "credentials")
+_SENSITIVE_VALUE_PATTERN = re.compile(r"\bsk-[A-Za-z0-9_-]+")
+
+
+def _redact_key_value(key: str, value: Any) -> Any:
+    key_l = key.lower()
+    if any(pat in key_l for pat in _SENSITIVE_KEY_PATTERNS):
+        return "REDACTED"
+    if isinstance(value, str) and _SENSITIVE_VALUE_PATTERN.search(value):
+        return "REDACTED"
+    return value
+
+
+def _is_sensitive_key(key: str) -> bool:
+    return any(pat in key.lower() for pat in _SENSITIVE_KEY_PATTERNS)
+
+
+def sanitize_json_like(value: Any, drop_sensitive_keys: bool = False, mongo_safe_keys: bool = False) -> Any:
+    """Recursively sanitize dict/list structures, redacting sensitive keys and values."""
+    if isinstance(value, dict):
+        out: Dict[str, Any] = {}
+        for k, v in value.items():
+            key = str(k)
+            if drop_sensitive_keys and _is_sensitive_key(key):
+                continue
+            output_key = key.replace(".", "_").replace("$", "_") if mongo_safe_keys else key
+            out[output_key] = sanitize_json_like(
+                _redact_key_value(key, v),
+                drop_sensitive_keys=drop_sensitive_keys,
+                mongo_safe_keys=mongo_safe_keys,
+            )
+        return out
+    if isinstance(value, (list, tuple)):
+        return [
+            sanitize_json_like(v, drop_sensitive_keys=drop_sensitive_keys, mongo_safe_keys=mongo_safe_keys)
+            for v in value
+        ]
+    if isinstance(value, str) and _SENSITIVE_VALUE_PATTERN.search(value):
+        return "REDACTED"
+    return value
+
+
+# ---------------------------------------------------------------------------
+# JSON serialization helpers for API responses
+# ---------------------------------------------------------------------------
+
+
+def _to_jsonable(value: Any, include_data: bool = False) -> Any:
+    """Recursively normalize values for JSON API responses."""
+    if value is None:
+        return None
+    if isinstance(value, (str, int, float, bool)):
+        return value
+    if isinstance(value, datetime):
+        return value.isoformat()
+    if isinstance(value, bytes):
+        return base64.b64encode(value).decode("ascii") if include_data else None
+    if _ObjectId is not None and isinstance(value, _ObjectId):
+        return str(value)
+    if isinstance(value, (list, tuple)):
+        return [_to_jsonable(item, include_data=include_data) for item in value]
+    if isinstance(value, dict):
+        return {
+            str(k): _to_jsonable(v, include_data=include_data) for k, v in value.items() if include_data or k != "data"
+        }
+    return str(value)
+
+
+def normalize_docs(docs: List[Dict[str, Any]], include_data: bool = False) -> List[Dict[str, Any]]:
+    """Normalize result documents for JSON API response."""
+    return [_to_jsonable(doc, include_data=include_data) for doc in docs]
diff --git a/src/flowcept/commons/vocabulary.py b/src/flowcept/commons/vocabulary.py
index dd505753..1e1d2c77 100644
--- a/src/flowcept/commons/vocabulary.py
+++ b/src/flowcept/commons/vocabulary.py
@@ -67,7 +67,52 @@ class ML_Types(str, Enum):
 
 
 class PROV_AGENT(str, Enum):
-    """Provenance agent used in Flowcept."""
+    """Activity subtype vocabulary for agentic AI workflows (PROV-AGENT model).
+
+    PROV-AGENT is a W3C PROV extension for capturing provenance of agentic AI
+    workflows (arXiv:2508.02866).  Each value here names a distinct
+    ``prov:Activity`` class in that model.  Flowcept records these as the
+    ``subtype`` field on :class:`~flowcept.commons.flowcept_dataclasses.task_object.TaskObject`,
+    enabling the UI and query layer to filter and visualise AI-agent activities
+    separately from regular workflow tasks.
+
+    W3C PROV mapping
+    ----------------
+    All values represent ``prov:Activity`` instances.  The associated entities
+    and relations are:
+
+    - **AIModelInvocation** *used* ``Prompt`` (entity) and *used* ``AIModel`` (entity).
+      ``ResponseData`` (entity) *wasGeneratedBy* the invocation.
+      The invocation *wasAssociatedWith* the ``AIAgent``.
+
+    - **AgentTool** *used* tool input arguments (``DomainData``).
+      Return values *wasGeneratedBy* the tool call.
+      The tool *wasAssociatedWith* the ``AIAgent``.
+      An ``AIModelInvocation`` that the tool triggers *wasInformedBy* the tool
+      call — this ``wasInformedBy`` edge is the key link for root-cause analysis
+      and downstream impact tracing.
+
+    Usage
+    -----
+    >>> from flowcept.commons.vocabulary import PROV_AGENT
+    >>> task_obj.subtype = PROV_AGENT.AI_MODEL_INVOCATION
+    >>> task_obj.subtype = PROV_AGENT.AGENT_TOOL
+    """
 
     AI_MODEL_INVOCATION = "ai_model_invocation"
+    """A single LLM prompt→response call (``AIModelInvocation`` in PROV-AGENT).
+
+    Captured automatically by :class:`~flowcept.instrumentation.flowcept_agent_task.FlowceptLLM`
+    for every ``.invoke()`` call.  Recorded fields: ``used.prompt``,
+    ``generated.response``, ``custom_metadata.llm_usage``,
+    ``custom_metadata.response_metadata``.
+    """
+
     AGENT_TOOL = "agent_tool"
+    """A tool execution by an AI agent (``AgentTool`` in PROV-AGENT).
+
+    Captured automatically by the
+    :func:`~flowcept.instrumentation.flowcept_agent_task.agent_flowcept_task`
+    decorator (applied to MCP tools and LangGraph tool nodes).  Recorded
+    fields: ``used`` = tool input arguments, ``generated`` = tool return value.
+    """
diff --git a/src/flowcept/configs.py b/src/flowcept/configs.py
index db9db765..cce59aa6 100644
--- a/src/flowcept/configs.py
+++ b/src/flowcept/configs.py
@@ -1,5 +1,6 @@
 """Configuration module."""
 
+import copy
 import os
 import socket
 import getpass
@@ -45,7 +46,7 @@ def _get_env_bool(name: str, default=False) -> bool:
 
 
 if USE_DEFAULT:
-    settings = DEFAULT_SETTINGS.copy()
+    settings = copy.deepcopy(DEFAULT_SETTINGS)
     SETTINGS_PATH = "FLOWCEPT_DEFAULT_SETTINGS"
 
 else:
@@ -55,12 +56,8 @@ def _get_env_bool(name: str, default=False) -> bool:
     SETTINGS_PATH = os.getenv("FLOWCEPT_SETTINGS_PATH", f"{_SETTINGS_DIR}/settings.yaml")
 
     if not os.path.exists(SETTINGS_PATH):
-        from importlib import resources
-
-        SETTINGS_PATH = str(resources.files("resources").joinpath("sample_settings.yaml"))
-
-        with open(SETTINGS_PATH) as f:
-            settings = OmegaConf.to_container(OmegaConf.load(f), resolve=True)
+        settings = copy.deepcopy(DEFAULT_SETTINGS)
+        SETTINGS_PATH = "FLOWCEPT_DEFAULT_SETTINGS"
     else:
         settings = OmegaConf.to_container(OmegaConf.load(SETTINGS_PATH), resolve=True)
 
@@ -103,6 +100,8 @@ def _get_env_bool(name: str, default=False) -> bool:
 MQ_PORT = int(_get_env("MQ_PORT", settings["mq"].get("port", "6379")))
 MQ_URI = _get_env("MQ_URI", settings["mq"].get("uri", None))
 MQ_GROUP_ID = _get_env("MQ_GROUP_ID", settings["mq"].get("group_id", "auto"))
+MQ_USERNAME = _get_env("MQ_USERNAME", settings["mq"].get("username", "guest"))
+MQ_VHOST = _get_env("MQ_VHOST", settings["mq"].get("vhost", "/"))
 MQ_BUFFER_SIZE = settings["mq"].get("buffer_size", 1)
 MQ_INSERTION_BUFFER_TIME = settings["mq"].get("insertion_buffer_time_secs", 1)
 MQ_TIMING = settings["mq"].get("timing", False)
@@ -277,9 +276,11 @@ def _get_env_bool(name: str, default=False) -> bool:
 AGENT_CHAT_ENABLED = AGENT.get("chat_enabled", True)
 AGENT_CHAT_MAX_TOOL_ITERATIONS = int(AGENT.get("chat_max_tool_iterations", 5))
 AGENT_CHAT_MAX_QUERY_LIMIT = int(AGENT.get("chat_max_query_limit", 1000))
+AGENT_CHAT_MAX_TOOL_RESULT_CHARS = int(AGENT.get("chat_max_tool_result_chars", 4000))
 AGENT_AUDIO = _get_env_bool("AGENT_AUDIO", settings["agent"].get("audio_enabled", "false"))
 AGENT_HOST = _get_env("AGENT_HOST", settings["agent"].get("mcp_host", "localhost"))
 AGENT_PORT = int(_get_env("AGENT_PORT", settings["agent"].get("mcp_port", "8000")))
+AGENT_MODE = _get_env("AGENT_MODE", AGENT.get("agent_mode", "disabled"))
 
 ####################
 # Enabled ADAPTERS #
diff --git a/src/flowcept/flowcept_api/README.md b/src/flowcept/flowcept_api/README.md
index 5e6f2df2..90494b60 100644
--- a/src/flowcept/flowcept_api/README.md
+++ b/src/flowcept/flowcept_api/README.md
@@ -15,9 +15,15 @@ Public Python-facing control and query layer.
 4. `Flowcept.db` queries persisted data through `DBAPI`.
 5. `Flowcept.stop()` flushes buffers and stops runtime resources.
 
+## Object Save vs Query Split
+
+`Flowcept` owns the **write path** for objects: `Flowcept.insert_or_update_object`, `Flowcept.insert_or_update_torch_model`, `Flowcept.insert_or_update_dataset`, and `Flowcept.insert_or_update_ml_model`. These methods persist to the DB **and** emit an object provenance message (including `created_at` / `updated_at` epoch timestamps) to the MQ buffer. They require an active `Flowcept` context and raise loudly if none exists.
+
+`Flowcept.db` (`DBAPI`) is the **query-only** API. Its private `_insert_or_update_*` methods are internal helpers called by the controller; they accept a `BlobObject`, enrich it with timing, and return the same instance — they do not emit MQ messages.
+
 ## Extension Rules
 
 - Keep user-facing orchestration in `Flowcept`; keep direct database operations in `DBAPI`.
 - Do not read environment variables here; use values centralized by `configs.py`.
-- Object persistence should go through `DBAPI`/DAO paths so object metadata messages stay consistent.
+- New object save methods belong on `Flowcept` (controller), not on `DBAPI`. The DB write is delegated to `DBAPI._insert_or_update_object(blob_obj, object, ...)`; the MQ emit goes through `BaseInterceptor.send_object_message`.
 - Tests for this package usually belong in `tests/api/`.
diff --git a/src/flowcept/flowcept_api/db_api.py b/src/flowcept/flowcept_api/db_api.py
index cdf240ef..99156d4b 100644
--- a/src/flowcept/flowcept_api/db_api.py
+++ b/src/flowcept/flowcept_api/db_api.py
@@ -41,37 +41,50 @@ def _to_message_value(value):
             return value
         return str(value)
 
-    def _emit_object_metadata_message(self, object_id):
-        """Emit metadata-only object provenance to the active Flowcept buffer."""
-        try:
-            dao = DBAPI._dao()
-            if hasattr(dao, "get_blob_object_metadata_doc"):
-                doc = dao.get_blob_object_metadata_doc(object_id=object_id)
-            else:
-                doc = self.get_blob_object(object_id=object_id).to_dict()
-            if "data" in doc:
-                doc["storage_type"] = "in_object"
-            elif "grid_fs_file_id" in doc:
-                doc["storage_type"] = "gridfs"
-            msg = DBAPI._to_message_value(doc)
-            msg.pop("_id", None)
-            msg.pop("data", None)
-            msg["type"] = "object"
-            from flowcept.flowcept_api.flowcept_controller import Flowcept
-
-            Flowcept.emit_message(msg)
-        except Exception as e:
-            self.logger.error(f"Could not emit object metadata message for object_id={object_id}: {e}")
-
     @classmethod
     def _dao(cls) -> DocumentDBDAO:
         """Return the configured document DAO singleton."""
         return DocumentDBDAO.get_instance(create_indices=False)
 
+    @classmethod
+    def get_dao_instance(cls) -> DocumentDBDAO:
+        """Return the DAO singleton for internal/advanced operations not on the public API."""
+        return cls._dao()
+
     def close(self):
         """Close DB resources for the active DAO instance."""
         DBAPI._dao().close()
 
+    def liveness_test(self) -> bool:
+        """Return True if the configured document store is reachable."""
+        return DBAPI._dao().liveness_test()
+
+    @staticmethod
+    def db_liveness_tests() -> dict:
+        """Return per-backend liveness results for all enabled document stores.
+
+        Tests each enabled backend independently so that both Mongo and LMDB
+        are checked when both are enabled (unlike ``liveness_test()``, which
+        routes through ``DocumentDBDAO.get_instance()`` and returns one winner).
+
+        Returns
+        -------
+        dict
+            Keys are backend names (``"mongo"``, ``"lmdb"``); values are bool.
+        """
+        from flowcept.configs import LMDB_ENABLED, MONGO_ENABLED
+
+        results = {}
+        if MONGO_ENABLED:
+            from flowcept.commons.daos.docdb_dao.mongodb_dao import MongoDBDAO
+
+            results["mongo"] = MongoDBDAO.get_instance(create_indices=False).liveness_test()
+        if LMDB_ENABLED:
+            from flowcept.commons.daos.docdb_dao.lmdb_dao import LMDBDAO
+
+            results["lmdb"] = LMDBDAO.get_instance().liveness_test()
+        return results
+
     def insert_or_update_task(self, task: TaskObject):
         """Insert or update a task document.
 
@@ -153,6 +166,17 @@ def get_workflow_object(self, workflow_id) -> WorkflowObject:
         else:
             return WorkflowObject.from_dict(wfobs[0])
 
+    def save_workflow_domain_data_schema(self, workflow_id: str, snapshot: Dict) -> bool:
+        """Persist a workflow-scoped dynamic schema snapshot."""
+        return DBAPI._dao().save_workflow_domain_data_schema(workflow_id, {"workflow_domain_data_schema": snapshot})
+
+    def get_workflow_domain_data_schema(self, workflow_id: str) -> Dict | None:
+        """Return the persisted dynamic schema snapshot for a workflow."""
+        workflow_obj = self.get_workflow_object(workflow_id)
+        if workflow_obj is None:
+            return None
+        return workflow_obj.workflow_domain_data_schema
+
     def workflow_query(self, filter) -> List[Dict]:
         """Query the ``workflows`` collection.
 
@@ -636,35 +660,22 @@ def dump_to_file(
             self.logger.exception(e)
             return False
 
-    def save_or_update_object(
+    def _insert_or_update_object(
         self,
+        blob_obj: BlobObject,
         object,
-        object_id=None,
-        task_id=None,
-        workflow_id=None,
-        object_type=None,
-        custom_metadata=None,
         save_data_in_collection=False,
         pickle=False,
         control_version=False,
-        tags=None,
-    ):
-        """Save or update a blob object.
+    ) -> BlobObject:
+        """Persist a blob object and return the enriched BlobObject with timing.
 
         Parameters
         ----------
+        blob_obj : BlobObject
+            Metadata for the object. ``object_id`` is generated when ``None``.
         object : Any
             Blob payload bytes or serializable object.
-        object_id : str, optional
-            Logical object identifier. Generated when omitted.
-        task_id : str, optional
-            Associated task identifier.
-        workflow_id : str, optional
-            Associated workflow identifier. Defaults to current workflow when available.
-        object_type : str, optional
-            User-defined object category.
-        custom_metadata : dict, optional
-            Arbitrary metadata attached to the object.
         save_data_in_collection : bool, optional
             ``True`` stores bytes in-object (``data`` field in ``objects``).
             ``False`` stores payload in GridFS and keeps pointer in metadata.
@@ -672,35 +683,20 @@ def save_or_update_object(
             If ``True``, pickle ``object`` before persistence.
         control_version : bool, optional
             If ``True``, enable append-only history semantics via ``object_history``.
-        tags : list of str, optional
-            Labels to associate with the object.
 
         Returns
         -------
-        str
-            Persisted object identifier.
+        BlobObject
+            The same instance with ``object_id``, ``created_at``, and ``updated_at`` set.
         """
-        if workflow_id is None:
-            try:
-                from flowcept.flowcept_api.flowcept_controller import Flowcept
-
-                workflow_id = Flowcept.current_workflow_id
-            except Exception:
-                workflow_id = None
-        object_id = DBAPI._dao().save_or_update_object(
+        DBAPI._dao().save_or_update_object(
+            blob_obj,
             object,
-            object_id,
-            task_id,
-            workflow_id,
-            object_type,
-            custom_metadata,
             save_data_in_collection=save_data_in_collection,
             pickle_=pickle,
             control_version=control_version,
-            tags=tags,
         )
-        self._emit_object_metadata_message(object_id)
-        return object_id
+        return blob_obj
 
     def update_object_metadata(
         self,
@@ -736,7 +732,7 @@ def update_object_metadata(
         str
             Updated object identifier.
         """
-        updated_object_id = DBAPI._dao().update_object_metadata(
+        return DBAPI._dao().update_object_metadata(
             object_id=object_id,
             custom_metadata=custom_metadata,
             tags=tags,
@@ -745,8 +741,6 @@ def update_object_metadata(
             workflow_id=workflow_id,
             control_version=control_version,
         )
-        self._emit_object_metadata_message(updated_object_id)
-        return updated_object_id
 
     def to_df(self, collection="tasks", filter=None):
         """Query a collection and return a pandas DataFrame.
@@ -804,156 +798,33 @@ def query(
         )
         return result or []
 
-    def save_or_update_ml_model(
-        self,
-        object,
-        object_id=None,
-        task_id=None,
-        workflow_id=None,
-        object_type="ml_model",
-        custom_metadata=None,
-        save_data_in_collection=False,
-        pickle=False,
-        control_version=False,
-        tags=None,
-    ):
-        """Alias to save or update ML model blobs.
-
-        Parameters
-        ----------
-        object : Any
-            Model payload bytes/object.
-        object_id : str, optional
-            Logical object identifier.
-        task_id : str, optional
-            Associated task identifier.
-        workflow_id : str, optional
-            Associated workflow identifier.
-        object_type : str, optional
-            Category label. Defaults to ``"ml_model"``.
-        custom_metadata : dict, optional
-            Custom metadata.
-        save_data_in_collection : bool, optional
-            In-object data storage toggle (``data`` field in ``objects``).
-        pickle : bool, optional
-            Pickle before storage.
-        control_version : bool, optional
-            Enable append-only history semantics.
-        tags : list of str, optional
-            Labels to associate with the object.
-
-        Returns
-        -------
-        str
-            Persisted object identifier.
-        """
-        return self.save_or_update_object(
-            object=object,
-            object_id=object_id,
-            task_id=task_id,
-            workflow_id=workflow_id,
-            object_type=object_type,
-            custom_metadata=custom_metadata,
-            save_data_in_collection=save_data_in_collection,
-            pickle=pickle,
-            control_version=control_version,
-            tags=tags,
-        )
-
-    def save_or_update_dataset(
-        self,
-        object,
-        object_id=None,
-        task_id=None,
-        workflow_id=None,
-        object_type="dataset",
-        custom_metadata=None,
-        save_data_in_collection=False,
-        pickle=False,
-        control_version=False,
-        tags=None,
-    ) -> str:
-        """Alias to save or update dataset blobs.
-
-        Parameters
-        ----------
-        object : Any
-            Dataset payload bytes/object.
-        object_id : str, optional
-            Logical object identifier.
-        task_id : str, optional
-            Associated task identifier.
-        workflow_id : str, optional
-            Associated workflow identifier.
-        object_type : str, optional
-            Category label. Defaults to ``"dataset"``.
-        custom_metadata : dict, optional
-            Custom metadata.
-        save_data_in_collection : bool, optional
-            In-object data storage toggle (``data`` field in ``objects``).
-        pickle : bool, optional
-            Pickle before storage.
-        control_version : bool, optional
-            Enable append-only history semantics.
-        tags : list of str, optional
-            Labels to associate with the object.
-
-        Returns
-        -------
-        str
-            Persisted object identifier.
-        """
-        return self.save_or_update_object(
-            object=object,
-            object_id=object_id,
-            task_id=task_id,
-            workflow_id=workflow_id,
-            object_type=object_type,
-            custom_metadata=custom_metadata,
-            save_data_in_collection=save_data_in_collection,
-            pickle=pickle,
-            control_version=control_version,
-            tags=tags,
-        )
-
-    def save_or_update_torch_model(
+    def _insert_or_update_torch_model(
         self,
         model,
-        object_id=None,
-        task_id=None,
-        workflow_id=None,
-        custom_metadata=None,
+        blob_obj: BlobObject,
         control_version=False,
         save_profile=True,
-        tags=None,
-    ) -> str:
+    ) -> BlobObject:
         """Save a PyTorch model state dictionary as an object blob.
 
         Parameters
         ----------
         model : torch.nn.Module
             PyTorch model whose ``state_dict`` will be persisted.
-        object_id : str, optional
-            Existing object identifier to update.
-        task_id : str, optional
-            Associated task identifier.
-        workflow_id : str, optional
-            Associated workflow identifier.
-        custom_metadata : dict, optional
-            Extra metadata. The model class name is added automatically.
+        blob_obj : BlobObject
+            Metadata for the object. ``object_id`` is generated when ``None``.
+            ``custom_metadata`` is merged with model class name and profile.
         control_version : bool, optional
             Enable append-only history semantics when updating an existing
             logical object id.
         save_profile : bool, optional
             If ``True`` (default), adds ``model_profile`` to
             ``custom_metadata`` using Flowcept PyTorch profiling.
-        tags : list of str, optional
-            Labels to associate with the object.
 
         Returns
         -------
-        str
-            Persisted object identifier.
+        BlobObject
+            The same instance with ``object_id``, ``created_at``, and ``updated_at`` set.
         """
         import torch
         import io
@@ -963,31 +834,22 @@ def save_or_update_torch_model(
         torch.save(state_dict, buffer)
         buffer.seek(0)
         binary_data = buffer.read()
-        if custom_metadata is None:
-            custom_metadata = {}
-        model_profile = {}
+
+        cm = blob_obj.custom_metadata or {}
         if save_profile:
             from flowcept.instrumentation.flowcept_torch import get_torch_model_profile
 
-            model_profile = {"model_profile": get_torch_model_profile(model)}
-        cm = {
-            **custom_metadata,
-            **model_profile,
-            "class": model.__class__.__name__,
-        }
-        obj_id = self.save_or_update_object(
+            cm = {**cm, "model_profile": get_torch_model_profile(model)}
+        cm["class"] = model.__class__.__name__
+        blob_obj.custom_metadata = cm
+        blob_obj.object_type = "ml_model"
+
+        return self._insert_or_update_object(
+            blob_obj=blob_obj,
             object=binary_data,
-            object_id=object_id,
-            object_type="ml_model",
-            task_id=task_id,
-            workflow_id=workflow_id,
-            custom_metadata=cm,
             control_version=control_version,
-            tags=tags,
         )
 
-        return obj_id
-
     def load_torch_model(self, model, object_id: str):
         """Load a stored PyTorch model state dict into a model instance.
 
@@ -1067,3 +929,46 @@ def get_node_positions(self, workflow_id: str, graph_type: str) -> dict:
         if hasattr(dao, "get_node_positions"):
             return dao.get_node_positions(workflow_id, graph_type)
         return {}
+
+    def task_summary(self, filter: Dict) -> Dict:
+        """Summarize tasks: status counts, per-activity stats, and time range."""
+        return DBAPI._dao().task_summary(filter)
+
+    def derive_campaigns(self, campaign_id: str = None) -> List[Dict]:
+        """Derive campaign summaries by grouping workflows and tasks by campaign_id."""
+        return DBAPI._dao().derive_campaigns(campaign_id=campaign_id)
+
+    def derive_agents(self, filter: Dict = None) -> List[Dict]:
+        """Derive agent summaries by joining stored agents with task provenance."""
+        return DBAPI._dao().derive_agents(filter)
+
+    def telemetry_timeseries(
+        self, filter: Dict, fields: List, x_field: str = "started_at", limit: int = 1000
+    ) -> List[Dict]:
+        """Extract plottable rows of dot-notated fields from tasks."""
+        return DBAPI._dao().telemetry_timeseries(filter, fields, x_field=x_field, limit=limit)
+
+    def resolve_chart_data(self, data: Dict, context: Dict = None) -> Dict:
+        """Resolve a declarative chart spec into plottable rows."""
+        return DBAPI._dao().resolve_chart_data(data, context=context)
+
+    def delete_object_keys(self, key_name: str, keys_list: List) -> bool:
+        """Delete object documents matching key_name/keys_list. Raises NotImplementedError if unsupported."""
+        dao = DBAPI._dao()
+        if not hasattr(dao, "delete_object_keys"):
+            raise NotImplementedError("delete_object_keys is not supported by the active DB backend.")
+        return dao.delete_object_keys(key_name, keys_list)
+
+    def delete_workflow_data(self, workflow_id: str) -> dict:
+        """Delete all data for a workflow. Returns empty dict if unsupported."""
+        dao = DBAPI._dao()
+        if not hasattr(dao, "delete_workflow_data"):
+            return {}
+        return dao.delete_workflow_data(workflow_id)
+
+    def delete_campaign_data(self, campaign_id: str) -> dict:
+        """Delete all data for a campaign. Returns empty dict if unsupported."""
+        dao = DBAPI._dao()
+        if not hasattr(dao, "delete_campaign_data"):
+            return {}
+        return dao.delete_campaign_data(campaign_id)
diff --git a/src/flowcept/flowcept_api/flowcept_controller.py b/src/flowcept/flowcept_api/flowcept_controller.py
index b6d8458e..51598b04 100644
--- a/src/flowcept/flowcept_api/flowcept_controller.py
+++ b/src/flowcept/flowcept_api/flowcept_controller.py
@@ -2,7 +2,7 @@
 
 import os
 from pathlib import Path
-from typing import List, Dict, Any
+from typing import List, Dict, Any, Union
 from uuid import uuid4
 
 import flowcept
@@ -13,12 +13,15 @@
     WorkflowObject,
 )
 from flowcept.commons.flowcept_logger import FlowceptLogger
+from time import time
+
 from flowcept.commons.utils import (
     ClassProperty,
     buffer_to_disk,
     resolve_dump_buffer_path,
     generate_pseudo_id,
 )
+from flowcept.commons.vocabulary import Status
 from flowcept.configs import (
     MQ_INSTANCES,
     INSTRUMENTATION_ENABLED,
@@ -43,7 +46,7 @@ class Flowcept(object):
     campaign_id = None
     buffer = None
     is_started = False
-    current_instance = None
+    _current_instance = None
 
     @ClassProperty
     def db(cls):
@@ -54,9 +57,14 @@ def db(cls):
             cls._db = DBAPI()
         return cls._db
 
+    @staticmethod
+    def get_current_instance() -> "Flowcept":
+        """Return the active Flowcept instance, or None if none is running."""
+        return Flowcept._current_instance
+
     def __init__(
         self,
-        interceptors: List[str] = None,
+        interceptors: Union[List[str], str, None] = None,
         bundle_exec_id: str = None,
         campaign_id: str = None,
         workflow_id: str = None,
@@ -82,10 +90,10 @@ def __init__(
 
         Parameters
         ----------
-        interceptors : Union[BaseInterceptor, List[BaseInterceptor], str], optional
+        interceptors : Union[List[str], str, None], optional
             A list of interceptor kinds (or a single interceptor kind) to apply.
             Examples: "instrumentation", "dask", "mlflow", ...
-            The order of interceptors matters — place the outer-most interceptor first,
+            The order of interceptors matters — place the outermost interceptor first,
 
         bundle_exec_id : str, optional
             Identifier for grouping interceptors in a bundle, essential for the correct initialization and stop of
@@ -154,19 +162,21 @@ def __init__(
         self.args = args
         self.kwargs = kwargs
 
-        if interceptors:
-            self._interceptors = interceptors
-            if not isinstance(self._interceptors, list):
-                self._interceptors = [self._interceptors]
-        else:
+        self._interceptors: Union[List[str], None] = None
+        if interceptors is None:
             if not INSTRUMENTATION_ENABLED:
-                self._interceptors = None
                 self.enabled = False
             else:
                 self._interceptors = ["instrumentation"]
+        elif isinstance(interceptors, list):
+            self._interceptors = interceptors
+        else:
+            self._interceptors = [interceptors]
 
         self._interceptor_instances = None
+        self._first_interceptor: BaseInterceptor = None
         self._should_save_workflow = save_workflow
+        self._current_workflow_obj: WorkflowObject = None
         self._workflow_saved = False  # This is to ensure that the wf is saved only once.
         self.current_workflow_id = workflow_id or str(uuid4())
         self.campaign_id = campaign_id or str(uuid4())
@@ -183,30 +193,7 @@ def __init__(
         self.parent_workflow_id = parent_workflow_id
         self.agent_id = agent_id
         self.agent_name = agent_name
-
-        if self.agent_id is not None:
-            from flowcept.commons.flowcept_dataclasses.agent_object import AgentObject
-
-            agent_obj = AgentObject(agent_id=self.agent_id, name=self.agent_name)
-            agent_obj.enrich()
-
-            from flowcept.configs import MONGO_ENABLED, LMDB_ENABLED
-
-            if MONGO_ENABLED:
-                from flowcept.commons.daos.docdb_dao.mongodb_dao import MongoDBDAO
-
-                try:
-                    MongoDBDAO().insert_or_update_agent(agent_obj)
-                except Exception as e:
-                    self.logger.error(f"Error storing agent in MongoDB: {e}")
-
-            if LMDB_ENABLED:
-                from flowcept.commons.daos.docdb_dao.lmdb_dao import LMDBDAO
-
-                try:
-                    LMDBDAO().insert_or_update_agent(agent_obj)
-                except Exception as e:
-                    self.logger.error(f"Error storing agent in LMDB: {e}")
+        self._agent_saved = False
 
         should_delete_buffer_file = (
             flowcept.configs.DELETE_BUFFER_FILE if delete_buffer_file is None else delete_buffer_file
@@ -241,31 +228,27 @@ def start(self) -> "Flowcept":
                 interceptor_inst = BaseInterceptor.build(interceptor)
                 interceptor_inst.start(bundle_exec_id=self.bundle_exec_id, check_safe_stops=self._check_safe_stops)
                 self._interceptor_instances.append(interceptor_inst)
+                if self._first_interceptor is None:
+                    self._first_interceptor = interceptor_inst
                 if isinstance(interceptor_inst._mq_dao.buffer, AutoflushBuffer):
                     Flowcept.buffer = self.buffer = interceptor_inst._mq_dao.buffer.current_buffer
                 else:
                     Flowcept.buffer = self.buffer = interceptor_inst._mq_dao.buffer
 
+                if (self.agent_id is not None or self.agent_name is not None) and not self._agent_saved:
+                    self.agent_id = self.save_agent(name=self.agent_name, agent_id=self.agent_id)
+                    self._agent_saved = True
+
                 if self._should_save_workflow and not self._workflow_saved:
                     self.save_workflow(interceptor, interceptor_inst)
 
         else:
             Flowcept.current_workflow_id = None
-        Flowcept.current_instance = self
+        Flowcept._current_instance = self
         Flowcept.is_started = self.is_started = True
         self.logger.debug("Flowcept started successfully.")
         return self
 
-    @staticmethod
-    def emit_message(message: Dict):
-        """Append a message to the active interceptor buffer."""
-        if Flowcept.current_instance is None:
-            return
-        interceptors = Flowcept.current_instance._interceptor_instances or []
-        if not interceptors:
-            return
-        interceptors[0].intercept(message)
-
     def get_buffer(self, return_df: bool = False):
         """
         Retrieve the in-memory message buffer.
@@ -469,13 +452,262 @@ def save_agent(
             workflow_id=workflow_id or self.current_workflow_id,
             campaign_id=campaign_id or self.campaign_id,
         )
-
-        interceptors = self._interceptor_instances or []
-        if not interceptors:
+        if not self._first_interceptor:
             raise Exception("No active interceptors are initialized or registered on this Flowcept instance.")
-        interceptors[0].send_agent_message(agent_obj)
+        self._first_interceptor.send_agent_message(agent_obj)
         return agent_obj.agent_id
 
+    @staticmethod
+    def _get_interceptor():
+        """Return the active interceptor for object/model message emission.
+
+        Tries the current Flowcept instance first; falls back to InstrumentationInterceptor
+        (needed when called from a Dask worker where no Flowcept context is registered).
+        Raises RuntimeError when neither is available.
+        """
+        fc = Flowcept.get_current_instance()
+        if fc is not None and fc._first_interceptor:
+            return fc._first_interceptor
+        from flowcept.flowceptor.adapters.instrumentation_interceptor import InstrumentationInterceptor
+
+        interceptor = InstrumentationInterceptor.get_instance()
+        if interceptor is None or not interceptor.started:
+            raise RuntimeError(
+                "No active Flowcept context or InstrumentationInterceptor found. "
+                "Ensure Flowcept is started before calling this method."
+            )
+        return interceptor
+
+    @staticmethod
+    def insert_or_update_object(
+        object,
+        object_id=None,
+        task_id=None,
+        workflow_id=None,
+        object_type=None,
+        custom_metadata=None,
+        save_data_in_collection=False,
+        pickle=False,
+        control_version=False,
+        tags=None,
+    ) -> str:
+        """Persist a blob object and emit its metadata to the active MQ buffer.
+
+        Parameters
+        ----------
+        object : Any
+            Blob payload bytes or serializable object.
+        object_id : str, optional
+            Logical object identifier. Generated when omitted.
+        task_id : str, optional
+            Associated task identifier.
+        workflow_id : str, optional
+            Associated workflow identifier. Defaults to current workflow when available.
+        object_type : str, optional
+            User-defined object category.
+        custom_metadata : dict, optional
+            Arbitrary metadata attached to the object.
+        save_data_in_collection : bool, optional
+            ``True`` stores bytes in-object; ``False`` stores in GridFS.
+        pickle : bool, optional
+            If ``True``, pickle ``object`` before persistence.
+        control_version : bool, optional
+            If ``True``, enable append-only history semantics.
+        tags : list of str, optional
+            Labels to associate with the object.
+
+        Returns
+        -------
+        str
+            Persisted object identifier.
+        """
+        from flowcept.flowcept_api.db_api import DBAPI
+        from flowcept.commons.flowcept_dataclasses.blob_object import BlobObject
+
+        interceptor = Flowcept._get_interceptor()
+        wf_id = workflow_id or Flowcept.current_workflow_id
+        blob_obj = BlobObject(
+            object_id=object_id,
+            task_id=task_id,
+            workflow_id=wf_id,
+            object_type=object_type,
+            custom_metadata=custom_metadata,
+            tags=tags,
+        )
+        blob_obj = DBAPI()._insert_or_update_object(
+            blob_obj=blob_obj,
+            object=object,
+            save_data_in_collection=save_data_in_collection,
+            pickle=pickle,
+            control_version=control_version,
+        )
+        interceptor.send_object_message(blob_obj)
+        return blob_obj.object_id
+
+    @staticmethod
+    def insert_or_update_ml_model(
+        object,
+        object_id=None,
+        task_id=None,
+        workflow_id=None,
+        custom_metadata=None,
+        save_data_in_collection=False,
+        pickle=False,
+        control_version=False,
+        tags=None,
+    ) -> str:
+        """Persist an ML model blob and emit its metadata to the active MQ buffer.
+
+        Parameters
+        ----------
+        object : Any
+            Model payload bytes or serializable object.
+        object_id : str, optional
+            Logical object identifier.
+        task_id : str, optional
+            Associated task identifier.
+        workflow_id : str, optional
+            Associated workflow identifier.
+        custom_metadata : dict, optional
+            Arbitrary metadata attached to the object.
+        save_data_in_collection : bool, optional
+            ``True`` stores bytes in-object; ``False`` stores in GridFS.
+        pickle : bool, optional
+            If ``True``, pickle ``object`` before persistence.
+        control_version : bool, optional
+            Enable append-only history semantics.
+        tags : list of str, optional
+            Labels to associate with the object.
+
+        Returns
+        -------
+        str
+            Persisted object identifier.
+        """
+        return Flowcept.insert_or_update_object(
+            object=object,
+            object_id=object_id,
+            task_id=task_id,
+            workflow_id=workflow_id,
+            object_type="ml_model",
+            custom_metadata=custom_metadata,
+            save_data_in_collection=save_data_in_collection,
+            pickle=pickle,
+            control_version=control_version,
+            tags=tags,
+        )
+
+    @staticmethod
+    def insert_or_update_dataset(
+        object,
+        object_id=None,
+        task_id=None,
+        workflow_id=None,
+        custom_metadata=None,
+        save_data_in_collection=False,
+        pickle=False,
+        control_version=False,
+        tags=None,
+    ) -> str:
+        """Persist a dataset blob and emit its metadata to the active MQ buffer.
+
+        Parameters
+        ----------
+        object : Any
+            Dataset payload bytes or serializable object.
+        object_id : str, optional
+            Logical object identifier.
+        task_id : str, optional
+            Associated task identifier.
+        workflow_id : str, optional
+            Associated workflow identifier.
+        custom_metadata : dict, optional
+            Arbitrary metadata attached to the object.
+        save_data_in_collection : bool, optional
+            ``True`` stores bytes in-object; ``False`` stores in GridFS.
+        pickle : bool, optional
+            If ``True``, pickle ``object`` before persistence.
+        control_version : bool, optional
+            Enable append-only history semantics.
+        tags : list of str, optional
+            Labels to associate with the object.
+
+        Returns
+        -------
+        str
+            Persisted object identifier.
+        """
+        return Flowcept.insert_or_update_object(
+            object=object,
+            object_id=object_id,
+            task_id=task_id,
+            workflow_id=workflow_id,
+            object_type="dataset",
+            custom_metadata=custom_metadata,
+            save_data_in_collection=save_data_in_collection,
+            pickle=pickle,
+            control_version=control_version,
+            tags=tags,
+        )
+
+    @staticmethod
+    def insert_or_update_torch_model(
+        model,
+        object_id=None,
+        task_id=None,
+        workflow_id=None,
+        custom_metadata=None,
+        control_version=False,
+        save_profile=True,
+        tags=None,
+    ) -> str:
+        """Persist a PyTorch model state dictionary and emit its metadata to the active MQ buffer.
+
+        Parameters
+        ----------
+        model : torch.nn.Module
+            PyTorch model whose ``state_dict`` will be persisted.
+        object_id : str, optional
+            Existing object identifier to update.
+        task_id : str, optional
+            Associated task identifier.
+        workflow_id : str, optional
+            Associated workflow identifier.
+        custom_metadata : dict, optional
+            Extra metadata. The model class name is added automatically.
+        control_version : bool, optional
+            Enable append-only history semantics.
+        save_profile : bool, optional
+            If ``True`` (default), adds ``model_profile`` to ``custom_metadata``.
+        tags : list of str, optional
+            Labels to associate with the object.
+
+        Returns
+        -------
+        str
+            Persisted object identifier.
+        """
+        from flowcept.flowcept_api.db_api import DBAPI
+        from flowcept.commons.flowcept_dataclasses.blob_object import BlobObject
+
+        interceptor = Flowcept._get_interceptor()
+        wf_id = workflow_id or Flowcept.current_workflow_id
+        blob_obj = BlobObject(
+            object_id=object_id,
+            task_id=task_id,
+            workflow_id=wf_id,
+            custom_metadata=custom_metadata,
+            tags=tags,
+        )
+        blob_obj = DBAPI()._insert_or_update_torch_model(
+            model=model,
+            blob_obj=blob_obj,
+            control_version=control_version,
+            save_profile=save_profile,
+        )
+        interceptor.send_object_message(blob_obj)
+        return blob_obj.object_id
+
     @staticmethod
     def generate_report(
         report_type: str = "workflow_card",
@@ -504,7 +736,8 @@ def generate_report(
         output_path : str, optional
             Destination path for the generated report file.
         input_jsonl_path : str, optional
-            Path to a Flowcept JSONL buffer file used as report input.
+            Path to a Flowcept JSONL buffer file used as report input. If no
+            input mode is provided, the configured default buffer file is used.
         records : list of dict, optional
             In-memory workflow/task/object records used as report input.
         workflow_id : str, optional
@@ -661,35 +894,40 @@ def save_workflow(self, interceptor: str, interceptor_instance: BaseInterceptor)
         -------
         None
         """
-        wf_obj = WorkflowObject()
-        wf_obj.workflow_id = Flowcept.current_workflow_id
-        wf_obj.campaign_id = Flowcept.campaign_id
-        wf_obj.parent_workflow_id = self.parent_workflow_id
-        wf_obj.agent_id = self.agent_id
+        self._current_workflow_obj = WorkflowObject()
+        self._current_workflow_obj.workflow_id = Flowcept.current_workflow_id
+        self._current_workflow_obj.started_at = time()
+        self._current_workflow_obj.status = Status.RUNNING
+        self._current_workflow_obj.campaign_id = Flowcept.campaign_id
+        self._current_workflow_obj.parent_workflow_id = self.parent_workflow_id
+        self._current_workflow_obj.agent_id = self.agent_id
         if self.workflow_name:
-            wf_obj.name = self.workflow_name
+            self._current_workflow_obj.name = self.workflow_name
         if self.workflow_description:
-            wf_obj.workflow_description = self.workflow_description
+            self._current_workflow_obj.workflow_description = self.workflow_description
         if self.workflow_subtype:
-            wf_obj.subtype = self.workflow_subtype
+            self._current_workflow_obj.subtype = self.workflow_subtype
         if self.workflow_args:
-            wf_obj.used = self.workflow_args
+            self._current_workflow_obj.used = self.workflow_args
 
         if interceptor == "dask":
             dask_client = self.kwargs.get("dask_client", None)
             if dask_client:
                 from flowcept.flowceptor.adapters.dask.dask_plugins import set_workflow_info_on_workers
 
-                wf_obj.adapter_id = "dask"
+                self._current_workflow_obj.adapter_id = "dask"
                 scheduler_info = dict(dask_client.scheduler_info())
-                wf_obj.custom_metadata = {"n_workers": len(scheduler_info["workers"]), "scheduler": scheduler_info}
-                set_workflow_info_on_workers(dask_client, wf_obj)
+                self._current_workflow_obj.custom_metadata = {
+                    "n_workers": len(scheduler_info["workers"]),
+                    "scheduler": scheduler_info,
+                }
+                set_workflow_info_on_workers(dask_client, self._current_workflow_obj)
             else:
                 raise Exception("You must provide the argument `dask_client` so we can correctly link the workflow.")
 
         if KVDB_ENABLED:
             interceptor_instance._mq_dao.set_campaign_id(Flowcept.campaign_id)
-        interceptor_instance.send_workflow_message(wf_obj)
+        interceptor_instance.send_workflow_message(self._current_workflow_obj)
         self._workflow_saved = True
 
     def _init_persistence(self, mq_host=None, mq_port=None):
@@ -708,6 +946,15 @@ def stop(self):
             self.logger.warning("Flowcept is already stopped or may never have been started!")
             return
 
+        if (
+            self._should_save_workflow
+            and self._first_interceptor is not None
+            and self._current_workflow_obj is not None
+        ):
+            self._current_workflow_obj.ended_at = time()
+            self._current_workflow_obj.status = Status.FINISHED
+            self._first_interceptor.intercept(self._current_workflow_obj.to_dict())
+
         if self._interceptors and len(self._interceptor_instances):
             for interceptor in self._interceptor_instances:
                 if interceptor is None:
@@ -730,7 +977,7 @@ def stop(self):
             pass
 
         Flowcept.buffer = self.buffer = None
-        Flowcept.current_instance = None
+        Flowcept._current_instance = None
         Flowcept.is_started = self.is_started = False
         self.logger.debug("All stopped!")
 
@@ -744,51 +991,62 @@ def __exit__(self, exc_type, exc_val, exc_tb):
         self.stop()
 
     @staticmethod
-    def services_alive() -> bool:
-        """
-        Checks the liveness of the MQ (Message Queue) and, if enabled, the MongoDB service.
+    def services_status() -> Dict[str, str]:
+        """Return per-service liveness as ``{service: "ok" | "unavailable"}``.
 
-        Returns
-        -------
-        bool
-            True if all services (MQ and optionally MongoDB) are alive, False otherwise.
-
-        Notes
-        -----
-        - The method tests the liveness of the MQ service using `MQDao`.
-        - If `MONGO_ENABLED` is True, it also checks the liveness of the MongoDB service
-          using `MongoDBDAO`.
-        - Logs errors if any service is not ready, and logs success when both services are operational.
-
-        Examples
-        --------
-        >>> is_alive = services_alive()
-        >>> if is_alive:
-        ...     print("All services are running.")
-        ... else:
-        ...     print("One or more services are not ready.")
+        Which services are checked is driven entirely by settings.yaml / env vars:
+        ``mq.enabled``, ``kv_db.enabled``, ``databases.mongodb.enabled``,
+        ``databases.lmdb.enabled``, and ``agent.chat_enabled`` with a valid API key.
         """
         logger = FlowceptLogger()
+        result: Dict[str, str] = {}
         mq = MQDao.build()
+
         if MQ_ENABLED:
-            if not mq.liveness_test():
-                logger.error("MQ Not Ready!")
-                return False
+            up = mq.liveness_test()
+            result["mq"] = "ok" if up else "unavailable"
+            if not up:
+                logger.error("MQ not ready!")
 
         if KVDB_ENABLED:
-            if not mq._keyvalue_dao.liveness_test():
-                logger.error("KVBD is enabled but is not ready!")
-                return False
-
-        logger.info("MQ is alive!")
-        if MONGO_ENABLED:
-            from flowcept.commons.daos.docdb_dao.mongodb_dao import MongoDBDAO
-
-            if not MongoDBDAO(create_indices=False).liveness_test():
-                logger.error("MongoDB is enabled but DocDB is not Ready!")
-                return False
-            logger.info("DocDB is alive!")
-        return True
+            up = mq._keyvalue_dao.liveness_test()
+            result["kvdb"] = "ok" if up else "unavailable"
+            if not up:
+                logger.error("KVDB is enabled but not ready!")
+
+        if MONGO_ENABLED or LMDB_ENABLED:
+            from flowcept.flowcept_api.db_api import DBAPI
+
+            for backend, up in DBAPI.db_liveness_tests().items():
+                result[backend] = "ok" if up else "unavailable"
+                if up:
+                    logger.info(f"{backend} is alive!")
+                else:
+                    logger.error(f"{backend} is enabled but not ready!")
+
+        from flowcept.configs import AGENT, AGENT_CHAT_ENABLED
+
+        if AGENT_CHAT_ENABLED:
+            api_key = AGENT.get("api_key", "")
+            provider = AGENT.get("service_provider", "")
+            bad = {"", "?", "your-api-key-here"}
+            if api_key not in bad and provider not in bad:
+                try:
+                    from flowcept.agents.llm.builders import build_llm_model
+
+                    build_llm_model(track_tools=False).invoke("ping")
+                    result["llm"] = "ok"
+                    logger.info("LLM provider is alive!")
+                except Exception as exc:
+                    result["llm"] = "unavailable"
+                    logger.error(f"LLM provider not reachable: {exc}")
+
+        return result
+
+    @staticmethod
+    def services_alive() -> bool:
+        """Return True when all enabled services are reachable (or none are enabled)."""
+        return all(v == "ok" for v in Flowcept.services_status().values())
 
     @staticmethod
     def start_consumption_services(bundle_exec_id: str = None, check_safe_stops: bool = False, consumers: List = None):
diff --git a/src/flowcept/flowceptor/adapters/base_interceptor.py b/src/flowcept/flowceptor/adapters/base_interceptor.py
index ff8c94ab..59c7b0fc 100644
--- a/src/flowcept/flowceptor/adapters/base_interceptor.py
+++ b/src/flowcept/flowceptor/adapters/base_interceptor.py
@@ -8,6 +8,7 @@
     WorkflowObject,
 )
 from flowcept.commons.flowcept_dataclasses.agent_object import AgentObject
+from flowcept.commons.flowcept_dataclasses.blob_object import BlobObject
 from flowcept.configs import (
     ENRICH_MESSAGES,
     TELEMETRY_ENABLED,
@@ -164,6 +165,14 @@ def send_agent_message(self, agent_obj: AgentObject):
         self.intercept(agent_obj.to_dict())
         return agent_id
 
+    def send_object_message(self, blob_obj: BlobObject):
+        """Send object metadata message to the MQ buffer."""
+        if not self._mq_dao.started:
+            raise Exception(f"This interceptor {id(self)} has never been started!")
+        msg = blob_obj.to_dict()
+        msg["type"] = "object"
+        self.intercept(msg)
+
     def intercept(self, obj_msg: Dict):
         """Intercept a message."""
         self._mq_dao.buffer.append(obj_msg)
diff --git a/src/flowcept/flowceptor/consumers/agent/base_agent_context_manager.py b/src/flowcept/flowceptor/consumers/agent/base_agent_context_manager.py
index ef95b610..fc0db15e 100644
--- a/src/flowcept/flowceptor/consumers/agent/base_agent_context_manager.py
+++ b/src/flowcept/flowceptor/consumers/agent/base_agent_context_manager.py
@@ -1,3 +1,4 @@
+import threading
 from contextlib import asynccontextmanager
 from dataclasses import dataclass
 from typing import Dict, List
@@ -34,6 +35,10 @@ class BaseAgentContextManager(BaseConsumer):
     """
     Base class for any MCP Agent that wants to participate in the Flowcept ecosystem.
 
+    With ``stateless_http=True`` (FastMCP), the lifespan runs once per HTTP request.
+    A class-level lock prevents concurrent requests from racing to stop the shared
+    Flowcept instance when multiple tool calls execute simultaneously.
+
     Agents inheriting from this class can:
     - Subscribe to and consume messages from the Flowcept-compatible message queue (MQ)
     - Handle task-related messages and accumulate them in context
@@ -47,6 +52,7 @@ class BaseAgentContextManager(BaseConsumer):
     """
 
     agent_id = None
+    _stop_lock = threading.Lock()
 
     def __init__(self, allow_mq_disabled: bool = False):
         """
@@ -131,7 +137,14 @@ async def lifespan(self, app):
         try:
             yield self.context
         finally:
-            self.stop_consumption()
-            if getattr(self, "flowcept_instance", None) is not None:
-                self.flowcept_instance.stop()
-                self.flowcept_instance = None
+            try:
+                self.stop_consumption()
+            except Exception as e:
+                self.logger.warning(f"stop_consumption raised during lifespan teardown: {e}")
+            with BaseAgentContextManager._stop_lock:
+                if getattr(self, "flowcept_instance", None) is not None:
+                    try:
+                        self.flowcept_instance.stop()
+                    except Exception as e:
+                        self.logger.warning(f"flowcept_instance.stop() raised during lifespan teardown: {e}")
+                    self.flowcept_instance = None
diff --git a/src/flowcept/instrumentation/flowcept_agent_task.py b/src/flowcept/instrumentation/flowcept_agent_task.py
index 45bd940c..345a7b87 100644
--- a/src/flowcept/instrumentation/flowcept_agent_task.py
+++ b/src/flowcept/instrumentation/flowcept_agent_task.py
@@ -12,8 +12,8 @@
 
 from flowcept.commons.flowcept_dataclasses.task_object import TaskObject
 from flowcept.commons.flowcept_logger import FlowceptLogger
-from flowcept.commons.utils import replace_non_serializable
-from flowcept.commons.vocabulary import Status
+from flowcept.commons.utils import replace_non_serializable, sanitize_json_like
+from flowcept.commons.vocabulary import PROV_AGENT, Status
 from flowcept.configs import (
     INSTRUMENTATION_ENABLED,
     REPLACE_NON_JSON_SERIALIZABLE,
@@ -60,9 +60,11 @@ def wrapper(*args, **kwargs):
             args_handler = decorator_kwargs.get("args_handler", default_args_handler)
             custom_metadata = decorator_kwargs.get("custom_metadata", None)
             tags = decorator_kwargs.get("tags", None)
+            capture_telemetry = decorator_kwargs.get("capture_telemetry", None)
+            task_should_capture_telemetry = TELEMETRY_ENABLED if capture_telemetry is None else capture_telemetry
 
             task_obj = TaskObject()
-            task_obj.subtype = decorator_kwargs.get("subtype", "agent_task")
+            task_obj.subtype = decorator_kwargs.get("subtype", PROV_AGENT.AGENT_TOOL)
             task_obj.activity_id = func.__name__
             handled_args = args_handler(*args, **kwargs)
             task_obj.workflow_id = handled_args.pop("workflow_id", Flowcept.current_workflow_id)
@@ -73,7 +75,7 @@ def wrapper(*args, **kwargs):
             task_obj.custom_metadata = custom_metadata or {}
             task_obj.task_id = str(task_obj.started_at)
             _thread_local._flowcept_current_context_task = task_obj
-            if TELEMETRY_ENABLED:
+            if task_should_capture_telemetry:
                 task_obj.telemetry_at_start = interceptor.telemetry_capture.capture()
             task_obj.agent_id = BaseAgentContextManager.agent_id
 
@@ -87,7 +89,7 @@ def wrapper(*args, **kwargs):
                 task_obj.stderr = str(e)
             task_obj.ended_at = time()
 
-            if TELEMETRY_ENABLED:
+            if task_should_capture_telemetry:
                 task_obj.telemetry_at_end = interceptor.telemetry_capture.capture()
             try:
                 if result is not None:
@@ -98,7 +100,12 @@ def wrapper(*args, **kwargs):
             except Exception as e:
                 logger.exception(e)
 
-            interceptor.intercept(task_obj.to_dict())
+            if interceptor._mq_dao.buffer is None:
+                logger.debug(
+                    f"Instrumentation buffer not ready for {task_obj.activity_id}; skipping provenance capture."
+                )
+            else:
+                interceptor.intercept(task_obj.to_dict())
             return result
 
         return wrapper
@@ -128,20 +135,32 @@ def _extract_llm_metadata(llm: LLM) -> Dict:
     dict
         Dictionary containing class name, module, model name, and configuration if available.
     """
+    config = llm.model_dump() if hasattr(llm, "model_dump") else llm.dict() if hasattr(llm, "dict") else {}
     llm_metadata = {
         "class_name": llm.__class__.__name__,
         "module": llm.__class__.__module__,
-        "config": llm.dict() if hasattr(llm, "dict") else {},
+        "config": sanitize_json_like(replace_non_serializable(config), drop_sensitive_keys=True),
     }
     return llm_metadata
 
 
-def extract_llm_usage(response: Any, fallback_model: str | None = None) -> Dict[str, Any]:
+def _estimate_tokens_from_text(text: str | None) -> int | None:
+    if text is None:
+        return None
+    return max(1, round(len(text) / 4)) if text else 0
+
+
+def extract_llm_usage(
+    response: Any,
+    fallback_model: str | None = None,
+    input_text: str | None = None,
+    output_text: str | None = None,
+) -> Dict[str, Any]:
     """Normalize provider-specific token metadata from an LLM response."""
     usage = {}
     usage.update(getattr(response, "usage_metadata", {}) or {})
 
-    response_metadata = getattr(response, "response_metadata", {}) or {}
+    response_metadata = sanitize_json_like(replace_non_serializable(getattr(response, "response_metadata", {}) or {}))
     token_usage = response_metadata.get("token_usage") or response_metadata.get("usage") or {}
 
     input_tokens = usage.get("input_tokens") or token_usage.get("prompt_tokens") or token_usage.get("input_tokens")
@@ -149,15 +168,41 @@ def extract_llm_usage(response: Any, fallback_model: str | None = None) -> Dict[
         usage.get("output_tokens") or token_usage.get("completion_tokens") or token_usage.get("output_tokens")
     )
     total_tokens = usage.get("total_tokens") or token_usage.get("total_tokens")
+    provider_reported_tokens = input_tokens is not None or output_tokens is not None or total_tokens is not None
+    if input_tokens is None:
+        input_tokens = _estimate_tokens_from_text(input_text)
+    if output_tokens is None:
+        output_tokens = _estimate_tokens_from_text(output_text)
     if total_tokens is None and input_tokens is not None and output_tokens is not None:
         total_tokens = input_tokens + output_tokens
-
-    return {
-        "llm_model": response_metadata.get("model_name") or response_metadata.get("model") or fallback_model,
-        "llm_input_tokens": input_tokens,
-        "llm_output_tokens": output_tokens,
-        "llm_total_tokens": total_tokens,
+    token_count_source = "provider" if provider_reported_tokens else "estimated_from_chars"
+
+    model = response_metadata.get("model_name") or response_metadata.get("model") or fallback_model
+    finish_reason = response_metadata.get("finish_reason")
+    provider_request_id = response_metadata.get("id") or response_metadata.get("request_id")
+    normalized = {
+        "model": model,
+        "input_tokens": input_tokens,
+        "output_tokens": output_tokens,
+        "total_tokens": total_tokens,
+        "input_chars": len(input_text) if input_text is not None else None,
+        "output_chars": len(output_text) if output_text is not None else None,
+        "finish_reason": finish_reason,
+        "provider_request_id": provider_request_id,
+        "provider_response_metadata": response_metadata,
+        "token_count_source": token_count_source,
     }
+    normalized.update(
+        {
+            "llm_model": model,
+            "llm_input_tokens": input_tokens,
+            "llm_output_tokens": output_tokens,
+            "llm_total_tokens": total_tokens,
+            "llm_input_chars": normalized["input_chars"],
+            "llm_output_chars": normalized["output_chars"],
+        }
+    )
+    return normalized
 
 
 class FlowceptLLM(Runnable):
@@ -273,23 +318,29 @@ def _our_call(self, messages, **kwargs):
         used = {"prompt": messages_str}
         with FlowceptTask(
             used=used,
-            subtype="llm_task",
+            subtype=PROV_AGENT.AI_MODEL_INVOCATION,
             custom_metadata=self.metadata,
             agent_id=self.agent_id,
             activity_id="llm_interaction",
             campaign_id=self.campaign_id,
             workflow_id=self.worflow_id,
             parent_task_id=self.parent_task_id,
+            capture_telemetry=False,
         ) as task:
             response = self.llm.invoke(messages, **kwargs)
             response_str = response.content if hasattr(response, "content") else str(response)
-            usage = extract_llm_usage(response, fallback_model=self.metadata.get("config", {}).get("model"))
+            usage = extract_llm_usage(
+                response,
+                fallback_model=self.metadata.get("config", {}).get("model"),
+                input_text=messages_str,
+                output_text=response_str,
+            )
             generated = {"response": response_str}
 
             if hasattr(response, "usage_metadata"):
-                task._task.custom_metadata["usage_metadata"] = response.usage_metadata
+                task._task.custom_metadata["usage_metadata"] = replace_non_serializable(response.usage_metadata)
             if hasattr(response, "response_metadata"):
-                task._task.custom_metadata["response_metadata"] = response.response_metadata
+                task._task.custom_metadata["response_metadata"] = replace_non_serializable(response.response_metadata)
             task._task.custom_metadata["llm_usage"] = usage
 
             task.end(generated=generated)
@@ -316,10 +367,18 @@ def __call__(self, *args, **kwargs):
         return self.invoke(*args, **kwargs)
 
     @staticmethod
-    def _format_messages(messages: Union[str, List[Dict[str, str]]]) -> str:
+    def _format_messages(messages) -> str:
         if isinstance(messages, str):
             return messages
-        elif isinstance(messages, list):
-            return "\n".join(f"{m.get('role', '').capitalize()}: {m.get('content', '')}" for m in messages)
-        else:
+        if not isinstance(messages, list):
             raise ValueError(f"Invalid message format: {messages}")
+        parts = []
+        for m in messages:
+            if isinstance(m, dict):
+                parts.append(f"{m.get('role', '').capitalize()}: {m.get('content', '')}")
+            elif hasattr(m, "content"):
+                role = getattr(m, "type", m.__class__.__name__)
+                parts.append(f"{role}: {m.content}")
+            else:
+                parts.append(str(m))
+        return "\n".join(parts)
diff --git a/src/flowcept/instrumentation/flowcept_task.py b/src/flowcept/instrumentation/flowcept_task.py
index ff31dd2a..e9dab210 100644
--- a/src/flowcept/instrumentation/flowcept_task.py
+++ b/src/flowcept/instrumentation/flowcept_task.py
@@ -138,6 +138,8 @@ def decorator(func):
         decorator_kwargs.get("agent_name", None)
         source_agent_id = decorator_kwargs.get("source_agent_id", None)
         decorator_kwargs.get("source_agent_name", None)
+        capture_telemetry = decorator_kwargs.get("capture_telemetry", None)
+        task_should_capture_telemetry = TELEMETRY_ENABLED if capture_telemetry is None else capture_telemetry
 
         # --- shared helpers for sync+async wrappers -------------------------
 
@@ -178,7 +180,7 @@ def _common_prep(*f_args, **f_kwargs):
             task_obj.task_id = str(task_obj.started_at)
             _thread_local._flowcept_current_context_task_id = task_obj.task_id
 
-            if TELEMETRY_ENABLED:
+            if task_should_capture_telemetry:
                 # capture telemetry at start
                 task_obj.telemetry_at_start = interceptor.telemetry_capture.capture()
 
@@ -246,7 +248,7 @@ def _common_post(task_obj, result, raised_exc):
 
             task_obj.ended_at = time()
 
-            if TELEMETRY_ENABLED:
+            if task_should_capture_telemetry:
                 # capture telemetry at end
                 task_obj.telemetry_at_end = interceptor.telemetry_capture.capture()
 
diff --git a/src/flowcept/instrumentation/task_capture.py b/src/flowcept/instrumentation/task_capture.py
index 324437cb..bfdf021b 100644
--- a/src/flowcept/instrumentation/task_capture.py
+++ b/src/flowcept/instrumentation/task_capture.py
@@ -60,6 +60,7 @@ def __init__(
         stdout: str = None,
         stderr: str = None,
         status: Status = None,
+        capture_telemetry: bool | None = None,
     ):
         """
         Initializes a FlowceptTask and optionally finalizes it.
@@ -99,6 +100,8 @@ def __init__(
             Captured standard error from the task.
         status : Status, optional
             Task completion status. If provided, defaults to Status.FINISHED if unspecified.
+        capture_telemetry : bool, optional
+            Per-task telemetry override. ``None`` follows the global telemetry setting.
         """
         if not INSTRUMENTATION_ENABLED:
             self._ended = True
@@ -106,8 +109,9 @@ def __init__(
 
         self._task = TaskObject()
         self._interceptor = InstrumentationInterceptor.get_instance()
+        self._capture_telemetry = TELEMETRY_ENABLED if capture_telemetry is None else capture_telemetry
 
-        if TELEMETRY_ENABLED:
+        if self._capture_telemetry:
             tel = self._interceptor.telemetry_capture.capture()
             self._task.telemetry_at_start = tel
 
@@ -241,7 +245,7 @@ def end(
         """
         if not INSTRUMENTATION_ENABLED:
             return
-        if TELEMETRY_ENABLED:
+        if self._capture_telemetry:
             tel = self._interceptor.telemetry_capture.capture()
             self._task.telemetry_at_end = tel
         if data:
diff --git a/src/flowcept/report/loaders.py b/src/flowcept/report/loaders.py
index 2f45b3e8..7c5ff69f 100644
--- a/src/flowcept/report/loaders.py
+++ b/src/flowcept/report/loaders.py
@@ -6,7 +6,7 @@
 from pathlib import Path
 from typing import Any, Dict, List, Tuple
 
-from flowcept.commons.sanitization import sanitize_json_like
+from flowcept.commons.utils import sanitize_json_like
 
 
 def read_jsonl(path: Path) -> Tuple[List[Dict[str, Any]], int]:
diff --git a/src/flowcept/report/renderers/workflow_card_markdown.py b/src/flowcept/report/renderers/workflow_card_markdown.py
index 18b70360..c7419112 100644
--- a/src/flowcept/report/renderers/workflow_card_markdown.py
+++ b/src/flowcept/report/renderers/workflow_card_markdown.py
@@ -13,7 +13,7 @@
 
 from flowcept import __version__
 from flowcept.report.aggregations import as_float, elapsed_seconds, fmt_timestamp_utc
-from flowcept.commons.sanitization import sanitize_json_like
+from flowcept.commons.utils import sanitize_json_like
 
 
 def render_markdown_file_into_rich_terminal(markdown_path: str | Path, *, stream=None) -> None:
diff --git a/src/flowcept/report/service.py b/src/flowcept/report/service.py
index fe6ead33..fb85a356 100644
--- a/src/flowcept/report/service.py
+++ b/src/flowcept/report/service.py
@@ -6,6 +6,7 @@
 from pathlib import Path
 from typing import Any, Dict, List
 
+import flowcept.configs as flowcept_configs
 from flowcept.report.aggregations import group_activities, group_transformations, summarize_objects
 from flowcept.report.loaders import load_records_from_db, read_jsonl, split_records
 from flowcept.report.renderers.campaign_workflow_card_markdown import render_campaign_workflow_card_markdown
@@ -30,6 +31,8 @@ def _resolve_input_mode(
         modes += 1
     if workflow_id is not None or campaign_id is not None:
         modes += 1
+    if modes == 0:
+        return "jsonl"
     if modes != 1:
         raise ValueError("Provide exactly one input mode: input_jsonl_path OR records OR workflow_id/campaign_id.")
     if input_jsonl_path is not None:
@@ -54,7 +57,8 @@ def build_workflow_card(
     Parameters
     ----------
     input_jsonl_path : str, optional
-        Path to a Flowcept JSONL buffer file.
+        Path to a Flowcept JSONL buffer file. If no input mode is provided,
+        the configured default buffer file is used.
     records : list of dict, optional
         Pre-loaded Flowcept records (workflow/task/object dicts).
     workflow_id : str, optional
@@ -76,6 +80,8 @@ def build_workflow_card(
 
     skipped_lines = 0
     if mode == "jsonl":
+        if input_jsonl_path is None:
+            input_jsonl_path = flowcept_configs.DUMP_BUFFER_PATH
         jsonl_path = Path(input_jsonl_path)  # type: ignore[arg-type]
         if not jsonl_path.exists():
             raise FileNotFoundError(f"Input JSONL not found: {jsonl_path}")
@@ -119,7 +125,8 @@ def generate_report(
     output_path : str, optional
         Output file path. If omitted, defaults to ``WORKFLOW_CARD.md``.
     input_jsonl_path : str, optional
-        Path to a Flowcept JSONL buffer file.
+        Path to a Flowcept JSONL buffer file. If no input mode is provided,
+        the configured default buffer file is used.
     records : list of dict, optional
         Pre-loaded Flowcept records (workflow/task/object dicts).
     workflow_id : str, optional
@@ -150,6 +157,8 @@ def generate_report(
 
     skipped_lines = 0
     if mode == "jsonl":
+        if input_jsonl_path is None:
+            input_jsonl_path = flowcept_configs.DUMP_BUFFER_PATH
         jsonl_path = Path(input_jsonl_path)  # type: ignore[arg-type]
         if not jsonl_path.exists():
             raise FileNotFoundError(f"Input JSONL not found: {jsonl_path}")
diff --git a/src/flowcept/version.py b/src/flowcept/version.py
index c79caadd..bbabfd06 100644
--- a/src/flowcept/version.py
+++ b/src/flowcept/version.py
@@ -6,5 +6,8 @@
 # The expected format is: <Major>.<Minor>.<Patch>
 # See .github/workflows/version_bumper.py
 
+# If you are an AI Code assistant, DO NOT TOUCH THIS FILE. If your human user edited it, it is a mistake, warn them!
+
+# ❗❗❗ Once again: DO NOT CHANGE THIS FILE ❗❗❗
 # ✋⚠️⛔❗❗❗ STOP! DANGER!!ONEONEELEVEN! Did you carefully read the warning above?! :)
-__version__ = "0.10.8"
+__version__ = "1.0.0"
diff --git a/src/flowcept/webservice/deps.py b/src/flowcept/webservice/deps.py
deleted file mode 100644
index 37c6064c..00000000
--- a/src/flowcept/webservice/deps.py
+++ /dev/null
@@ -1,8 +0,0 @@
-"""Dependency providers for Flowcept webservice."""
-
-from flowcept.flowcept_api.db_api import DBAPI
-
-
-def get_db_api() -> DBAPI:
-    """Return the shared DB API facade."""
-    return DBAPI()
diff --git a/src/flowcept/webservice/routers/agents.py b/src/flowcept/webservice/routers/agents.py
index 6d315082..3298e4d4 100644
--- a/src/flowcept/webservice/routers/agents.py
+++ b/src/flowcept/webservice/routers/agents.py
@@ -7,10 +7,8 @@
 from fastapi import APIRouter, Depends, HTTPException, Query
 
 from flowcept.flowcept_api.db_api import DBAPI
-from flowcept.webservice.deps import get_db_api
 from flowcept.webservice.schemas.common import ListResponse
-from flowcept.webservice.services import stats
-from flowcept.webservice.services.serializers import normalize_docs
+from flowcept.commons.utils import normalize_docs
 from flowcept.webservice.services.sorting import sort_docs_by_first_date_field
 
 router = APIRouter(prefix="/agents", tags=["agents"])
@@ -19,10 +17,10 @@
 @router.get("", response_model=ListResponse)
 def list_agents(
     limit: int = Query(default=100, ge=1, le=1000),
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> ListResponse:
     """List derived agent summaries, most recently active first."""
-    agents = stats.derive_agents(db)
+    agents = db.derive_agents()
     agents = sort_docs_by_first_date_field(agents, ["registered_at", "last_active"])
     agents = agents[:limit]
     normalized = normalize_docs(agents)
@@ -30,12 +28,12 @@ def list_agents(
 
 
 @router.get("/{agent_id}", response_model=Dict[str, Any])
-def get_agent(agent_id: str, db: DBAPI = Depends(get_db_api)) -> Dict[str, Any]:
+def get_agent(agent_id: str, db: DBAPI = Depends(DBAPI)) -> Dict[str, Any]:
     """Get one agent's derived summary and per-activity task summary."""
-    agents = [a for a in stats.derive_agents(db) if a["agent_id"] == agent_id]
+    agents = [a for a in db.derive_agents() if a["agent_id"] == agent_id]
     if not agents:
         raise HTTPException(status_code=404, detail=f"Agent not found: {agent_id}")
-    task_summary = stats.task_summary(db, {"agent_id": agent_id})
+    task_summary = db.task_summary({"agent_id": agent_id})
     return {
         "agent": normalize_docs(agents)[0],
         "task_summary": normalize_docs([task_summary])[0],
@@ -46,7 +44,7 @@ def get_agent(agent_id: str, db: DBAPI = Depends(get_db_api)) -> Dict[str, Any]:
 def get_agent_tasks(
     agent_id: str,
     limit: int = Query(default=100, ge=1, le=1000),
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> ListResponse:
     """List tasks executed by or sent from an agent."""
     docs = (
@@ -65,7 +63,7 @@ def get_agent_tasks(
 
 
 @router.delete("/cleanup/empty", response_model=Dict[str, Any])
-def delete_empty_agents(db: DBAPI = Depends(get_db_api)) -> Dict[str, Any]:
+def delete_empty_agents(db: DBAPI = Depends(DBAPI)) -> Dict[str, Any]:
     """Delete all agents from the database that don't have associated task_id."""
     stored_agents = db.agent_query(filter={}) or []
     deleted_count = 0
diff --git a/src/flowcept/webservice/routers/campaigns.py b/src/flowcept/webservice/routers/campaigns.py
index f21ac549..896f289d 100644
--- a/src/flowcept/webservice/routers/campaigns.py
+++ b/src/flowcept/webservice/routers/campaigns.py
@@ -9,11 +9,9 @@
 from fastapi.responses import Response
 
 from flowcept.flowcept_api.db_api import DBAPI
-from flowcept.webservice.deps import get_db_api
 from flowcept.webservice.schemas.common import ListResponse
-from flowcept.webservice.services import stats
 from flowcept.webservice.services.reports import workflow_card_response
-from flowcept.webservice.services.serializers import normalize_docs
+from flowcept.commons.utils import normalize_docs
 from flowcept.webservice.services.sorting import sort_docs_by_first_date_field
 
 router = APIRouter(prefix="/campaigns", tags=["campaigns"])
@@ -22,10 +20,10 @@
 @router.get("", response_model=ListResponse)
 def list_campaigns(
     limit: int = Query(default=100, ge=1, le=1000),
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> ListResponse:
     """List derived campaign summaries, most recently active first."""
-    campaigns = stats.derive_campaigns(db)
+    campaigns = db.derive_campaigns()
     campaigns = sort_docs_by_first_date_field(campaigns, ["last_ts", "first_ts"])
     campaigns = campaigns[:limit]
     normalized = normalize_docs(campaigns)
@@ -33,10 +31,10 @@ def list_campaigns(
 
 
 @router.get("/{campaign_id}", response_model=Dict[str, Any])
-def get_campaign(campaign_id: str, db: DBAPI = Depends(get_db_api)) -> Dict[str, Any]:
+def get_campaign(campaign_id: str, db: DBAPI = Depends(DBAPI)) -> Dict[str, Any]:
     """Get one campaign: derived summary, its workflows, and a task summary."""
     workflows = db.workflow_query(filter={"campaign_id": campaign_id}) or []
-    task_summary = stats.task_summary(db, {"campaign_id": campaign_id})
+    task_summary = db.task_summary({"campaign_id": campaign_id})
     if not workflows and task_summary["count"] == 0:
         raise HTTPException(status_code=404, detail=f"Campaign not found: {campaign_id}")
 
@@ -45,7 +43,7 @@ def get_campaign(campaign_id: str, db: DBAPI = Depends(get_db_api)) -> Dict[str,
         ["utc_timestamp", "created_at", "updated_at", "timestamp", "started_at", "ended_at"],
     )
     summary = next(
-        (c for c in stats.derive_campaigns(db) if c["campaign_id"] == campaign_id),
+        (c for c in db.derive_campaigns() if c["campaign_id"] == campaign_id),
         {"campaign_id": campaign_id},
     )
     return {
@@ -56,12 +54,12 @@ def get_campaign(campaign_id: str, db: DBAPI = Depends(get_db_api)) -> Dict[str,
 
 
 @router.delete("/{campaign_id}", response_model=Dict[str, Any])
-def delete_campaign(campaign_id: str, db: DBAPI = Depends(get_db_api)) -> Dict[str, Any]:
+def delete_campaign(campaign_id: str, db: DBAPI = Depends(DBAPI)) -> Dict[str, Any]:
     """Recursively delete a campaign and all its workflows, tasks, and objects."""
     workflows = db.workflow_query(filter={"campaign_id": campaign_id}) or []
     if not workflows:
         raise HTTPException(status_code=404, detail=f"Campaign not found: {campaign_id}")
-    counts = DBAPI._dao().delete_campaign_data(campaign_id)
+    counts = db.delete_campaign_data(campaign_id)
     return {"deleted": counts}
 
 
@@ -69,7 +67,7 @@ def delete_campaign(campaign_id: str, db: DBAPI = Depends(get_db_api)) -> Dict[s
 def get_campaign_workflow_card(
     campaign_id: str,
     format: str = Query(default="json"),
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> Response:
     """Get a campaign workflow card as structured JSON or rendered markdown."""
     workflows = db.workflow_query(filter={"campaign_id": campaign_id}) or []
diff --git a/src/flowcept/webservice/routers/chat.py b/src/flowcept/webservice/routers/chat.py
index 3e687ab8..d656e888 100644
--- a/src/flowcept/webservice/routers/chat.py
+++ b/src/flowcept/webservice/routers/chat.py
@@ -11,7 +11,7 @@
 
 from flowcept.commons.flowcept_logger import FlowceptLogger
 from flowcept.configs import AGENT, AGENT_CHAT_ENABLED
-from flowcept.webservice.services.chat_service import run_chat
+from flowcept.agents.chat_orchestration.chat_orchestrator_service import run_chat
 
 router = APIRouter(prefix="/chat", tags=["chat"])
 
@@ -30,6 +30,7 @@ class ChatRequest(BaseModel):
     context: Optional[Dict[str, Any]] = None
     stream: bool = True
     allow_dashboard_edit: bool = False
+    thread_id: Optional[str] = None
 
 
 def get_chat_llm():
@@ -52,7 +53,7 @@ def get_chat_llm():
             ),
         )
     try:
-        from flowcept.agents.agents_utils import build_llm_model
+        from flowcept.agents.llm.builders import build_llm_model
 
         return build_llm_model(track_tools=False)
     except HTTPException:
@@ -84,6 +85,7 @@ def chat(payload: ChatRequest):
         messages=messages,
         context=payload.context,
         allow_dashboard_edit=payload.allow_dashboard_edit,
+        thread_id=payload.thread_id,
     )
 
     if payload.stream:
diff --git a/src/flowcept/webservice/routers/dashboards.py b/src/flowcept/webservice/routers/dashboards.py
index b7aa205a..06aa9c86 100644
--- a/src/flowcept/webservice/routers/dashboards.py
+++ b/src/flowcept/webservice/routers/dashboards.py
@@ -11,11 +11,20 @@
 from flowcept.webservice.routers.query import _validate_filter_shape
 from flowcept.webservice.schemas.common import ListResponse
 from flowcept.webservice.schemas.dashboards import DashboardConfig
-from flowcept.webservice.services.dashboard_store import get_dashboard_store
+from flowcept.flowcept_api.db_api import DBAPI
 
 router = APIRouter(prefix="/dashboards", tags=["dashboards"])
 
 
+def get_dashboard_store():
+    """FastAPI dependency: return the DAO instance for dashboard CRUD."""
+    return DBAPI.get_dao_instance()
+
+
+def _list_by_type(store, dashboard_type: str) -> List[Dict[str, Any]]:
+    return store.list_dashboards(filter={"dashboard_type": dashboard_type}) or []
+
+
 def _now() -> str:
     return datetime.now(timezone.utc).isoformat()
 
@@ -44,11 +53,11 @@ def resolve_dashboard(
     ``campaign_id``.
     """
     if workflow_name:
-        common = store.list_by_type("common_workflow")
-        custom = [c for c in store.list_by_type("custom_workflow") if c.get("target") == workflow_name]
+        common = _list_by_type(store, "common_workflow")
+        custom = [c for c in _list_by_type(store, "custom_workflow") if c.get("target") == workflow_name]
     elif campaign_id:
-        common = store.list_by_type("common_campaign")
-        custom = [c for c in store.list_by_type("custom_campaign") if c.get("target") == campaign_id]
+        common = _list_by_type(store, "common_campaign")
+        custom = [c for c in _list_by_type(store, "custom_campaign") if c.get("target") == campaign_id]
     else:
         raise HTTPException(status_code=400, detail="Provide workflow_name or campaign_id.")
 
@@ -65,9 +74,9 @@ def list_dashboards(
 ) -> ListResponse:
     """List all dashboard configs, optionally filtered by ``dashboard_type``."""
     if dashboard_type:
-        items = store.list_by_type(dashboard_type)
+        items = _list_by_type(store, dashboard_type)
     else:
-        items = store.list()
+        items = store.list_dashboards()
     return ListResponse(items=items, count=len(items), limit=0)
 
 
@@ -78,7 +87,7 @@ def create_dashboard(config: DashboardConfig, store=Depends(get_dashboard_store)
     config.dashboard_id = str(uuid4())
     config.created_at = config.updated_at = _now()
     doc = config.model_dump()
-    if not store.save(doc):
+    if not store.save_dashboard(doc):
         raise HTTPException(status_code=500, detail="Could not save dashboard config.")
     return doc
 
@@ -86,7 +95,7 @@ def create_dashboard(config: DashboardConfig, store=Depends(get_dashboard_store)
 @router.get("/{dashboard_id}", response_model=Dict[str, Any])
 def get_dashboard(dashboard_id: str, store=Depends(get_dashboard_store)) -> Dict[str, Any]:
     """Get a dashboard config by id."""
-    doc = store.get(dashboard_id)
+    doc = store.get_dashboard(dashboard_id)
     if doc is None:
         raise HTTPException(status_code=404, detail=f"Dashboard not found: {dashboard_id}")
     return doc
@@ -95,7 +104,7 @@ def get_dashboard(dashboard_id: str, store=Depends(get_dashboard_store)) -> Dict
 @router.put("/{dashboard_id}", response_model=Dict[str, Any])
 def update_dashboard(dashboard_id: str, config: DashboardConfig, store=Depends(get_dashboard_store)) -> Dict[str, Any]:
     """Replace a dashboard config, preserving its id and creation time."""
-    existing = store.get(dashboard_id)
+    existing = store.get_dashboard(dashboard_id)
     if existing is None:
         raise HTTPException(status_code=404, detail=f"Dashboard not found: {dashboard_id}")
     _validate_config_filters(config)
@@ -103,7 +112,7 @@ def update_dashboard(dashboard_id: str, config: DashboardConfig, store=Depends(g
     config.created_at = existing.get("created_at")
     config.updated_at = _now()
     doc = config.model_dump()
-    if not store.save(doc):
+    if not store.save_dashboard(doc):
         raise HTTPException(status_code=500, detail="Could not save dashboard config.")
     return doc
 
@@ -111,6 +120,6 @@ def update_dashboard(dashboard_id: str, config: DashboardConfig, store=Depends(g
 @router.delete("/{dashboard_id}", response_model=Dict[str, Any])
 def delete_dashboard(dashboard_id: str, store=Depends(get_dashboard_store)) -> Dict[str, Any]:
     """Delete a dashboard config by id."""
-    if not store.delete(dashboard_id):
+    if not store.delete_dashboard(dashboard_id):
         raise HTTPException(status_code=404, detail=f"Dashboard not found: {dashboard_id}")
     return {"deleted": dashboard_id}
diff --git a/src/flowcept/webservice/routers/datasets.py b/src/flowcept/webservice/routers/datasets.py
index 7e7963d1..eaa67b37 100644
--- a/src/flowcept/webservice/routers/datasets.py
+++ b/src/flowcept/webservice/routers/datasets.py
@@ -7,9 +7,8 @@
 from fastapi.responses import Response
 
 from flowcept.flowcept_api.db_api import DBAPI
-from flowcept.webservice.deps import get_db_api
 from flowcept.webservice.schemas.common import ListResponse, ObjectQueryRequest
-from flowcept.webservice.services.serializers import normalize_docs
+from flowcept.commons.utils import normalize_docs
 
 router = APIRouter(prefix="/datasets", tags=["datasets"])
 
@@ -45,7 +44,7 @@ def list_datasets(
     object_id: str | None = None,
     filter_json: str | None = None,
     include_data: bool = False,
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> ListResponse:
     """List dataset objects with optional filters."""
     query_filter = _json_filter(filter_json)
@@ -67,7 +66,7 @@ def get_dataset(
     object_id: str,
     version: int | None = None,
     include_data: bool = False,
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ):
     """Get dataset object metadata by id and optional version."""
     try:
@@ -86,7 +85,7 @@ def get_dataset_version(
     object_id: str,
     version: int,
     include_data: bool = False,
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ):
     """Get a specific dataset object version."""
     return get_dataset(object_id=object_id, version=version, include_data=include_data, db=db)
@@ -96,7 +95,7 @@ def get_dataset_version(
 def download_dataset(
     object_id: str,
     version: int | None = None,
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ):
     """Download dataset payload as a binary attachment."""
     try:
@@ -118,7 +117,7 @@ def download_dataset(
 
 
 @router.post("/query", response_model=ListResponse)
-def query_datasets(payload: ObjectQueryRequest, db: DBAPI = Depends(get_db_api)):
+def query_datasets(payload: ObjectQueryRequest, db: DBAPI = Depends(DBAPI)):
     """Run an advanced read-only query for dataset objects."""
     query_filter = dict(payload.filter)
     query_filter["object_type"] = "dataset"
diff --git a/src/flowcept/webservice/routers/health.py b/src/flowcept/webservice/routers/health.py
index b1785cf7..6c440952 100644
--- a/src/flowcept/webservice/routers/health.py
+++ b/src/flowcept/webservice/routers/health.py
@@ -1,6 +1,7 @@
 """Health endpoints."""
 
 from fastapi import APIRouter
+from fastapi.responses import JSONResponse
 
 from flowcept.version import __version__
 
@@ -10,14 +11,27 @@
 
 @router.get("/live")
 def live() -> dict:
-    """Liveness check."""
+    """Liveness check — process is running."""
     return {"status": "ok"}
 
 
 @router.get("/ready")
-def ready() -> dict:
-    """Readiness check."""
-    return {"status": "ready"}
+def ready() -> JSONResponse:
+    """Readiness check — verifies all enabled services via ``Flowcept.services_alive()``.
+
+    Which services are checked is driven by settings.yaml (MQ, KVDB, MongoDB, LMDB, LLM).
+    Returns HTTP 200 when all enabled services are reachable, HTTP 503 otherwise.
+    The response body includes per-service status so callers can identify which
+    service is down without reading server logs.
+    """
+    from flowcept.flowcept_api.flowcept_controller import Flowcept
+
+    services = Flowcept.services_status()
+    ok = all(v == "ok" for v in services.values())
+    return JSONResponse(
+        status_code=200 if ok else 503,
+        content={"status": "ready" if ok else "degraded", "services": services},
+    )
 
 
 @info_router.get("/info")
diff --git a/src/flowcept/webservice/routers/models.py b/src/flowcept/webservice/routers/models.py
index f9cd4dcf..e1463845 100644
--- a/src/flowcept/webservice/routers/models.py
+++ b/src/flowcept/webservice/routers/models.py
@@ -7,9 +7,8 @@
 from fastapi.responses import Response
 
 from flowcept.flowcept_api.db_api import DBAPI
-from flowcept.webservice.deps import get_db_api
 from flowcept.webservice.schemas.common import ListResponse, ObjectQueryRequest
-from flowcept.webservice.services.serializers import normalize_docs
+from flowcept.commons.utils import normalize_docs
 
 router = APIRouter(prefix="/models", tags=["models"])
 
@@ -45,7 +44,7 @@ def list_models(
     object_id: str | None = None,
     filter_json: str | None = None,
     include_data: bool = False,
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> ListResponse:
     """List ML model objects with optional filters."""
     query_filter = _json_filter(filter_json)
@@ -67,7 +66,7 @@ def get_model(
     object_id: str,
     version: int | None = None,
     include_data: bool = False,
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ):
     """Get ML model object metadata by id and optional version."""
     try:
@@ -86,7 +85,7 @@ def get_model_version(
     object_id: str,
     version: int,
     include_data: bool = False,
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ):
     """Get a specific ML model object version."""
     return get_model(object_id=object_id, version=version, include_data=include_data, db=db)
@@ -96,7 +95,7 @@ def get_model_version(
 def download_model(
     object_id: str,
     version: int | None = None,
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ):
     """Download ML model payload as a binary attachment."""
     try:
@@ -118,7 +117,7 @@ def download_model(
 
 
 @router.post("/query", response_model=ListResponse)
-def query_models(payload: ObjectQueryRequest, db: DBAPI = Depends(get_db_api)):
+def query_models(payload: ObjectQueryRequest, db: DBAPI = Depends(DBAPI)):
     """Run an advanced read-only query for ML model objects."""
     query_filter = dict(payload.filter)
     query_filter["object_type"] = "ml_model"
diff --git a/src/flowcept/webservice/routers/objects.py b/src/flowcept/webservice/routers/objects.py
index f7752d6d..852b0777 100644
--- a/src/flowcept/webservice/routers/objects.py
+++ b/src/flowcept/webservice/routers/objects.py
@@ -7,9 +7,8 @@
 from fastapi.responses import Response
 
 from flowcept.flowcept_api.db_api import DBAPI
-from flowcept.webservice.deps import get_db_api
 from flowcept.webservice.schemas.common import ListResponse, ObjectQueryRequest
-from flowcept.webservice.services.serializers import normalize_docs
+from flowcept.commons.utils import normalize_docs
 from flowcept.webservice.services.sorting import sort_docs_by_first_date_field
 
 router = APIRouter(prefix="/objects", tags=["objects"])
@@ -47,7 +46,7 @@ def list_objects(
     object_type: str | None = None,
     filter_json: str | None = None,
     include_data: bool = False,
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> ListResponse:
     """List objects with optional basic filters."""
     query_filter = _json_filter(filter_json)
@@ -68,7 +67,7 @@ def list_objects(
 
 
 @router.get("/{object_id}", response_model=Dict[str, Any])
-def get_object(object_id: str, include_data: bool = False, db: DBAPI = Depends(get_db_api)) -> Dict[str, Any]:
+def get_object(object_id: str, include_data: bool = False, db: DBAPI = Depends(DBAPI)) -> Dict[str, Any]:
     """Get latest version of an object by id."""
     try:
         obj = db.get_blob_object(object_id=object_id)
@@ -87,7 +86,7 @@ def get_object_version(
     object_id: str,
     version: int,
     include_data: bool = False,
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> Dict[str, Any]:
     """Get a specific object version by id and version number."""
     try:
@@ -106,7 +105,7 @@ def get_object_version(
 def download_object(
     object_id: str,
     version: int | None = None,
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> Response:
     """Download object payload as binary."""
     try:
@@ -130,7 +129,7 @@ def download_object(
 def download_object_version(
     object_id: str,
     version: int,
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> Response:
     """Download a specific object payload version as binary."""
     return download_object(object_id=object_id, version=version, db=db)
@@ -140,7 +139,7 @@ def download_object_version(
 def get_object_history(
     object_id: str,
     limit: int = Query(default=100, ge=1, le=1000),
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> ListResponse:
     """Get object metadata history (latest-first)."""
     try:
@@ -154,19 +153,19 @@ def get_object_history(
 
 
 @router.delete("/{object_id}", response_model=Dict[str, Any])
-def delete_object(object_id: str, db: DBAPI = Depends(get_db_api)) -> Dict[str, Any]:
+def delete_object(object_id: str, db: DBAPI = Depends(DBAPI)) -> Dict[str, Any]:
     """Delete an object and all its versions by object_id."""
-    dao = DBAPI._dao()
-    if not hasattr(dao, "delete_object_keys"):
+    try:
+        deleted = db.delete_object_keys("object_id", [object_id])
+    except NotImplementedError:
         raise HTTPException(status_code=501, detail="Delete not supported by this DB backend.")
-    deleted = dao.delete_object_keys("object_id", [object_id])
     if not deleted:
         raise HTTPException(status_code=404, detail=f"Object not found or could not be deleted: {object_id}")
     return {"deleted": True, "object_id": object_id}
 
 
 @router.post("/query", response_model=ListResponse)
-def query_objects(payload: ObjectQueryRequest, db: DBAPI = Depends(get_db_api)) -> ListResponse:
+def query_objects(payload: ObjectQueryRequest, db: DBAPI = Depends(DBAPI)) -> ListResponse:
     """Run an advanced read-only object query."""
     docs = db.query(
         collection="objects",
diff --git a/src/flowcept/webservice/routers/query.py b/src/flowcept/webservice/routers/query.py
index 9e6fd750..2c9c9657 100644
--- a/src/flowcept/webservice/routers/query.py
+++ b/src/flowcept/webservice/routers/query.py
@@ -7,9 +7,8 @@
 from fastapi import APIRouter, Depends, HTTPException
 
 from flowcept.flowcept_api.db_api import DBAPI
-from flowcept.webservice.deps import get_db_api
 from flowcept.webservice.schemas.common import ListResponse, ObjectQueryRequest
-from flowcept.webservice.services.serializers import normalize_docs
+from flowcept.commons.utils import normalize_docs
 
 router = APIRouter(prefix="/query", tags=["query"])
 
@@ -109,7 +108,7 @@ def _apply_shaping(docs: List[Dict[str, Any]], payload: ObjectQueryRequest) -> L
 
 
 @router.post("/{scope}", response_model=ListResponse)
-def query_scope(scope: QueryScope, payload: ObjectQueryRequest, db: DBAPI = Depends(get_db_api)) -> ListResponse:
+def query_scope(scope: QueryScope, payload: ObjectQueryRequest, db: DBAPI = Depends(DBAPI)) -> ListResponse:
     """Run a read-only advanced query over a constrained collection scope."""
     _validate_filter_shape(payload.filter)
     collection, base_filter, include_data_supported = _get_scope_metadata(scope)
diff --git a/src/flowcept/webservice/routers/stats.py b/src/flowcept/webservice/routers/stats.py
index f95e7b98..720b9076 100644
--- a/src/flowcept/webservice/routers/stats.py
+++ b/src/flowcept/webservice/routers/stats.py
@@ -9,11 +9,9 @@
 from pydantic import BaseModel, Field
 
 from flowcept.flowcept_api.db_api import DBAPI
-from flowcept.webservice.deps import get_db_api
 from flowcept.webservice.routers.query import _validate_filter_shape
 from flowcept.webservice.schemas.dashboards import ChartData
-from flowcept.webservice.services import stats
-from flowcept.webservice.services.serializers import normalize_docs
+from flowcept.commons.utils import normalize_docs
 
 router = APIRouter(prefix="/stats", tags=["stats"])
 
@@ -52,7 +50,7 @@ def get_task_summary(
     campaign_id: Optional[str] = None,
     agent_id: Optional[str] = None,
     filter_json: Optional[str] = None,
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> Dict[str, Any]:
     """Summarize tasks (status counts, per-activity durations, time range)."""
     query_filter = _json_filter(filter_json)
@@ -60,15 +58,14 @@ def get_task_summary(
         if value is not None:
             query_filter[key] = value
     _validate_filter_shape(query_filter)
-    return normalize_docs([stats.task_summary(db, query_filter)])[0]
+    return normalize_docs([db.task_summary(query_filter)])[0]
 
 
 @router.post("/timeseries", response_model=Dict[str, Any])
-def post_timeseries(payload: TimeseriesRequest, db: DBAPI = Depends(get_db_api)) -> Dict[str, Any]:
+def post_timeseries(payload: TimeseriesRequest, db: DBAPI = Depends(DBAPI)) -> Dict[str, Any]:
     """Extract plottable rows of dot-notated fields from tasks."""
     _validate_filter_shape(payload.filter)
-    rows = stats.telemetry_timeseries(
-        db,
+    rows = db.telemetry_timeseries(
         filter=payload.filter,
         fields=payload.fields,
         x_field=payload.x,
@@ -79,11 +76,11 @@ def post_timeseries(payload: TimeseriesRequest, db: DBAPI = Depends(get_db_api))
 
 
 @router.post("/chart_data", response_model=Dict[str, Any])
-def post_chart_data(payload: ChartDataRequest, db: DBAPI = Depends(get_db_api)) -> Dict[str, Any]:
+def post_chart_data(payload: ChartDataRequest, db: DBAPI = Depends(DBAPI)) -> Dict[str, Any]:
     """Resolve a declarative dashboard chart data binding into rows."""
     _validate_filter_shape(payload.data.filter)
     if payload.context:
         _validate_filter_shape(payload.context)
-    result = stats.resolve_chart_data(db, payload.data, context=payload.context)
+    result = db.resolve_chart_data(payload.data.model_dump(), context=payload.context)
     result["rows"] = normalize_docs(result["rows"])
     return result
diff --git a/src/flowcept/webservice/routers/stream.py b/src/flowcept/webservice/routers/stream.py
index 5db9b8a7..da2a18ac 100644
--- a/src/flowcept/webservice/routers/stream.py
+++ b/src/flowcept/webservice/routers/stream.py
@@ -12,8 +12,7 @@
 
 from flowcept.configs import WEBSERVER_SSE_MAX_BATCH, WEBSERVER_SSE_POLL_INTERVAL
 from flowcept.flowcept_api.db_api import DBAPI
-from flowcept.webservice.deps import get_db_api
-from flowcept.webservice.services.serializers import normalize_docs
+from flowcept.commons.utils import normalize_docs
 from flowcept.webservice.services.streaming import poll_new_docs
 
 router = APIRouter(prefix="/stream", tags=["stream"])
@@ -55,7 +54,7 @@ def stream_tasks(
     agent_id: Optional[str] = None,
     since: Optional[float] = None,
     poll_interval: float = Query(default=WEBSERVER_SSE_POLL_INTERVAL, ge=0.1, le=60.0),
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> EventSourceResponse:
     """Stream new/updated tasks as SSE events, optionally scoped by workflow/campaign/agent."""
     base_filter: Dict[str, Any] = {}
@@ -72,7 +71,7 @@ def stream_workflows(
     campaign_id: Optional[str] = None,
     since: Optional[float] = None,
     poll_interval: float = Query(default=WEBSERVER_SSE_POLL_INTERVAL, ge=0.1, le=60.0),
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> EventSourceResponse:
     """Stream new workflows as SSE events, optionally scoped by campaign."""
     base_filter: Dict[str, Any] = {}
diff --git a/src/flowcept/webservice/routers/tasks.py b/src/flowcept/webservice/routers/tasks.py
index c91cab80..3925e6f2 100644
--- a/src/flowcept/webservice/routers/tasks.py
+++ b/src/flowcept/webservice/routers/tasks.py
@@ -6,9 +6,8 @@
 from fastapi import APIRouter, Depends, HTTPException, Query
 
 from flowcept.flowcept_api.db_api import DBAPI
-from flowcept.webservice.deps import get_db_api
 from flowcept.webservice.schemas.common import ListResponse, QueryRequest
-from flowcept.webservice.services.serializers import normalize_docs
+from flowcept.commons.utils import normalize_docs
 from flowcept.webservice.services.sorting import sort_docs_by_first_date_field
 
 router = APIRouter(prefix="/tasks", tags=["tasks"])
@@ -35,7 +34,7 @@ def list_tasks(
     task_id: str | None = None,
     status: str | None = None,
     filter_json: str | None = None,
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> ListResponse:
     """List tasks with optional basic filters."""
     query_filter = _json_filter(filter_json)
@@ -61,7 +60,7 @@ def list_tasks(
 
 
 @router.get("/{task_id}", response_model=Dict[str, Any])
-def get_task(task_id: str, db: DBAPI = Depends(get_db_api)) -> Dict[str, Any]:
+def get_task(task_id: str, db: DBAPI = Depends(DBAPI)) -> Dict[str, Any]:
     """Get a task by id."""
     docs = db.task_query(filter={"task_id": task_id}, limit=1) or []
     if not docs:
@@ -74,7 +73,7 @@ def get_task(task_id: str, db: DBAPI = Depends(get_db_api)) -> Dict[str, Any]:
 def list_tasks_by_workflow(
     workflow_id: str,
     limit: int = Query(default=100, ge=1, le=1000),
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> ListResponse:
     """List tasks for a workflow."""
     docs = db.task_query(filter={"workflow_id": workflow_id}, limit=0) or []
@@ -88,7 +87,7 @@ def list_tasks_by_workflow(
 
 
 @router.post("/query", response_model=ListResponse)
-def query_tasks(payload: QueryRequest, db: DBAPI = Depends(get_db_api)) -> ListResponse:
+def query_tasks(payload: QueryRequest, db: DBAPI = Depends(DBAPI)) -> ListResponse:
     """Run an advanced read-only task query."""
     if payload.aggregation and payload.projection and len(payload.projection) > 1:
         raise HTTPException(
diff --git a/src/flowcept/webservice/routers/workflows.py b/src/flowcept/webservice/routers/workflows.py
index 61a9a98f..97acc868 100644
--- a/src/flowcept/webservice/routers/workflows.py
+++ b/src/flowcept/webservice/routers/workflows.py
@@ -10,11 +10,10 @@
 
 from flowcept import Flowcept
 from flowcept.flowcept_api.db_api import DBAPI
-from flowcept.webservice.deps import get_db_api
 from flowcept.webservice.schemas.common import ListResponse, QueryRequest
 from flowcept.webservice.services.dataflow import build_dataflow
 from flowcept.webservice.services.reports import workflow_card_response
-from flowcept.webservice.services.serializers import normalize_docs
+from flowcept.commons.utils import normalize_docs
 from flowcept.webservice.services.sorting import sort_docs_by_first_date_field
 
 router = APIRouter(prefix="/workflows", tags=["workflows"])
@@ -40,7 +39,7 @@ def list_workflows(
     parent_workflow_id: str | None = None,
     name: str | None = None,
     filter_json: str | None = None,
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> ListResponse:
     """List workflows with optional basic filters."""
     query_filter = _json_filter(filter_json)
@@ -64,7 +63,7 @@ def list_workflows(
 
 
 @router.get("/{workflow_id}", response_model=Dict[str, Any])
-def get_workflow(workflow_id: str, db: DBAPI = Depends(get_db_api)) -> Dict[str, Any]:
+def get_workflow(workflow_id: str, db: DBAPI = Depends(DBAPI)) -> Dict[str, Any]:
     """Get a workflow by id."""
     doc = db.get_workflow_object(workflow_id)
     if doc is None:
@@ -74,16 +73,16 @@ def get_workflow(workflow_id: str, db: DBAPI = Depends(get_db_api)) -> Dict[str,
 
 
 @router.delete("/{workflow_id}", response_model=Dict[str, Any])
-def delete_workflow(workflow_id: str, db: DBAPI = Depends(get_db_api)) -> Dict[str, Any]:
+def delete_workflow(workflow_id: str, db: DBAPI = Depends(DBAPI)) -> Dict[str, Any]:
     """Recursively delete a workflow and all its tasks and objects."""
     if db.get_workflow_object(workflow_id) is None:
         raise HTTPException(status_code=404, detail=f"Workflow not found: {workflow_id}")
-    counts = DBAPI._dao().delete_workflow_data(workflow_id)
+    counts = db.delete_workflow_data(workflow_id)
     return {"deleted": counts}
 
 
 @router.post("/query", response_model=ListResponse)
-def query_workflows(payload: QueryRequest, db: DBAPI = Depends(get_db_api)) -> ListResponse:
+def query_workflows(payload: QueryRequest, db: DBAPI = Depends(DBAPI)) -> ListResponse:
     """Run an advanced read-only workflows query."""
     sort = None if payload.sort is None else [(s.field, s.order) for s in payload.sort]
     docs = db.query(
@@ -103,7 +102,7 @@ def query_workflows(payload: QueryRequest, db: DBAPI = Depends(get_db_api)) -> L
 @router.get("/{workflow_id}/dataflow", response_model=Dict[str, Any])
 def get_workflow_dataflow(
     workflow_id: str,
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> Dict[str, Any]:
     """Get the PROV-style dataflow graph derived from tasks' used/generated fields."""
     graph = build_dataflow(db, workflow_id)
@@ -116,7 +115,7 @@ def get_workflow_dataflow(
 def get_workflow_card(
     workflow_id: str,
     format: str = Query(default="json"),
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> Response:
     """Get a workflow card as structured JSON or rendered markdown."""
     wf_obj = db.get_workflow_object(workflow_id)
@@ -126,7 +125,7 @@ def get_workflow_card(
 
 
 @router.post("/{workflow_id}/reports/workflow-card/download")
-def download_workflow_card(workflow_id: str, db: DBAPI = Depends(get_db_api)) -> Response:
+def download_workflow_card(workflow_id: str, db: DBAPI = Depends(DBAPI)) -> Response:
     """Generate and download a workflow card markdown file."""
     wf_obj = db.get_workflow_object(workflow_id)
     if wf_obj is None:
@@ -165,7 +164,7 @@ def download_workflow_card(workflow_id: str, db: DBAPI = Depends(get_db_api)) ->
 def get_node_positions(
     workflow_id: str,
     graph_type: str = Query(..., description="Graph type: 'dataflow', 'task', or 'activity'"),
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> Dict[str, Any]:
     """Get node positions for a workflow graph type."""
     if db.get_workflow_object(workflow_id) is None:
@@ -177,7 +176,7 @@ def get_node_positions(
 def save_node_positions(
     workflow_id: str,
     payload: Dict[str, Any],
-    db: DBAPI = Depends(get_db_api),
+    db: DBAPI = Depends(DBAPI),
 ) -> Dict[str, Any]:
     """Save node positions for a workflow graph type."""
     if db.get_workflow_object(workflow_id) is None:
diff --git a/src/flowcept/webservice/schemas/dashboards.py b/src/flowcept/webservice/schemas/dashboards.py
index 6a9d8ef7..2f27fda9 100644
--- a/src/flowcept/webservice/schemas/dashboards.py
+++ b/src/flowcept/webservice/schemas/dashboards.py
@@ -1,13 +1,4 @@
-"""Pydantic schemas for dashboard specs and declarative chart-data bindings.
-
-The spec is deliberately declarative so that LLM tools can reliably generate/modify
-it and the frontend can validate and render it.
-
-Data model:
-- A Dashboard has a type (workflow | campaign) and contains multiple charts.
-- Each chart can have a data binding (ChartData) describing what to query.
-- VizSpec describes how to render the query result (bar, pie, line, ...).
-"""
+"""Pydantic schemas for dashboards: data bindings, chart specs, layout, and config."""
 
 from __future__ import annotations
 
@@ -15,7 +6,12 @@
 
 from pydantic import BaseModel, Field
 
-from flowcept.webservice.schemas.common import SortSpec
+
+class SortSpec(BaseModel):
+    """Sort field/order pair for chart data queries."""
+
+    field: str
+    order: Literal[1, -1] = 1
 
 
 class MetricSpec(BaseModel):
diff --git a/src/flowcept/webservice/services/chat_service.py b/src/flowcept/webservice/services/chat_service.py
deleted file mode 100644
index c67b78f6..00000000
--- a/src/flowcept/webservice/services/chat_service.py
+++ /dev/null
@@ -1,213 +0,0 @@
-"""LLM chat orchestration for the webservice: tool-calling loop over the shared prov tools."""
-
-from __future__ import annotations
-
-import json
-from typing import Any, Dict, Generator, List, Optional
-
-from flowcept.agents.prompts.chat_prompts import CHAT_SYSTEM_PROMPT
-from flowcept.agents.tools import prov_tools
-from flowcept.commons.flowcept_logger import FlowceptLogger
-from flowcept.configs import AGENT_CHAT_MAX_TOOL_ITERATIONS
-
-MAX_TOOL_ITERATIONS = AGENT_CHAT_MAX_TOOL_ITERATIONS
-
-
-def _build_langchain_tools(context: Optional[Dict[str, Any]], allow_dashboard_edit: bool):
-    """Wrap the shared prov tool core as langchain tools (results JSON-encoded for the LLM)."""
-    from langchain_core.tools import tool
-
-    def _run(func, **kwargs) -> str:
-        result = func(**kwargs)
-        payload = result.model_dump() if hasattr(result, "model_dump") else result
-        return json.dumps(payload, default=str)
-
-    def _coerce_projection(p: Any) -> Optional[List[str]]:
-        """Accept a list of field names or a Mongo projection dict {field: 1}."""
-        if p is None:
-            return None
-        if isinstance(p, dict):
-            return [k for k, v in p.items() if v]
-        return list(p)
-
-    def _coerce_sort(s: Any) -> Optional[List[Dict[str, Any]]]:
-        """Accept [{field, order}] or a Mongo sort dict {field: -1}."""
-        if s is None:
-            return None
-        if isinstance(s, dict):
-            return [{"field": k, "order": v} for k, v in s.items()]
-        return list(s)
-
-    @tool
-    def query_tasks(
-        filter: Optional[Dict[str, Any]] = None,
-        projection: Optional[Any] = None,
-        limit: int = 100,
-        sort: Optional[Any] = None,
-    ) -> str:
-        """Query task provenance records with a Mongo-style filter.
-
-        projection: list of field names, or a Mongo projection dict {"field": 1}.
-        sort: list of {"field": "...", "order": 1|-1}, or a Mongo sort dict {"field": -1}.
-        """
-        return _run(
-            prov_tools.query_tasks,
-            filter=filter,
-            projection=_coerce_projection(projection),
-            limit=limit,
-            sort=_coerce_sort(sort),
-        )
-
-    @tool
-    def query_workflows(filter: Optional[Dict[str, Any]] = None, limit: int = 100) -> str:
-        """Query workflow provenance records with a Mongo-style filter."""
-        return _run(prov_tools.query_workflows, filter=filter, limit=limit)
-
-    @tool
-    def get_task_summary(filter: Optional[Dict[str, Any]] = None) -> str:
-        """Summarize tasks: status counts, per-activity durations, and time range."""
-        return _run(prov_tools.get_task_summary, filter=filter)
-
-    @tool
-    def list_campaigns() -> str:
-        """List derived campaign summaries (campaigns group workflows and tasks)."""
-        return _run(prov_tools.list_campaigns)
-
-    @tool
-    def list_agents() -> str:
-        """List derived agent summaries (agents observed in task provenance)."""
-        return _run(prov_tools.list_agents)
-
-    @tool
-    def make_chart(card_spec: Dict[str, Any]) -> str:
-        """Build a chart from a declarative dashboard card spec; the UI renders the result."""
-        return _run(prov_tools.make_chart, card_spec=card_spec, context=context)
-
-    @tool
-    def highlight_lineage(
-        task_ids: Optional[Any] = None,
-        filter: Optional[Dict[str, Any]] = None,
-    ) -> str:
-        """Highlight the full provenance lineage (ancestors + descendants) of tasks in the Dataflow graph.
-
-        Pass `task_ids` as a list of task ID strings, or a single task ID string.
-        Or use `filter` to find the seed tasks first.
-        The UI will dim all other nodes and visually trace the lineage chain.
-        Always pass a workflow_id in the filter when on a workflow page.
-        """
-        wf_id = (context or {}).get("workflow_id")
-        # Coerce a bare string to a list so the LLM can pass either form.
-        ids: Optional[List[str]] = None
-        if task_ids is not None:
-            ids = [task_ids] if isinstance(task_ids, str) else list(task_ids)
-        return _run(prov_tools.highlight_lineage, task_ids=ids, filter=filter, workflow_id=wf_id)
-
-    tools = [query_tasks, query_workflows, get_task_summary, list_campaigns, list_agents, make_chart, highlight_lineage]
-
-    if allow_dashboard_edit:
-
-        @tool
-        def get_dashboard(dashboard_id: str) -> str:
-            """Get a stored dashboard spec by id."""
-            return _run(prov_tools.get_dashboard, dashboard_id=dashboard_id)
-
-        @tool
-        def update_dashboard(dashboard_id: str, spec: Dict[str, Any]) -> str:
-            """Replace a stored dashboard spec with a complete revised spec."""
-            return _run(prov_tools.update_dashboard, dashboard_id=dashboard_id, spec=spec)
-
-        tools += [get_dashboard, update_dashboard]
-    return tools
-
-
-def _build_messages(messages: List[Dict[str, str]], context: Optional[Dict[str, Any]]):
-    from langchain_core.messages import AIMessage, HumanMessage, SystemMessage
-
-    system = CHAT_SYSTEM_PROMPT
-    if context:
-        system += f"\nCurrent user context (scope queries with it): {json.dumps(context)}"
-    lc_messages = [SystemMessage(content=system)]
-    for message in messages:
-        role = message.get("role")
-        content = message.get("content", "")
-        lc_messages.append(AIMessage(content=content) if role == "assistant" else HumanMessage(content=content))
-    return lc_messages
-
-
-def run_chat(
-    llm,
-    messages: List[Dict[str, str]],
-    context: Optional[Dict[str, Any]] = None,
-    allow_dashboard_edit: bool = False,
-) -> Generator[Dict[str, Any], None, None]:
-    """Run one chat turn as a generator of events.
-
-    Yields dict events: ``{"event": "tool_call"|"tool_result"|"card"|"token"|"done"|"error", ...}``.
-    The caller decides whether to stream them (SSE) or collect them into one response.
-
-    Parameters
-    ----------
-    llm : Any
-        A langchain chat model (from ``build_llm_model``).
-    messages : list of dict
-        Conversation history, ``[{"role": "user"|"assistant", "content": "..."}]``.
-    context : dict, optional
-        UI context (e.g., ``{"workflow_id": ...}``) injected into the system prompt and charts.
-    allow_dashboard_edit : bool, optional
-        Whether dashboard-modifying tools are bound.
-    """
-    logger = FlowceptLogger()
-    tools = _build_langchain_tools(context, allow_dashboard_edit)
-    tools_by_name = {t.name: t for t in tools}
-    lc_messages = _build_messages(messages, context)
-
-    try:
-        bound = llm.bind_tools(tools)
-    except (NotImplementedError, AttributeError):
-        logger.warning("Chat LLM does not support tool binding; answering without tools.")
-        bound = None
-
-    try:
-        if bound is None:
-            response = llm.invoke(lc_messages)
-            yield {"event": "token", "data": getattr(response, "content", str(response))}
-            yield {"event": "done"}
-            return
-
-        for _ in range(MAX_TOOL_ITERATIONS):
-            ai_message = bound.invoke(lc_messages)
-            tool_calls = getattr(ai_message, "tool_calls", None) or []
-            if not tool_calls:
-                yield {"event": "token", "data": ai_message.content}
-                yield {"event": "done"}
-                return
-
-            lc_messages.append(ai_message)
-            from langchain_core.messages import ToolMessage
-
-            for call in tool_calls:
-                name = call["name"]
-                args = call.get("args") or {}
-                call_id = call.get("id") or name
-                yield {"event": "tool_call", "data": {"name": name, "args": args}}
-                tool_fn = tools_by_name.get(name)
-                output = tool_fn.invoke(args) if tool_fn is not None else json.dumps({"error": f"Unknown tool {name}"})
-                lc_messages.append(ToolMessage(content=output, tool_call_id=call_id))
-
-                summary: Dict[str, Any] = {"name": name}
-                try:
-                    parsed = json.loads(output)
-                    summary["code"] = parsed.get("code")
-                    if name == "make_chart" and isinstance(parsed.get("result"), dict):
-                        yield {"event": "card", "data": parsed["result"]}
-                    if name == "highlight_lineage" and isinstance(parsed.get("result"), dict):
-                        yield {"event": "ui:highlight", "data": parsed["result"]}
-                except Exception:
-                    pass
-                yield {"event": "tool_result", "data": summary}
-
-        yield {"event": "token", "data": "I reached the tool-call limit for this request. Please refine the question."}
-        yield {"event": "done"}
-    except Exception as e:
-        logger.exception(e)
-        yield {"event": "error", "data": str(e)}
diff --git a/src/flowcept/webservice/services/dashboard_store.py b/src/flowcept/webservice/services/dashboard_store.py
deleted file mode 100644
index e1c8a96c..00000000
--- a/src/flowcept/webservice/services/dashboard_store.py
+++ /dev/null
@@ -1,156 +0,0 @@
-"""Dashboard persistence: MongoDB collection when available, JSON files otherwise."""
-
-from __future__ import annotations
-
-import json
-import os
-from pathlib import Path
-from typing import Dict, List, Optional
-
-from flowcept.commons.daos.docdb_dao.docdb_dao_base import DocumentDBDAO
-from flowcept.commons.flowcept_logger import FlowceptLogger
-from flowcept.configs import WEBSERVER_DASHBOARDS_DIR
-
-_SEED_FILE = Path(__file__).parent.parent / "ui_build" / "default_dashboard_configs.json"
-
-
-class MongoDashboardStore:
-    """Dashboard store backed by the ``dashboards`` MongoDB collection."""
-
-    def __init__(self, dao):
-        self._dao = dao
-
-    def save(self, dashboard: Dict) -> bool:
-        """Insert or replace a dashboard document."""
-        return self._dao.save_dashboard(dashboard)
-
-    def get(self, dashboard_id: str) -> Optional[Dict]:
-        """Get a dashboard document by id."""
-        return self._dao.get_dashboard(dashboard_id)
-
-    def list(self) -> List[Dict]:
-        """List all dashboard documents, seeding defaults if the collection is empty."""
-        docs = self._dao.list_dashboards() or []
-        if not docs:
-            docs = self._seed()
-        return docs
-
-    def list_by_type(self, dashboard_type: str) -> List[Dict]:
-        """List dashboard documents of a specific type."""
-        self.list()  # ensure seeded
-        return self._dao.list_dashboards(filter={"dashboard_type": dashboard_type}) or []
-
-    def delete(self, dashboard_id: str) -> bool:
-        """Delete a dashboard document by id."""
-        return self._dao.delete_dashboard(dashboard_id)
-
-    def _seed(self) -> List[Dict]:
-        """Load default configs from the bundled JSON file and persist them."""
-        if not _SEED_FILE.exists():
-            FlowceptLogger().warning(f"Default dashboard configs not found at {_SEED_FILE}")
-            return []
-        try:
-            with open(_SEED_FILE) as f:
-                configs = json.load(f)
-            for doc in configs:
-                self._dao.save_dashboard(doc)
-            return configs
-        except Exception as e:
-            FlowceptLogger().exception(e)
-            return []
-
-
-class FileDashboardStore:
-    """Dashboard store writing one JSON file per dashboard under a local directory."""
-
-    def __init__(self, directory: str = WEBSERVER_DASHBOARDS_DIR):
-        self._dir = Path(directory)
-        self._dir.mkdir(parents=True, exist_ok=True)
-        self.logger = FlowceptLogger()
-
-    def _path(self, dashboard_id: str) -> Path:
-        safe = "".join(c for c in dashboard_id if c.isalnum() or c in "-_")
-        return self._dir / f"{safe}.json"
-
-    def save(self, dashboard: Dict) -> bool:
-        """Insert or replace a dashboard JSON file."""
-        try:
-            with open(self._path(dashboard["dashboard_id"]), "w") as handle:
-                json.dump(dashboard, handle, indent=2)
-            return True
-        except Exception as e:
-            self.logger.exception(e)
-            return False
-
-    def get(self, dashboard_id: str) -> Optional[Dict]:
-        """Get a dashboard from its JSON file."""
-        path = self._path(dashboard_id)
-        if not path.exists():
-            return None
-        try:
-            with open(path) as handle:
-                return json.load(handle)
-        except Exception as e:
-            self.logger.exception(e)
-            return None
-
-    def list(self) -> List[Dict]:
-        """List all dashboards, seeding defaults if the directory is empty."""
-        docs = self._load_all()
-        if not docs:
-            docs = self._seed()
-        return docs
-
-    def list_by_type(self, dashboard_type: str) -> List[Dict]:
-        """List dashboards of a specific type."""
-        self.list()  # ensure seeded
-        return [d for d in self._load_all() if d.get("dashboard_type") == dashboard_type]
-
-    def delete(self, dashboard_id: str) -> bool:
-        """Delete a dashboard JSON file."""
-        path = self._path(dashboard_id)
-        if not path.exists():
-            return False
-        try:
-            os.remove(path)
-            return True
-        except Exception as e:
-            self.logger.exception(e)
-            return False
-
-    def _load_all(self) -> List[Dict]:
-        dashboards = []
-        for path in sorted(self._dir.glob("*.json")):
-            try:
-                with open(path) as handle:
-                    dashboards.append(json.load(handle))
-            except Exception as e:
-                self.logger.exception(e)
-        return dashboards
-
-    def _seed(self) -> List[Dict]:
-        """Load default configs from the bundled JSON file and persist them."""
-        if not _SEED_FILE.exists():
-            self.logger.warning(f"Default dashboard configs not found at {_SEED_FILE}")
-            return []
-        try:
-            with open(_SEED_FILE) as f:
-                configs = json.load(f)
-            for doc in configs:
-                self.save(doc)
-            return configs
-        except Exception as e:
-            self.logger.exception(e)
-            return []
-
-
-def get_dashboard_store():
-    """Return the dashboard store for the configured DocDB backend.
-
-    Mongo-backed deployments store dashboards in a ``dashboards`` collection;
-    other backends fall back to JSON files under ``web_server.dashboards_dir``.
-    """
-    dao = DocumentDBDAO.get_instance(create_indices=False)
-    if hasattr(dao, "save_dashboard"):
-        return MongoDashboardStore(dao)
-    return FileDashboardStore()
diff --git a/src/flowcept/webservice/services/dataflow.py b/src/flowcept/webservice/services/dataflow.py
index 76184bfb..8f3fc594 100644
--- a/src/flowcept/webservice/services/dataflow.py
+++ b/src/flowcept/webservice/services/dataflow.py
@@ -16,7 +16,7 @@
 from typing import Any, Dict, List, Optional, Set
 
 from flowcept.flowcept_api.db_api import DBAPI
-from flowcept.webservice.services.stats import _to_epoch
+from flowcept.commons.utils import to_epoch
 
 MAX_NODES = 400
 _TASK_PROJECTION = [
@@ -117,7 +117,7 @@ def build_dataflow(db: DBAPI, workflow_id: str) -> Optional[Dict[str, Any]]:
     tasks = [t for t in tasks if t.get("used") or t.get("generated")]
     if not tasks:
         return None
-    tasks.sort(key=lambda t: _to_epoch(t.get("started_at")) or 0)
+    tasks.sort(key=lambda t: to_epoch(t.get("started_at")) or 0)
     return _coarse(tasks)
 
 
@@ -209,14 +209,14 @@ def _chunk(payload: Dict[str, Any], role: str) -> str:
         if not used:
             continue
         in_id = _chunk(used, "input")
-        t_start = _to_epoch(t.get("started_at"))
+        t_start = to_epoch(t.get("started_at"))
         for key, value in _flatten_payload(used):
             if _is_trivial(value):
                 continue
             for producer, out_id in producers.get((key, repr(value)), ()):
                 if producer["task_id"] == t["task_id"] or out_id == in_id:
                     continue
-                p_end = _to_epoch(producer.get("ended_at"))
+                p_end = to_epoch(producer.get("ended_at"))
                 if t_start is not None and p_end is not None and p_end > t_start:
                     continue
                 if (out_id, in_id) not in seen_derived:
@@ -229,12 +229,12 @@ def _chunk(payload: Dict[str, Any], role: str) -> str:
         agent_id = t.get("agent_id")
         if source_agent_id and agent_id:
             delegator = None
-            t_start = _to_epoch(t.get("started_at")) or 0
+            t_start = to_epoch(t.get("started_at")) or 0
             for s in tasks:
                 if s.get("agent_id") == source_agent_id:
-                    s_start = _to_epoch(s.get("started_at")) or 0
+                    s_start = to_epoch(s.get("started_at")) or 0
                     if s_start <= t_start:
-                        if delegator is None or s_start > (_to_epoch(delegator.get("started_at")) or 0):
+                        if delegator is None or s_start > (to_epoch(delegator.get("started_at")) or 0):
                             delegator = s
             if delegator:
                 edges.append(
diff --git a/src/flowcept/webservice/services/reports.py b/src/flowcept/webservice/services/reports.py
index 553fcc75..bdd7d1ac 100644
--- a/src/flowcept/webservice/services/reports.py
+++ b/src/flowcept/webservice/services/reports.py
@@ -10,7 +10,7 @@
 from fastapi.responses import JSONResponse, Response
 
 from flowcept.report.service import build_workflow_card, generate_report
-from flowcept.webservice.services.serializers import normalize_docs
+from flowcept.commons.utils import normalize_docs
 
 
 def workflow_card_response(
diff --git a/src/flowcept/webservice/services/serializers.py b/src/flowcept/webservice/services/serializers.py
deleted file mode 100644
index 70ccb2e1..00000000
--- a/src/flowcept/webservice/services/serializers.py
+++ /dev/null
@@ -1,43 +0,0 @@
-"""Serialization helpers for API responses."""
-
-from __future__ import annotations
-
-import base64
-from datetime import datetime
-from typing import Any, Dict, List
-
-
-try:
-    from bson import ObjectId
-except Exception:
-    ObjectId = None
-
-
-def _to_jsonable(value: Any, include_data: bool = False) -> Any:
-    """Recursively normalize values for JSON responses."""
-    if value is None:
-        return None
-    if isinstance(value, (str, int, float, bool)):
-        return value
-    if isinstance(value, datetime):
-        return value.isoformat()
-    if isinstance(value, bytes):
-        if include_data:
-            return base64.b64encode(value).decode("ascii")
-        return None
-    if ObjectId is not None and isinstance(value, ObjectId):
-        return str(value)
-    if isinstance(value, list):
-        return [_to_jsonable(item, include_data=include_data) for item in value]
-    if isinstance(value, tuple):
-        return [_to_jsonable(item, include_data=include_data) for item in value]
-    if isinstance(value, dict):
-        return {
-            str(k): _to_jsonable(v, include_data=include_data) for k, v in value.items() if include_data or k != "data"
-        }
-    return str(value)
-
-
-def normalize_docs(docs: List[Dict[str, Any]], include_data: bool = False) -> List[Dict[str, Any]]:
-    """Normalize result documents for JSON API response."""
-    return [_to_jsonable(doc, include_data=include_data) for doc in docs]
diff --git a/src/flowcept/webservice/services/stats.py b/src/flowcept/webservice/services/stats.py
deleted file mode 100644
index 827a1da9..00000000
--- a/src/flowcept/webservice/services/stats.py
+++ /dev/null
@@ -1,733 +0,0 @@
-"""Aggregation and derivation services for webservice stats endpoints and dashboard cards.
-
-Mongo-backed deployments use native aggregation pipelines; other backends (e.g., LMDB)
-fall back to in-Python aggregation over plain queries.
-"""
-
-from __future__ import annotations
-
-from collections import defaultdict
-from typing import Any, Dict, List, Optional
-
-from flowcept.commons.daos.docdb_dao.docdb_dao_base import DocumentDBDAO
-from flowcept.flowcept_api.db_api import DBAPI
-from flowcept.webservice.schemas.dashboards import ChartData, MetricSpec
-
-
-def _to_epoch(value) -> Optional[float]:
-    """Normalize a timestamp value (float epoch-sec, epoch-ms, ISO string, or datetime) to epoch seconds."""
-    if value is None:
-        return None
-    if isinstance(value, (int, float)):
-        # Epoch milliseconds have 13 digits; epoch seconds have 10.
-        return value / 1000.0 if value > 1e12 else float(value)
-    if isinstance(value, str):
-        from datetime import datetime, timezone
-
-        try:
-            dt = datetime.fromisoformat(value.replace("Z", "+00:00"))
-            return dt.replace(tzinfo=timezone.utc).timestamp() if dt.tzinfo is None else dt.timestamp()
-        except ValueError:
-            return None
-    # pymongo returns datetime objects for BSON Date fields (e.g. from $min/$max aggregations)
-    try:
-        from datetime import datetime, timezone
-
-        if isinstance(value, datetime):
-            return value.replace(tzinfo=timezone.utc).timestamp() if value.tzinfo is None else value.timestamp()
-    except Exception:
-        pass
-    return None
-
-
-def _mongo_dao_or_none(db: Optional[DBAPI] = None) -> Optional[DocumentDBDAO]:
-    """Return the DAO singleton when it supports raw aggregation pipelines, else None."""
-    if db is not None and not isinstance(db, DBAPI):
-        return None
-    try:
-        dao = DocumentDBDAO.get_instance(create_indices=False)
-        return dao if hasattr(dao, "raw_pipeline") else None
-    except Exception:
-        return None
-
-
-def get_nested(item: Dict[str, Any], field: str) -> Any:
-    """Read a dot-notated field value from a document."""
-    current = item
-    for part in field.split("."):
-        if not isinstance(current, dict):
-            return None
-        current = current.get(part)
-    return current
-
-
-def _duration(doc: Dict[str, Any]) -> Optional[float]:
-    started, ended = _to_epoch(doc.get("started_at")), _to_epoch(doc.get("ended_at"))
-    if started is not None and ended is not None:
-        return ended - started
-    return None
-
-
-def task_summary(db: DBAPI, filter: Dict[str, Any]) -> Dict[str, Any]:
-    """Summarize tasks matching a filter: status counts, per-activity stats, and time range.
-
-    Parameters
-    ----------
-    db : DBAPI
-        DB API facade.
-    filter : dict
-        Mongo-style filter over the ``tasks`` collection.
-
-    Returns
-    -------
-    dict
-        ``{"count", "status_counts", "activity_stats", "time_range"}``.
-    """
-    dao = _mongo_dao_or_none(db)
-    if dao is not None:
-        return _task_summary_mongo(dao, filter)
-    return _task_summary_python(db, filter)
-
-
-def _task_summary_mongo(dao, filter: Dict[str, Any]) -> Dict[str, Any]:
-    match = [{"$match": filter}] if filter else []
-    rows = (
-        dao.raw_pipeline(
-            match
-            + [
-                {
-                    "$group": {
-                        "_id": {"activity_id": "$activity_id", "status": "$status"},
-                        "count": {"$sum": 1},
-                        "avg_duration": {"$avg": {"$subtract": ["$ended_at", "$started_at"]}},
-                        "min_duration": {"$min": {"$subtract": ["$ended_at", "$started_at"]}},
-                        "max_duration": {"$max": {"$subtract": ["$ended_at", "$started_at"]}},
-                        "sum_duration": {"$sum": {"$subtract": ["$ended_at", "$started_at"]}},
-                        "min_started_at": {"$min": "$started_at"},
-                        "max_ended_at": {"$max": "$ended_at"},
-                    }
-                }
-            ],
-            collection="tasks",
-        )
-        or []
-    )
-    return _merge_summary_rows(
-        [
-            {
-                "activity_id": row["_id"].get("activity_id"),
-                "status": row["_id"].get("status"),
-                **{k: row.get(k) for k in row if k != "_id"},
-            }
-            for row in rows
-        ]
-    )
-
-
-def _task_summary_python(db: DBAPI, filter: Dict[str, Any]) -> Dict[str, Any]:
-    docs = (
-        db.task_query(
-            filter=filter,
-            projection=["activity_id", "status", "started_at", "ended_at"],
-        )
-        or []
-    )
-    groups: Dict[tuple, Dict[str, Any]] = {}
-    for doc in docs:
-        key = (doc.get("activity_id"), doc.get("status"))
-        group = groups.setdefault(
-            key,
-            {
-                "activity_id": key[0],
-                "status": key[1],
-                "count": 0,
-                "durations": [],
-                "min_started_at": None,
-                "max_ended_at": None,
-            },
-        )
-        group["count"] += 1
-        duration = _duration(doc)
-        if duration is not None:
-            group["durations"].append(duration)
-        started, ended = doc.get("started_at"), doc.get("ended_at")
-        if isinstance(started, (int, float)):
-            current = group["min_started_at"]
-            group["min_started_at"] = started if current is None else min(current, started)
-        if isinstance(ended, (int, float)):
-            current = group["max_ended_at"]
-            group["max_ended_at"] = ended if current is None else max(current, ended)
-
-    rows = []
-    for group in groups.values():
-        durations = group.pop("durations")
-        group["avg_duration"] = sum(durations) / len(durations) if durations else None
-        group["min_duration"] = min(durations) if durations else None
-        group["max_duration"] = max(durations) if durations else None
-        group["sum_duration"] = sum(durations) if durations else None
-        rows.append(group)
-    return _merge_summary_rows(rows)
-
-
-def _merge_summary_rows(rows: List[Dict[str, Any]]) -> Dict[str, Any]:
-    """Combine per-(activity,status) rows into the summary response shape."""
-    status_counts: Dict[str, int] = defaultdict(int)
-    activities: Dict[str, Dict[str, Any]] = {}
-    total = 0
-    min_started, max_ended = None, None
-    for row in rows:
-        count = row.get("count") or 0
-        total += count
-        status = row.get("status") or "UNKNOWN"
-        status_counts[status] += count
-
-        activity = activities.setdefault(
-            str(row.get("activity_id")),
-            {
-                "activity_id": row.get("activity_id"),
-                "count": 0,
-                "status_counts": defaultdict(int),
-                "avg_duration": None,
-                "min_duration": None,
-                "max_duration": None,
-                "sum_duration": None,
-                "_weighted_sum": 0.0,
-                "_weighted_count": 0,
-            },
-        )
-        activity["count"] += count
-        activity["status_counts"][status] += count
-        for bound, op in (("min_duration", min), ("max_duration", max)):
-            if row.get(bound) is not None:
-                current = activity[bound]
-                activity[bound] = row[bound] if current is None else op(current, row[bound])
-        if row.get("sum_duration") is not None:
-            activity["sum_duration"] = (activity["sum_duration"] or 0) + row["sum_duration"]
-        if row.get("avg_duration") is not None:
-            activity["_weighted_sum"] += row["avg_duration"] * count
-            activity["_weighted_count"] += count
-
-        if row.get("min_started_at") is not None:
-            val = _to_epoch(row["min_started_at"])
-            min_started = val if min_started is None else min(min_started, val)
-        if row.get("max_ended_at") is not None:
-            val = _to_epoch(row["max_ended_at"])
-            max_ended = val if max_ended is None else max(max_ended, val)
-
-    activity_stats = []
-    for activity in activities.values():
-        if activity.pop("_weighted_count"):
-            activity["avg_duration"] = activity.pop("_weighted_sum") / activity["count"]
-        else:
-            activity.pop("_weighted_sum")
-        activity["status_counts"] = dict(activity["status_counts"])
-        activity_stats.append(activity)
-    activity_stats.sort(key=lambda a: str(a["activity_id"]))
-
-    return {
-        "count": total,
-        "status_counts": dict(status_counts),
-        "activity_stats": activity_stats,
-        "time_range": {"min_started_at": min_started, "max_ended_at": max_ended},
-    }
-
-
-def derive_campaigns(db: DBAPI) -> List[Dict[str, Any]]:
-    """Derive campaign summaries by grouping workflows and tasks by ``campaign_id``.
-
-    There is no campaigns collection; campaigns exist as a grouping key.
-
-    Returns
-    -------
-    list of dict
-        One record per campaign with workflow/task counts, users, names, and time range.
-    """
-    campaigns: Dict[str, Dict[str, Any]] = {}
-
-    def _campaign(campaign_id: str) -> Dict[str, Any]:
-        return campaigns.setdefault(
-            campaign_id,
-            {
-                "campaign_id": campaign_id,
-                "workflow_count": 0,
-                "task_count": 0,
-                "users": set(),
-                "workflow_names": set(),
-                "first_ts": None,
-                "last_ts": None,
-            },
-        )
-
-    def _expand_range(record: Dict[str, Any], *values) -> None:
-        for raw in values:
-            value = _to_epoch(raw)
-            if value is None:
-                continue
-            record["first_ts"] = value if record["first_ts"] is None else min(record["first_ts"], value)
-            record["last_ts"] = value if record["last_ts"] is None else max(record["last_ts"], value)
-
-    dao = _mongo_dao_or_none(db)
-    if dao is not None:
-        wf_rows = (
-            dao.raw_pipeline(
-                [
-                    {"$match": {"campaign_id": {"$exists": True, "$ne": None}}},
-                    {
-                        "$group": {
-                            "_id": "$campaign_id",
-                            "workflow_count": {"$sum": 1},
-                            "users": {"$addToSet": "$user"},
-                            "workflow_names": {"$addToSet": "$name"},
-                            "first_ts": {"$min": "$utc_timestamp"},
-                            "last_ts": {"$max": "$utc_timestamp"},
-                        }
-                    },
-                ],
-                collection="workflows",
-            )
-            or []
-        )
-        task_rows = (
-            dao.raw_pipeline(
-                [
-                    {"$match": {"campaign_id": {"$exists": True, "$ne": None}}},
-                    {
-                        "$group": {
-                            "_id": "$campaign_id",
-                            "task_count": {"$sum": 1},
-                            "first_ts": {"$min": "$started_at"},
-                            "last_ts": {"$max": "$ended_at"},
-                        }
-                    },
-                ],
-                collection="tasks",
-            )
-            or []
-        )
-        for row in wf_rows:
-            record = _campaign(row["_id"])
-            record["workflow_count"] = row.get("workflow_count", 0)
-            record["users"].update(u for u in row.get("users", []) if u)
-            record["workflow_names"].update(n for n in row.get("workflow_names", []) if n)
-            _expand_range(record, row.get("first_ts"), row.get("last_ts"))
-        for row in task_rows:
-            record = _campaign(row["_id"])
-            record["task_count"] = row.get("task_count", 0)
-            _expand_range(record, row.get("first_ts"), row.get("last_ts"))
-    else:
-        wf_filter = {"campaign_id": {"$exists": True, "$ne": None}}
-        for doc in db.workflow_query(filter=wf_filter) or []:
-            if not doc.get("campaign_id"):
-                continue
-            record = _campaign(doc["campaign_id"])
-            record["workflow_count"] += 1
-            if doc.get("user"):
-                record["users"].add(doc["user"])
-            if doc.get("name"):
-                record["workflow_names"].add(doc["name"])
-            _expand_range(record, doc.get("utc_timestamp"))
-        task_docs = (
-            db.task_query(
-                filter=wf_filter,
-                projection=["campaign_id", "started_at", "ended_at"],
-            )
-            or []
-        )
-        for doc in task_docs:
-            if not doc.get("campaign_id"):
-                continue
-            record = _campaign(doc["campaign_id"])
-            record["task_count"] += 1
-            _expand_range(record, doc.get("started_at"), doc.get("ended_at"))
-
-    results = []
-    for record in campaigns.values():
-        record["users"] = sorted(record["users"])
-        record["workflow_names"] = sorted(record["workflow_names"])
-        results.append(record)
-    results.sort(
-        key=lambda r: (1, r["last_ts"]) if r["last_ts"] is not None else (0, float("-inf")),
-        reverse=True,
-    )
-    return results
-
-
-def derive_agents(db: DBAPI, filter: Optional[Dict[str, Any]] = None) -> List[Dict[str, Any]]:
-    """Derive agent summaries by grouping tasks by ``agent_id`` for agents in the agents collection.
-
-    Parameters
-    ----------
-    db : DBAPI
-        DB API facade.
-    filter : dict, optional
-        Extra Mongo-style filter for querying the agents collection.
-
-    Returns
-    -------
-    list of dict
-        One record per agent with task counts, activities, and last activity time.
-    """
-
-    def to_float_ts(val):
-        if val is None:
-            return None
-        if isinstance(val, (int, float)):
-            return float(val)
-        from datetime import datetime as dt
-
-        if isinstance(val, dt):
-            return val.timestamp()
-        if isinstance(val, str):
-            try:
-                return dt.fromisoformat(val.replace("Z", "+00:00")).timestamp()
-            except Exception:
-                return None
-        return None
-
-    try:
-        stored_agents = db.agent_query(filter=filter or {}) or []
-    except Exception as e:
-        from flowcept.commons.flowcept_logger import FlowceptLogger
-
-        FlowceptLogger().error(f"Error querying stored agents: {e}")
-        stored_agents = []
-
-    # Filter out train_agent_id and orchestrator_agent_id
-    stored_agents = [a for a in stored_agents if a.get("agent_id") not in ("train_agent_id", "orchestrator_agent_id")]
-
-    if not stored_agents:
-        return []
-
-    agent_ids = [a["agent_id"] for a in stored_agents if "agent_id" in a]
-    query_filter = {"agent_id": {"$in": agent_ids}}
-
-    dao = _mongo_dao_or_none(db)
-    if dao is not None:
-        rows = (
-            dao.raw_pipeline(
-                [
-                    {"$match": query_filter},
-                    {
-                        "$group": {
-                            "_id": "$agent_id",
-                            "task_count": {"$sum": 1},
-                            "activities": {"$addToSet": "$activity_id"},
-                            "source_agent_ids": {"$addToSet": "$source_agent_id"},
-                            "campaign_ids": {"$addToSet": "$campaign_id"},
-                            "workflow_ids": {"$addToSet": "$workflow_id"},
-                            "last_active": {"$max": "$registered_at"},
-                        }
-                    },
-                ],
-                collection="tasks",
-            )
-            or []
-        )
-        stats_map = {
-            row["_id"]: {
-                "task_count": row.get("task_count", 0),
-                "activities": sorted(a for a in row.get("activities", []) if a),
-                "source_agent_ids": sorted(s for s in row.get("source_agent_ids", []) if s),
-                "campaign_ids": sorted(c for c in row.get("campaign_ids", []) if c),
-                "workflow_ids": sorted(w for w in row.get("workflow_ids", []) if w),
-                "last_active": to_float_ts(row.get("last_active")),
-            }
-            for row in rows
-        }
-    else:
-        docs = (
-            db.task_query(
-                filter=query_filter,
-                projection=[
-                    "agent_id",
-                    "activity_id",
-                    "source_agent_id",
-                    "campaign_id",
-                    "workflow_id",
-                    "registered_at",
-                ],
-            )
-            or []
-        )
-        stats_map = {}
-        for doc in docs:
-            agent_id = doc.get("agent_id")
-            if not agent_id:
-                continue
-            record = stats_map.setdefault(
-                agent_id,
-                {
-                    "task_count": 0,
-                    "activities": set(),
-                    "source_agent_ids": set(),
-                    "campaign_ids": set(),
-                    "workflow_ids": set(),
-                    "last_active": None,
-                },
-            )
-            record["task_count"] += 1
-            for key, field in (
-                ("activities", "activity_id"),
-                ("source_agent_ids", "source_agent_id"),
-                ("campaign_ids", "campaign_id"),
-                ("workflow_ids", "workflow_id"),
-            ):
-                if doc.get(field):
-                    record[key].add(doc[field])
-            ts = to_float_ts(doc.get("registered_at"))
-            if ts is not None:
-                current = record["last_active"]
-                record["last_active"] = ts if current is None else max(current, ts)
-        for record in stats_map.values():
-            for key in ("activities", "source_agent_ids", "campaign_ids", "workflow_ids"):
-                record[key] = sorted(record[key])
-
-    agents = []
-    for sa in stored_agents:
-        agent_id = sa["agent_id"]
-        stat = stats_map.get(
-            agent_id,
-            {
-                "task_count": 0,
-                "activities": [],
-                "source_agent_ids": [],
-                "campaign_ids": [],
-                "workflow_ids": [],
-                "last_active": None,
-            },
-        )
-        if stat["task_count"] == 0:
-            continue
-        agents.append(
-            {
-                "agent_id": agent_id,
-                "task_count": stat["task_count"],
-                "activities": stat["activities"],
-                "source_agent_ids": stat["source_agent_ids"],
-                "campaign_ids": stat["campaign_ids"],
-                "workflow_ids": stat["workflow_ids"],
-                "last_active": stat["last_active"],
-                "name": sa.get("name"),
-                "registered_at": to_float_ts(sa.get("registered_at")),
-            }
-        )
-
-    agents.sort(
-        key=lambda a: (1, a["registered_at"]) if a["registered_at"] is not None else (0, float("-inf")),
-        reverse=True,
-    )
-    return agents
-
-
-def telemetry_timeseries(
-    db: DBAPI,
-    filter: Dict[str, Any],
-    fields: List[str],
-    x_field: str = "started_at",
-    limit: int = 1000,
-) -> List[Dict[str, Any]]:
-    """Extract plottable rows of dot-notated (telemetry) fields from tasks.
-
-    Parameters
-    ----------
-    db : DBAPI
-        DB API facade.
-    filter : dict
-        Mongo-style filter over tasks.
-    fields : list of str
-        Dot-notated y-value paths (e.g., ``telemetry_at_end.cpu.percent_all``).
-    x_field : str, optional
-        X-axis field (a task time field by default).
-    limit : int, optional
-        Maximum number of rows.
-
-    Returns
-    -------
-    list of dict
-        Rows of ``{x_field, task_id, activity_id, <field>: value, ...}`` sorted by x.
-    """
-    top_level = sorted({field.split(".")[0] for field in fields} | {x_field.split(".")[0]})
-    docs = (
-        db.task_query(
-            filter=filter,
-            projection=["task_id", "activity_id"] + top_level,
-            limit=limit,
-        )
-        or []
-    )
-    rows = []
-    for doc in docs:
-        row = {
-            x_field: get_nested(doc, x_field),
-            "task_id": doc.get("task_id"),
-            "activity_id": doc.get("activity_id"),
-        }
-        row.update({field: get_nested(doc, field) for field in fields})
-        rows.append(row)
-    rows.sort(key=lambda r: (r[x_field] is None, r[x_field]))
-    return rows
-
-
-def _merge_context_filter(card_filter: Dict[str, Any], context: Optional[Dict[str, Any]]) -> Dict[str, Any]:
-    if not context:
-        return dict(card_filter)
-    if not card_filter:
-        return dict(context)
-    return {"$and": [context, card_filter]}
-
-
-def _resolve_collection_sizes(db: DBAPI, query_filter: Dict[str, Any]) -> List[Dict[str, Any]]:
-    """Return per-collection BSON byte totals for the given filter (e.g. workflow_id).
-
-    Uses MongoDB ``$bsonSize`` on each of the three provenance collections.
-    Returns an empty list when Mongo is unavailable.
-    """
-    dao = _mongo_dao_or_none(db)
-    if dao is None:
-        return []
-    rows = []
-    for collection in ("tasks", "objects", "workflows"):
-        try:
-            result = dao.raw_pipeline(
-                [
-                    {"$match": query_filter},
-                    {"$group": {"_id": None, "bytes": {"$sum": {"$bsonSize": "$$ROOT"}}}},
-                ],
-                collection=collection,
-            )
-            bytes_val = result[0]["bytes"] if result else 0
-        except Exception:
-            bytes_val = 0
-        rows.append({"collection": collection, "sum_bytes": bytes_val})
-    return rows
-
-
-def resolve_chart_data(db: DBAPI, data: "ChartData", context: Optional[Dict[str, Any]] = None) -> Dict[str, Any]:
-    """Resolve a declarative card data binding into plottable rows.
-
-    This is the single data contract shared by dashboard cards, the stats router,
-    and LLM chart tools.
-
-    Parameters
-    ----------
-    db : DBAPI
-        DB API facade.
-    data : ChartData
-        Declarative binding (source, filter, group_by/metrics or x/y, sort, limit).
-    context : dict, optional
-        Dashboard-level filter ANDed into the card filter (e.g., ``{"campaign_id": ...}``).
-
-    Returns
-    -------
-    dict
-        ``{"rows": [...], "count": int}``.
-    """
-    query_filter = _merge_context_filter(data.filter, context)
-
-    if data.source == "collection_sizes":
-        rows = _resolve_collection_sizes(db, query_filter)
-        return {"rows": rows, "count": len(rows)}
-
-    if data.group_by or data.metrics:
-        rows = _resolve_grouped(db, data, query_filter)
-    elif data.x and data.y:
-        rows = telemetry_timeseries(db, query_filter, fields=data.y, x_field=data.x, limit=data.limit)
-    else:
-        sort = None if data.sort is None else [(s.field, s.order) for s in data.sort]
-        rows = (
-            db.query(
-                collection=data.source,
-                filter=query_filter,
-                limit=data.limit,
-                sort=sort,
-            )
-            or []
-        )
-    rows = rows[: data.limit]
-    return {"rows": rows, "count": len(rows)}
-
-
-def _resolve_grouped(db: DBAPI, data: "ChartData", query_filter: Dict[str, Any]) -> List[Dict[str, Any]]:
-    """Group/aggregate rows for a card, using Mongo pipelines when available."""
-    metrics = data.metrics or [MetricSpec(field="", agg="count")]
-    dao = _mongo_dao_or_none(db)
-    has_elapsed_metric = any(getattr(m, "field", None) == "elapsed" for m in metrics)
-    if dao is not None and data.source in ("tasks", "workflows", "objects") and not has_elapsed_metric:
-        group_id = f"${data.group_by}" if data.group_by else None
-        group_stage: Dict[str, Any] = {"_id": group_id}
-        # MongoDB forbids dots in $group output field names; use underscores internally
-        # and remap back to the canonical key before returning.
-        mongo_key_map: Dict[str, str] = {}
-        for metric in metrics:
-            canonical = _metric_key(metric)
-            mongo_key = canonical.replace(".", "_")
-            mongo_key_map[mongo_key] = canonical
-            if metric.agg == "count":
-                group_stage[mongo_key] = {"$sum": 1}
-            else:
-                group_stage[mongo_key] = {f"${metric.agg}": f"${metric.field}"}
-        pipeline = ([{"$match": query_filter}] if query_filter else []) + [{"$group": group_stage}]
-        rows = dao.raw_pipeline(pipeline, collection=data.source) or []
-        out = []
-        for row in rows:
-            record = {data.group_by or "group": row.pop("_id")}
-            for mongo_key, canonical in mongo_key_map.items():
-                if mongo_key in row:
-                    record[canonical] = row.pop(mongo_key)
-            record.update(row)
-            out.append(record)
-        out.sort(key=lambda r: str(r.get(data.group_by or "group")))
-        return out
-
-    fields = sorted({m.field for m in metrics if m.field and m.field != "elapsed"})
-    elapsed_fields = ["started_at", "ended_at"] if has_elapsed_metric else []
-    top_level = sorted(
-        {f.split(".")[0] for f in fields}
-        | ({data.group_by.split(".")[0]} if data.group_by else set())
-        | set(elapsed_fields)
-    )
-    docs = (
-        db.query(
-            collection=data.source,
-            filter=query_filter,
-            projection=top_level or None,
-        )
-        or []
-    )
-    grouped: Dict[Any, List[Dict[str, Any]]] = defaultdict(list)
-    for doc in docs:
-        grouped[get_nested(doc, data.group_by) if data.group_by else None].append(doc)
-    out = []
-    for key, docs_in_group in grouped.items():
-        record = {data.group_by or "group": key}
-        for metric in metrics:
-            if metric.field == "elapsed":
-                # Compute elapsed as ended_at - started_at for each doc
-                def _elapsed(d: Dict[str, Any]) -> Optional[float]:
-                    s, e = _to_epoch(d.get("started_at")), _to_epoch(d.get("ended_at"))
-                    return (e - s) if s is not None and e is not None else None
-
-                values = [v for v in (_elapsed(d) for d in docs_in_group) if v is not None]
-            else:
-                values = [
-                    v for v in (get_nested(d, metric.field) for d in docs_in_group) if isinstance(v, (int, float))
-                ]
-            if metric.agg == "count":
-                record[_metric_key(metric)] = len(docs_in_group)
-            elif not values:
-                record[_metric_key(metric)] = None
-            elif metric.agg == "avg":
-                record[_metric_key(metric)] = sum(values) / len(values)
-            elif metric.agg == "sum":
-                record[_metric_key(metric)] = sum(values)
-            elif metric.agg == "min":
-                record[_metric_key(metric)] = min(values)
-            elif metric.agg == "max":
-                record[_metric_key(metric)] = max(values)
-        out.append(record)
-    out.sort(key=lambda r: str(r.get(data.group_by or "group")))
-    return out
-
-
-def _metric_key(metric: "MetricSpec") -> str:
-    return f"{metric.agg}_{metric.field}" if metric.field else metric.agg
diff --git a/src/flowcept/webservice/services/streaming.py b/src/flowcept/webservice/services/streaming.py
index 126c97d9..9522fcbd 100644
--- a/src/flowcept/webservice/services/streaming.py
+++ b/src/flowcept/webservice/services/streaming.py
@@ -11,7 +11,6 @@
 from datetime import datetime, timezone
 from typing import Any, Dict, List, Optional, Tuple
 
-from flowcept.commons.daos.docdb_dao.docdb_dao_base import DocumentDBDAO
 from flowcept.flowcept_api.db_api import DBAPI
 
 TASK_CURSOR_FIELDS = ("registered_at", "started_at", "ended_at", "utc_timestamp")
@@ -19,8 +18,7 @@
 
 
 def _supports_operators() -> bool:
-    dao = DocumentDBDAO.get_instance(create_indices=False)
-    return hasattr(dao, "raw_pipeline")
+    return hasattr(DBAPI.get_dao_instance(), "raw_pipeline")
 
 
 def _as_epoch(value: Any) -> Optional[float]:
diff --git a/tests/adapters/test_dask.py b/tests/adapters/test_dask.py
index f578a3a5..d945b011 100644
--- a/tests/adapters/test_dask.py
+++ b/tests/adapters/test_dask.py
@@ -23,7 +23,6 @@ def problem_evaluate(phenome, uuid):
 def dummy_func1(x):
     cool_var = "cool value"  # test if we can intercept this var
     print(cool_var)
-    y = cool_var
     return x * 2
 
 
@@ -52,7 +51,7 @@ def __init__(self, *args, **kwargs):
     def test_dummyfunc(self):
         client, cluster = start_local_dask_cluster(n_workers=1)
         i1 = np.random.random()
-        o1 = client.submit(dummy_func1, i1)
+        client.submit(dummy_func1, i1)
         stop_local_dask_cluster(client, cluster)
         # self.logger.debug(o1.result())
 
diff --git a/tests/adapters/test_dask_with_context_mgmt.py b/tests/adapters/test_dask_with_context_mgmt.py
index 504755cb..b16c66d9 100644
--- a/tests/adapters/test_dask_with_context_mgmt.py
+++ b/tests/adapters/test_dask_with_context_mgmt.py
@@ -8,7 +8,6 @@
 from flowcept.commons.flowcept_logger import FlowceptLogger
 from flowcept.commons.utils import assert_by_querying_tasks_until
 from flowcept.flowceptor.adapters.dask.dask_plugins import (
-    set_workflow_info_on_workers,
     FlowceptDaskWorkerAdapter,
 )
 from tests.adapters.dask_test_utils import (
@@ -19,7 +18,6 @@
 def dummy_func1(x):
     cool_var = "cool value"  # test if we can intercept this var
     print(cool_var)
-    y = cool_var
     return x * 2
 
 
diff --git a/tests/adapters/test_mlflow.py b/tests/adapters/test_mlflow.py
index 8a83f9f3..71dd954a 100644
--- a/tests/adapters/test_mlflow.py
+++ b/tests/adapters/test_mlflow.py
@@ -1,6 +1,5 @@
 import os
 import unittest
-import os
 import uuid
 from time import sleep
 import numpy as np
diff --git a/tests/agent/agent_tests.py b/tests/agent/agent_tests.py
index 057473b4..53b6368c 100644
--- a/tests/agent/agent_tests.py
+++ b/tests/agent/agent_tests.py
@@ -3,6 +3,8 @@
 import tempfile
 from time import sleep
 import unittest
+
+import pytest
 from unittest.mock import patch
 
 import pandas as pd
@@ -35,7 +37,7 @@ def test_loads_jsonl_buffer_when_mq_disabled(self):
             FlowceptLogger().warning("Skipping no-MQ agent buffer test because instrumentation is disabled.")
             self.skipTest("Instrumentation is disabled.")
 
-        from flowcept.agents import flowcept_agent as agent_module
+        from flowcept.agents.mcp import mcp_server as agent_module
 
         with tempfile.NamedTemporaryFile(mode="w", suffix=".jsonl", delete=False) as handle:
             buffer_path = handle.name
@@ -44,13 +46,15 @@ def test_loads_jsonl_buffer_when_mq_disabled(self):
             TestAgent.offline_buffer_task(1, 2)
             f.dump_buffer(path=buffer_path)
 
-        agent = agent_module.FlowceptAgent(buffer_path=buffer_path)
+        agent = agent_module.FlowceptMCPServer(buffer_path=buffer_path)
         agent.start()
         try:
+            from flowcept.agents.mcp.mcp_client import run_tool
+
             sleep(0.5)
-            resp = agent.query("how many tasks?")
-            tool_result = ToolResult(**json.loads(resp))
-            self.assertTrue(tool_result.code in {201, 301})
+            resp = run_tool("get_latest")[0]
+            latest = json.loads(resp)
+            self.assertEqual(latest["activity_id"], "offline_buffer_task")
         finally:
             agent.stop()
 
@@ -68,8 +72,8 @@ def test_mcp_db_backed_provenance_tools(self):
 
         from uuid import uuid4
 
-        from flowcept.agents import flowcept_agent as agent_module
-        from flowcept.agents.agent_client import run_tool
+        from flowcept.agents.mcp import mcp_server as agent_module
+        from flowcept.agents.mcp.mcp_client import run_tool
         from flowcept.instrumentation.task_capture import FlowceptTask
 
         campaign_id = f"mcp-campaign-{uuid4()}"
@@ -83,16 +87,16 @@ def test_mcp_db_backed_provenance_tools(self):
             sleep(0.5)
             deadline -= 1
 
-        agent = agent_module.FlowceptAgent()
+        agent = agent_module.FlowceptMCPServer()
         agent.start()
         try:
-            resp = run_tool("query_provenance_tasks", kwargs={"filter": {"workflow_id": workflow_id}})[0]
+            resp = run_tool("query_tasks", kwargs={"filter": {"workflow_id": workflow_id}})[0]
             tool_result = ToolResult(**json.loads(resp))
             self.assertIn(tool_result.code, {201, 301})
             items = tool_result.result["items"]
             self.assertTrue(any(t["activity_id"] == "mcp_seed" for t in items))
 
-            resp = run_tool("list_provenance_campaigns", kwargs={})[0]
+            resp = run_tool("list_campaigns", kwargs={})[0]
             tool_result = ToolResult(**json.loads(resp))
             self.assertIn(tool_result.code, {201, 301})
             self.assertTrue(any(c["campaign_id"] == campaign_id for c in tool_result.result["items"]))
@@ -102,6 +106,95 @@ def test_mcp_db_backed_provenance_tools(self):
                 DocumentDBDAO._instance.close()
 
 
+class TestDbQueryToolsIntegration(unittest.TestCase):
+    """Integration tests for data_query_tools/db_query_tools.py.
+
+    Requires real MongoDB + Redis services.  Guards skip when unavailable.
+    """
+
+    def setUp(self):
+        from flowcept.configs import MONGO_ENABLED
+
+        if not MONGO_ENABLED:
+            FlowceptLogger().warning("Skipping db_query_tools integration tests: MongoDB disabled.")
+            self.skipTest("MongoDB is disabled.")
+        if not Flowcept.services_alive():
+            FlowceptLogger().warning("Skipping db_query_tools integration tests: services not alive.")
+            self.skipTest("Flowcept services are not alive.")
+
+    def test_i2_query_tasks_returns_seeded_task(self):
+        """query_tasks returns tasks matching a workflow_id filter."""
+        from uuid import uuid4
+        from flowcept.agents.data_query_tools.db_query_tools import query_tasks
+        from flowcept.instrumentation.task_capture import FlowceptTask
+        from flowcept.commons.daos.docdb_dao.docdb_dao_base import DocumentDBDAO
+
+        campaign_id = f"dqt-test-{uuid4()}"
+        with Flowcept(campaign_id=campaign_id, workflow_name=f"dqt-wf-{uuid4()}"):
+            workflow_id = Flowcept.current_workflow_id
+            with FlowceptTask(activity_id="dqt_activity", used={"p": 42}) as task:
+                task.end(generated={"result": 99})
+
+        deadline = 20
+        while deadline > 0 and not (Flowcept.db.task_query(filter={"workflow_id": workflow_id}) or []):
+            sleep(0.5)
+            deadline -= 1
+
+        result = query_tasks(filter={"workflow_id": workflow_id})
+        self.assertIn(result.code, {201, 301})
+        items = result.result["items"]
+        self.assertTrue(any(t["activity_id"] == "dqt_activity" for t in items))
+
+        try:
+            if DocumentDBDAO._instance is not None:
+                DocumentDBDAO._instance.close()
+        except Exception:
+            pass
+
+    def test_i2_list_campaigns_includes_seeded_campaign(self):
+        """list_campaigns returns a campaign for a seeded workflow."""
+        from uuid import uuid4
+        from flowcept.agents.data_query_tools.db_query_tools import list_campaigns
+        from flowcept.instrumentation.task_capture import FlowceptTask
+        from flowcept.commons.daos.docdb_dao.docdb_dao_base import DocumentDBDAO
+
+        campaign_id = f"dqt-campaign-{uuid4()}"
+        with Flowcept(campaign_id=campaign_id, workflow_name=f"dqt-wf-{uuid4()}"):
+            workflow_id = Flowcept.current_workflow_id
+            with FlowceptTask(activity_id="dqt_campaign_activity") as task:
+                task.end()
+
+        deadline = 20
+        while deadline > 0 and not (Flowcept.db.task_query(filter={"workflow_id": workflow_id}) or []):
+            sleep(0.5)
+            deadline -= 1
+
+        result = list_campaigns()
+        self.assertIn(result.code, {201, 301})
+        campaigns = result.result["items"]
+        self.assertTrue(any(c["campaign_id"] == campaign_id for c in campaigns))
+
+        try:
+            if DocumentDBDAO._instance is not None:
+                DocumentDBDAO._instance.close()
+        except Exception:
+            pass
+
+    def test_i2_validate_filter_rejects_disallowed_operator(self):
+        """validate_filter raises ValueError for operators not in the allowlist."""
+        from flowcept.agents.data_query_tools.db_query_tools import validate_filter
+
+        with self.assertRaises(ValueError):
+            validate_filter({"status": {"$where": "this.x > 0"}})
+
+    def test_i2_query_tasks_rejects_bad_filter(self):
+        """query_tasks returns an error code when given a disallowed filter operator."""
+        from flowcept.agents.data_query_tools.db_query_tools import query_tasks
+
+        result = query_tasks(filter={"status": {"$where": "this.x > 0"}})
+        self.assertTrue(result.code >= 400, f"Expected error code, got {result.code}")
+
+
 class TestAgentInMemoryQueryTools(unittest.TestCase):
     class _DummyContext:
         def __init__(self, df, schema, value_examples, custom_user_guidance):
@@ -113,7 +206,7 @@ def __init__(self, df, schema, value_examples, custom_user_guidance):
             self.request_context.lifespan_context.custom_guidance = custom_user_guidance
 
     def test_build_df_query_prompt_returns_prompt_payload(self):
-        from flowcept.agents.prompts import in_memory_query_prompts as t
+        from flowcept.agents.mcp import mcp_prompts as t
 
         df = pd.DataFrame({"activity_id": ["a", "b"], "used.x": [1, 2]})
         schema = {"activity_a": {"i": ["used.x"], "o": []}}
@@ -135,7 +228,7 @@ def test_build_df_query_prompt_returns_prompt_payload(self):
         self.assertIn("count tasks by activity", prompt_text)
 
     def test_build_df_query_prompt_returns_404_when_df_missing(self):
-        from flowcept.agents.prompts import in_memory_query_prompts as t
+        from flowcept.agents.mcp import mcp_prompts as t
 
         dummy_ctx = self._DummyContext(df=pd.DataFrame(), schema={}, value_examples={}, custom_user_guidance=[])
         with patch.object(t.mcp_flowcept, "get_context", return_value=dummy_ctx):
@@ -144,7 +237,7 @@ def test_build_df_query_prompt_returns_404_when_df_missing(self):
         self.assertEqual(prompt_text, "Current df is empty or null.")
 
     def test_execute_generated_df_code_runs_against_current_df(self):
-        from flowcept.agents.tools.in_memory_queries import in_memory_queries_tools as t
+        from flowcept.agents.mcp.mcp_tools import in_memory_task_query_mcp_tools as t
 
         df = pd.DataFrame({"a": [1, 2, 3], "b": [10, 20, 30]})
         dummy_ctx = self._DummyContext(df=df, schema={}, value_examples={}, custom_user_guidance=[])
@@ -159,7 +252,7 @@ def test_execute_generated_df_code_runs_against_current_df(self):
         self.assertIn("2", tool_result.result["result_df"])
 
     def test_generate_workflow_card_tool(self):
-        from flowcept.agents.tools import general_tools as g
+        from flowcept.agents.mcp.mcp_tools import report_tools as g
 
         expected_stats = {"markdown": "# Workflow Card: Demo\n\nBody"}
 
@@ -201,7 +294,7 @@ def test_llm_query_over_buffer(self):
             masked = f"{key[:4]}...{key[-4:]}" if len(key) > 8 else key
             print(f"Using agent.api_key: {masked}")
 
-        from flowcept.agents import flowcept_agent as agent_module
+        from flowcept.agents.mcp import mcp_server as agent_module
 
         with tempfile.NamedTemporaryFile(mode="w", suffix=".jsonl", delete=False) as buffer_handle:
             buffer_path = buffer_handle.name
@@ -210,14 +303,721 @@ def test_llm_query_over_buffer(self):
             TestAgent.offline_buffer_task(1, 2)
             f.dump_buffer(path=buffer_path)
 
-        agent = agent_module.FlowceptAgent(buffer_path=buffer_path)
+        agent = agent_module.FlowceptMCPServer(buffer_path=buffer_path)
         agent.start()
         try:
-            sleep(0.5)
-            resp = agent.query("how many tasks?")
-            tool_result = ToolResult(**json.loads(resp))
+            from flowcept.agents.mcp.mcp_client import run_tool
 
-            print(f"LLM response: {tool_result.result}")
-            self.assertTrue(tool_result.code in {201, 301})
+            sleep(0.5)
+            resp = run_tool("get_latest")[0]
+            latest = json.loads(resp)
+            self.assertEqual(latest["activity_id"], "offline_buffer_task")
         finally:
             agent.stop()
+
+
+class TestSchemaIntrospection(unittest.TestCase):
+    """Unit tests for static_schema_builder.py — no services, no LLM required."""
+
+    def test_get_attribute_docstrings_returns_documented_fields(self):
+        from flowcept.agents.provenance_schema_manager.static_schema_builder import get_attribute_docstrings
+
+        class _Documented:
+            foo: str = None
+            """Description of foo."""
+            bar: int = None
+            """Description of bar."""
+
+        docs = get_attribute_docstrings(_Documented)
+        self.assertEqual(docs["foo"], "Description of foo.")
+        self.assertEqual(docs["bar"], "Description of bar.")
+
+    def test_get_attribute_docstrings_excludes_undocumented(self):
+        from flowcept.agents.provenance_schema_manager.static_schema_builder import get_attribute_docstrings
+
+        class _Mixed:
+            documented: str = None
+            """Has a docstring."""
+            undocumented: int = None
+
+        docs = get_attribute_docstrings(_Mixed)
+        self.assertIn("documented", docs)
+        self.assertNotIn("undocumented", docs)
+
+    def test_assert_schema_documented_passes_on_full_coverage(self):
+        from flowcept.agents.provenance_schema_manager.static_schema_builder import assert_schema_documented
+
+        class _Full:
+            x: str = None
+            """Describes x."""
+            y: float = None
+            """Describes y."""
+
+        assert_schema_documented(_Full)  # must not raise
+
+    def test_assert_schema_documented_raises_on_missing(self):
+        from flowcept.agents.provenance_schema_manager.static_schema_builder import assert_schema_documented, SchemaDocumentationError
+
+        class _Partial:
+            good: str = None
+            """Has a docstring."""
+            bad: int = None
+
+        with self.assertRaises(SchemaDocumentationError) as ctx:
+            assert_schema_documented(_Partial)
+        self.assertIn("bad", str(ctx.exception))
+        self.assertIn("_Partial", str(ctx.exception))
+
+    def test_assert_schema_documented_error_message_is_actionable(self):
+        from flowcept.agents.provenance_schema_manager.static_schema_builder import assert_schema_documented, SchemaDocumentationError
+
+        class _Empty:
+            field_a: str = None
+            field_b: int = None
+
+        with self.assertRaises(SchemaDocumentationError) as ctx:
+            assert_schema_documented(_Empty)
+        msg = str(ctx.exception)
+        self.assertIn("field_a", msg)
+        self.assertIn("field_b", msg)
+        self.assertIn("triple-quoted", msg)
+
+    def test_domain_classes_all_documented(self):
+        """All domain classes must pass the startup assert — catches regressions."""
+        from flowcept.agents.provenance_schema_manager.static_schema_builder import assert_schema_documented
+        from flowcept.commons.flowcept_dataclasses.task_object import TaskObject
+        from flowcept.commons.flowcept_dataclasses.workflow_object import WorkflowObject
+        from flowcept.commons.flowcept_dataclasses.agent_object import AgentObject
+        from flowcept.commons.flowcept_dataclasses.blob_object import BlobObject
+        from flowcept.commons.task_data_preprocess import (
+            TelemetrySummary, CpuSummary, MemorySummary, DiskSummary, NetworkSummary,
+        )
+
+        assert_schema_documented(
+            TaskObject, WorkflowObject, AgentObject, BlobObject,
+            TelemetrySummary, CpuSummary, MemorySummary, DiskSummary, NetworkSummary,
+        )
+
+    def test_build_schema_context_returns_expected_keys(self):
+        from flowcept.agents.provenance_schema_manager.static_schema_builder import build_schema_context
+
+        ctx = build_schema_context()
+        for key in ("task_fields", "workflow_fields", "agent_fields", "blob_fields", "telemetry_summary_fields"):
+            self.assertIn(key, ctx)
+            self.assertIsInstance(ctx[key], list)
+            self.assertTrue(len(ctx[key]) > 0, f"{key} must not be empty")
+
+    def test_build_schema_context_task_fields_have_required_keys(self):
+        from flowcept.agents.provenance_schema_manager.static_schema_builder import build_schema_context
+
+        ctx = build_schema_context()
+        field_names = {f["name"] for f in ctx["task_fields"]}
+        for expected in ("task_id", "workflow_id", "activity_id", "started_at", "ended_at", "hostname"):
+            self.assertIn(expected, field_names)
+
+    def test_build_schema_context_telemetry_expands_subfields(self):
+        from flowcept.agents.provenance_schema_manager.static_schema_builder import build_schema_context
+
+        ctx = build_schema_context()
+        field_names = {f["name"] for f in ctx["telemetry_summary_fields"]}
+        for expected in (
+            "duration_sec",
+            "cpu.percent_all_diff",
+            "memory.used_mem_diff",
+            "disk.read_bytes_diff",
+            "network.bytes_sent_diff",
+        ):
+            self.assertIn(expected, field_names)
+
+    def test_telemetry_summary_fields_match_summarize_telemetry_output(self):
+        """TelemetrySummary schema must match the actual keys produced by summarize_telemetry()."""
+        from flowcept.agents.provenance_schema_manager.static_schema_builder import get_attribute_docstrings
+        from flowcept.commons.task_data_preprocess import (
+            CpuSummary, MemorySummary, DiskSummary, NetworkSummary,
+            summarize_telemetry,
+        )
+
+        cpu = {"percent_all": 10.0, "times_avg": {"user": 1.0, "system": 0.5, "idle": 8.5}}
+        disk = {"io_sum": {"read_bytes": 100, "write_bytes": 50, "read_count": 5, "write_count": 3}}
+        memory = {"virtual": {"used": 1024, "percent": 50.0}, "swap": {"used": 0}}
+        network = {"netio_sum": {"bytes_sent": 200, "bytes_recv": 300, "packets_sent": 2, "packets_recv": 3}}
+
+        task = {
+            "started_at": 1000.0,
+            "ended_at": 1042.7,
+            "telemetry_at_start": {"cpu": cpu, "disk": disk, "memory": memory, "network": network},
+            "telemetry_at_end": {
+                "cpu": {"percent_all": 20.0, "times_avg": {"user": 2.0, "system": 1.0, "idle": 7.0}},
+                "disk": {"io_sum": {"read_bytes": 200, "write_bytes": 100, "read_count": 10, "write_count": 6}},
+                "memory": {"virtual": {"used": 2048, "percent": 60.0}, "swap": {"used": 128}},
+                "network": {"netio_sum": {"bytes_sent": 400, "bytes_recv": 600, "packets_sent": 4, "packets_recv": 6}},
+            },
+        }
+
+        import logging
+        logger = logging.getLogger("test")
+        result = summarize_telemetry(task, logger)
+
+        sub_map = {"cpu": CpuSummary, "memory": MemorySummary, "disk": DiskSummary, "network": NetworkSummary}
+        for section, sub_cls in sub_map.items():
+            self.assertIn(section, result, f"summarize_telemetry must produce '{section}' key")
+            schema_keys = set(get_attribute_docstrings(sub_cls).keys())
+            actual_keys = set(result[section].keys())
+            self.assertEqual(schema_keys, actual_keys, f"{sub_cls.__name__} schema mismatch for '{section}'")
+
+    def test_lifespan_override_runs_schema_assert_and_populates_context(self):
+        """Importing the ctx manager module triggers no errors and the lifespan method is overridden."""
+        from flowcept.agents.mcp.context_manager import FlowceptAgentContextManager
+        from flowcept.agents.provenance_schema_manager.static_schema_builder import assert_schema_documented, build_schema_context, SCHEMA_CONTEXT
+
+        # Confirm the override is defined directly on FlowceptAgentContextManager (not just inherited).
+        self.assertIn("lifespan", FlowceptAgentContextManager.__dict__)
+
+        # Simulate what the lifespan does at startup (sans the async machinery).
+        from flowcept.commons.flowcept_dataclasses.task_object import TaskObject
+        from flowcept.commons.flowcept_dataclasses.workflow_object import WorkflowObject
+        from flowcept.commons.flowcept_dataclasses.agent_object import AgentObject
+        from flowcept.commons.flowcept_dataclasses.blob_object import BlobObject
+        from flowcept.commons.task_data_preprocess import (
+            TelemetrySummary, CpuSummary, MemorySummary, DiskSummary, NetworkSummary,
+        )
+        # Should not raise — all domain classes are fully documented.
+        assert_schema_documented(
+            TaskObject, WorkflowObject, AgentObject, BlobObject,
+            TelemetrySummary, CpuSummary, MemorySummary, DiskSummary, NetworkSummary,
+        )
+        ctx = build_schema_context()
+        SCHEMA_CONTEXT.update(ctx)
+        self.assertEqual(set(SCHEMA_CONTEXT.keys()), {
+            "task_fields", "workflow_fields", "agent_fields", "blob_fields", "telemetry_summary_fields"
+        })
+        # SCHEMA_CONTEXT is populated in the module; check it is the same object.
+        from flowcept.agents.provenance_schema_manager import static_schema_builder as si
+        self.assertIs(SCHEMA_CONTEXT, si.SCHEMA_CONTEXT)
+
+
+class TestRefactoredAgentStructure(unittest.TestCase):
+    """Structural import tests for the C/D/E/F refactor.
+
+    All tests are pure import / attribute checks — no live services needed.
+    TDD: these tests are written first; they fail until the refactor is implemented.
+    """
+
+    # ── C4: ToolResult extracted to tool_result.py ────────────────────────
+    def test_c4_tool_result_importable_from_new_module(self):
+        from flowcept.agents.tool_result import ToolResult
+        r = ToolResult(code=201, result="ok")
+        self.assertTrue(r.is_success())
+        self.assertTrue(r.result_is_str())
+
+    # ── C5: build_llm_model + normalize_message in llm/builders.py ────────
+    def test_c5_llm_builders_importable(self):
+        from flowcept.agents.llm.builders import build_llm_model, normalize_message
+        self.assertTrue(callable(build_llm_model))
+        self.assertEqual(normalize_message(" Hello? "), "hello")
+
+    # ── C1: mcp_server.py (was flowcept_agent.py) ─────────────────────────
+    def test_c1_mcp_server_importable(self):
+        from flowcept.agents.mcp.mcp_server import FlowceptMCPServer
+        self.assertTrue(callable(FlowceptMCPServer))
+
+    # ── C2: mcp_client.py (was agent_client.py) ───────────────────────────
+    def test_c2_mcp_client_importable(self):
+        from flowcept.agents.mcp.mcp_client import run_tool, run_prompt
+        self.assertTrue(callable(run_tool))
+        self.assertTrue(callable(run_prompt))
+
+    # ── C3: context_manager.py (was flowcept_ctx_manager.py) ──────────────
+    def test_c3_context_manager_importable(self):
+        from flowcept.agents.mcp.context_manager import (
+            ctx_manager,
+            mcp_flowcept,
+        )
+        self.assertIsNotNone(ctx_manager)
+        self.assertEqual(mcp_flowcept.name, "FlowceptAgent")
+
+    # ── D1: db_query_tools.py ─────────────────────────────────────────────
+    def test_d1_db_query_tools_importable(self):
+        from flowcept.agents.data_query_tools.db_query_tools import (
+            query_tasks,
+            ALLOWED_FILTER_OPERATORS,
+            validate_filter,
+        )
+        self.assertIn("$eq", ALLOWED_FILTER_OPERATORS)
+        self.assertTrue(callable(query_tasks))
+        validate_filter({"status": {"$eq": "FINISHED"}})  # must not raise
+
+    # ── D2: in_memory_task_query_tools.py ─────────────────────────────────
+    def test_d2_in_memory_task_query_tools_importable(self):
+        from flowcept.agents.data_query_tools.in_memory_task_query_tools import (
+            run_df_query,
+        )
+        self.assertTrue(callable(run_df_query))
+
+    # ── D3: pandas_utils.py ───────────────────────────────────────────────
+    def test_d3_pandas_utils_importable(self):
+        from flowcept.agents.data_query_tools.pandas_utils import (
+            safe_execute,
+        )
+        self.assertTrue(callable(safe_execute))
+
+    # ── D4: in_memory_workflow_query_tools.py ─────────────────────────────
+    def test_d4_in_memory_workflow_query_tools_importable(self):
+        from flowcept.agents.data_query_tools.in_memory_workflow_query_tools import (
+            execute_generated_workflow_query,
+            _resolve_path,
+        )
+        self.assertTrue(callable(execute_generated_workflow_query))
+        self.assertEqual(_resolve_path({"a": {"b": 1}}, "a.b"), 1)
+
+    # ── E1: db_query_mcp_tools.py — no _provenance_ infix ─────────────────
+    def test_e1_db_query_mcp_tools_importable_and_names_clean(self):
+        from flowcept.agents.mcp.mcp_tools import db_query_mcp_tools
+        for name in ("query_tasks", "query_workflows", "get_task_summary", "list_campaigns", "list_agents"):
+            self.assertTrue(hasattr(db_query_mcp_tools, name), f"missing {name}")
+            self.assertNotIn("provenance", name, f"{name} must not contain 'provenance'")
+
+    # ── E4: session_tools.py + report_tools.py ────────────────────────────
+    def test_e4_session_tools_importable(self):
+        from flowcept.agents.mcp.mcp_tools import (
+            check_liveness,
+        )
+        self.assertTrue(callable(check_liveness))
+
+    def test_e4_report_tools_importable(self):
+        from flowcept.agents.mcp.mcp_tools import generate_workflow_card
+        self.assertTrue(callable(generate_workflow_card))
+
+    # ── F1: base_prompts.py — BASE_ROLE + build_*_prompt functions ─────────
+    def test_f1_base_prompts_importable(self):
+        from flowcept.agents.prompts.base_prompts import (
+            BASE_ROLE,
+            build_single_task_prompt,
+            build_multitask_prompt,
+        )
+        self.assertIn("provenance", BASE_ROLE.lower())
+        self.assertTrue(callable(build_single_task_prompt))
+        self.assertTrue(callable(build_multitask_prompt))
+
+    # ── F2: db_query_prompts.py ───────────────────────────────────────────
+    def test_f2_db_query_prompts_importable(self):
+        from flowcept.agents.prompts.db_query_prompts import build_db_filter_prompt
+        self.assertTrue(callable(build_db_filter_prompt))
+        result = build_db_filter_prompt("find tasks in error")
+        self.assertIsInstance(result, str)
+        self.assertGreater(len(result), 0)
+
+    def test_f3_schema_prompt_context_is_domain_neutral_and_shared(self):
+        from flowcept.agents.prompts.schema_prompt_context import (
+            build_allowed_fields_prompt,
+            build_example_values_prompt,
+            build_task_static_field_table,
+            build_task_structure_prompt,
+        )
+
+        current_fields = ["activity_id", "used.input_value", "generated.output_value"]
+        examples = {"input_value": {"t": "int", "v": [1]}, "output_value": {"t": "float", "v": [2.0]}}
+        allowed = build_allowed_fields_prompt(current_fields, target_name="df")
+        table = build_task_static_field_table(current_fields)
+        values = build_example_values_prompt(examples)
+        structure = build_task_structure_prompt(
+            dynamic_schema={"step_a": {"i": ["used.input_value"], "o": ["generated.output_value"]}},
+            example_values=examples,
+            current_fields=current_fields,
+            record_description="Each record represents one task.",
+        )
+
+        combined = "\n".join([allowed, table, values, structure]).lower()
+        self.assertIn("allowed_fields", combined)
+        self.assertIn("used.input_value", combined)
+        self.assertIn("generated.output_value", combined)
+        for forbidden in ("gridsearch", "hyperparameter", "training", "model", "cfg_"):
+            self.assertNotIn(forbidden, combined)
+
+    # ── G4: agent_mode setting ────────────────────────────────────────────
+    def test_g4_agent_mode_setting_in_configs(self):
+        from flowcept.configs import AGENT_MODE
+        self.assertIn(AGENT_MODE, ("disabled", "separate", "colocated"))
+
+    # ── G5: chat router accepts thread_id ─────────────────────────────────
+    def test_g5_chat_request_has_thread_id(self):
+        from flowcept.webservice.routers.chat import ChatRequest
+        import inspect
+        inspect.signature(ChatRequest).parameters
+        # thread_id should be declared as a field (even if Optional)
+        self.assertIn("thread_id", ChatRequest.model_fields)
+
+    # ── G2-G3: run_chat accepts thread_id ─────────────────────────────────
+    def test_g2_run_chat_signature_has_thread_id(self):
+        from flowcept.agents.chat_orchestration.chat_orchestrator_service import run_chat
+        import inspect
+        sig = inspect.signature(run_chat)
+        self.assertIn("thread_id", sig.parameters)
+
+    def test_g6_chat_router_forwards_thread_id_to_orchestrator(self):
+        from flowcept.webservice.routers import chat as chat_router
+
+        payload = chat_router.ChatRequest(
+            messages=[chat_router.ChatMessage(role="user", content="hello")],
+            stream=False,
+            thread_id="thread-123",
+        )
+
+        with (
+            patch.object(chat_router, "get_chat_llm", return_value=object()),
+            patch.object(chat_router, "run_chat", return_value=iter([{"event": "done"}])) as run_chat_mock,
+        ):
+            response = chat_router.chat(payload)
+
+        self.assertEqual(response, {"message": "", "tool_trace": [], "cards": []})
+        self.assertEqual(run_chat_mock.call_args.kwargs["thread_id"], "thread-123")
+
+
+class TestLLMRoundTrips(unittest.TestCase):
+    """I4: LLM-dependent round-trip tests.  Marked @pytest.mark.llm so CI skips them."""
+
+    def _skip_if_no_llm(self):
+        api_key = AGENT.get("api_key", "")
+        if not api_key or api_key in ("?", "your-api-key-here", ""):
+            FlowceptLogger().warning("Skipping LLM round-trip test: no valid api_key in AGENT settings.")
+            self.skipTest("LLM not configured.")
+
+    @pytest.mark.llm
+    def test_i4_run_df_query_real_llm(self):
+        """run_df_query uses a real LLM to generate pandas code and returns a successful ToolResult."""
+        self._skip_if_no_llm()
+        import pandas as pd
+        from flowcept.agents.data_query_tools.in_memory_task_query_tools import run_df_query
+        from flowcept.agents.llm.builders import build_llm_model
+
+        df = pd.DataFrame({
+            "activity_id": ["train", "train", "eval"],
+            "status": ["finished", "finished", "finished"],
+            "telemetry_summary.duration_sec": [10.0, 12.5, 5.0],
+        })
+        schema = {"activity_id": {"type": "str"}, "status": {"type": "str"}}
+        llm = build_llm_model(track_tools=False)
+        result = run_df_query(
+            query="How many rows are there?",
+            df=df,
+            schema=schema,
+            value_examples={},
+            custom_user_guidance=[],
+            llm=llm,
+        )
+        self.assertIn(result.code, (201, 301), f"Expected success code, got {result.code}: {result.result}")
+
+    @pytest.mark.llm
+    def test_i4_run_chat_tool_call_round_trip(self):
+        """run_chat drives tool calling with a real LLM, yielding tool_call + token + done events."""
+        self._skip_if_no_llm()
+        if not Flowcept.services_alive():
+            FlowceptLogger().warning("Skipping run_chat round-trip: Flowcept services not alive.")
+            self.skipTest("Flowcept services not alive.")
+        from flowcept.agents.llm.builders import build_llm_model
+        from flowcept.agents.chat_orchestration.chat_orchestrator_service import run_chat
+
+        llm = build_llm_model(track_tools=False)
+        messages = [{"role": "user", "content": "How many tasks are there in the database?"}]
+        events = list(run_chat(llm, messages=messages))
+        event_types = [e["event"] for e in events]
+        self.assertIn("done", event_types, f"Expected 'done' event, got: {event_types}")
+        self.assertTrue(
+            any(e in event_types for e in ("token", "error")),
+            f"Expected 'token' or 'error' event, got: {event_types}",
+        )
+
+    @pytest.mark.llm
+    def test_i4_langgraph_thread_memory(self):
+        """thread_id enables server-side conversation memory: follow-up question recalls prior answer."""
+        self._skip_if_no_llm()
+        from flowcept.agents.llm.builders import build_llm_model
+        from flowcept.agents.chat_orchestration.chat_orchestrator_service import run_chat
+
+        import uuid
+        tid = f"test-thread-{uuid.uuid4()}"
+        llm = build_llm_model(track_tools=False)
+
+        # First turn: plant a fact
+        events1 = list(run_chat(llm, messages=[{"role": "user", "content": "My lucky number is 7777."}], thread_id=tid))
+        types1 = [e["event"] for e in events1]
+        self.assertIn("done", types1, f"First turn missing 'done': {types1}")
+
+        # Second turn: recall the fact (only new message; server owns history via MemorySaver)
+        events2 = list(run_chat(llm, messages=[{"role": "user", "content": "What is my lucky number?"}], thread_id=tid))
+        full_text = " ".join(str(e.get("data", "")) for e in events2 if e["event"] == "token")
+        self.assertIn("7777", full_text, f"Expected '7777' in follow-up response, got: {full_text!r}")
+
+
+class TestProvAgentInstrumentation(unittest.TestCase):
+    """Structural tests for PROV-AGENT enum usage.  No live services required."""
+
+    def test_prov_agent_enum_values(self):
+        from flowcept.commons.vocabulary import PROV_AGENT
+
+        self.assertEqual(PROV_AGENT.AI_MODEL_INVOCATION.value, "ai_model_invocation")
+        self.assertEqual(PROV_AGENT.AGENT_TOOL.value, "agent_tool")
+
+    def test_flowcept_llm_uses_prov_agent_enum_not_bare_string(self):
+        import inspect
+        from flowcept.instrumentation.flowcept_agent_task import FlowceptLLM
+
+        src = inspect.getsource(FlowceptLLM._our_call)
+        self.assertNotIn('"llm_task"', src, "FlowceptLLM must use PROV_AGENT.AI_MODEL_INVOCATION, not bare string")
+        self.assertIn("PROV_AGENT.AI_MODEL_INVOCATION", src)
+
+    def test_agent_flowcept_task_default_uses_prov_agent_enum(self):
+        import inspect
+        import flowcept.instrumentation.flowcept_agent_task as m
+
+        src = inspect.getsource(m.agent_flowcept_task)
+        self.assertNotIn('"agent_task"', src, "agent_flowcept_task must use PROV_AGENT.AGENT_TOOL, not bare string")
+        self.assertIn("PROV_AGENT.AGENT_TOOL", src)
+
+    def test_context_manager_comparisons_use_prov_agent_enum(self):
+        import inspect
+        from flowcept.agents.mcp.context_manager import FlowceptAgentContextManager
+
+        src = inspect.getsource(FlowceptAgentContextManager.message_handler)
+        self.assertNotIn('"llm_task"', src)
+        self.assertNotIn('"agent_task"', src)
+        self.assertIn("PROV_AGENT", src)
+
+    def test_context_manager_caches_dynamic_schema_by_workflow_id(self):
+        from flowcept.agents.mcp.context_manager import FlowceptAgentContextManager
+
+        manager = FlowceptAgentContextManager()
+        manager.message_handler(
+            {
+                "type": "task",
+                "workflow_id": "wf-a",
+                "activity_id": "step_a",
+                "used": {"input_value": 1},
+                "generated": {"output_value": 2},
+            }
+        )
+        manager.message_handler(
+            {
+                "type": "task",
+                "workflow_id": "wf-b",
+                "activity_id": "step_b",
+                "used": {"other_input": "x"},
+                "generated": {"other_output": "y"},
+            }
+        )
+
+        wf_a = manager.get_workflow_schema_snapshot("wf-a")
+        wf_b = manager.get_workflow_schema_snapshot("wf-b")
+
+        self.assertIn("step_a", wf_a["dynamic_schema"])
+        self.assertNotIn("step_b", wf_a["dynamic_schema"])
+        self.assertIn("used.input_value", wf_a["current_fields"])
+        self.assertIn("step_b", wf_b["dynamic_schema"])
+        self.assertNotIn("step_a", wf_b["dynamic_schema"])
+
+    def test_schema_mcp_tool_returns_workflow_prompt_context(self):
+        from flowcept.agents.mcp.context_manager import ctx_manager
+        from flowcept.agents.mcp.mcp_tools.schema_mcp_tools import get_workflow_schema_context
+
+        ctx_manager.reset_context()
+        ctx_manager.message_handler(
+            {
+                "type": "task",
+                "workflow_id": "wf-schema-tool",
+                "activity_id": "step_a",
+                "used": {"input_value": 1},
+                "generated": {"output_value": 2},
+            }
+        )
+
+        result = get_workflow_schema_context(workflow_id="wf-schema-tool")
+
+        self.assertEqual(result.code, 301)
+        self.assertIn("prompt_context", result.result)
+        self.assertIn("used.input_value", result.result["prompt_context"])
+        self.assertIn("generated.output_value", result.result["prompt_context"])
+
+    def test_mcp_db_query_tools_use_agent_flowcept_task(self):
+        import inspect
+        import flowcept.agents.mcp_tools.db_query_mcp_tools as m
+
+        src = inspect.getsource(m)
+        self.assertIn("agent_flowcept_task", src)
+        self.assertIn("PROV_AGENT", src)
+
+    def test_report_tools_use_agent_flowcept_task(self):
+        import inspect
+        import flowcept.agents.mcp_tools.report_tools as m
+
+        src = inspect.getsource(m)
+        self.assertIn("agent_flowcept_task", src)
+
+    def test_in_memory_task_query_mcp_tools_use_agent_flowcept_task(self):
+        import inspect
+        import flowcept.agents.mcp_tools.in_memory_task_query_mcp_tools as m
+
+        src = inspect.getsource(m)
+        self.assertIn("agent_flowcept_task", src)
+
+    def test_format_messages_handles_base_messages(self):
+        from flowcept.instrumentation.flowcept_agent_task import FlowceptLLM
+        from langchain_core.messages import HumanMessage, AIMessage, SystemMessage
+
+        msgs = [SystemMessage(content="sys"), HumanMessage(content="hi"), AIMessage(content="hello")]
+        result = FlowceptLLM._format_messages(msgs)
+        self.assertIn("hi", result)
+        self.assertIn("hello", result)
+        self.assertIn("sys", result)
+
+    def test_extract_llm_usage_normalizes_langchain_response_metadata(self):
+        from langchain_core.messages import AIMessage
+
+        from flowcept.instrumentation.flowcept_agent_task import extract_llm_usage
+
+        response = AIMessage(
+            content="answer text",
+            usage_metadata={"input_tokens": 3, "output_tokens": 2, "total_tokens": 5},
+            response_metadata={"model_name": "gpt-test", "finish_reason": "stop", "id": "req-123"},
+        )
+
+        usage = extract_llm_usage(response, input_text="abc", output_text=response.content)
+
+        self.assertEqual(usage["model"], "gpt-test")
+        self.assertEqual(usage["input_tokens"], 3)
+        self.assertEqual(usage["output_tokens"], 2)
+        self.assertEqual(usage["total_tokens"], 5)
+        self.assertEqual(usage["input_chars"], 3)
+        self.assertEqual(usage["output_chars"], 11)
+        self.assertEqual(usage["finish_reason"], "stop")
+        self.assertEqual(usage["provider_request_id"], "req-123")
+        self.assertEqual(usage["llm_model"], "gpt-test")
+        self.assertEqual(usage["llm_total_tokens"], 5)
+
+    def test_extract_llm_usage_estimates_missing_provider_tokens_from_text(self):
+        from langchain_core.messages import AIMessage
+
+        from flowcept.instrumentation.flowcept_agent_task import extract_llm_usage
+
+        usage = extract_llm_usage(
+            AIMessage(content="abcd" * 5),
+            fallback_model="model-without-token-usage",
+            input_text="abcd" * 10,
+            output_text="abcd" * 5,
+        )
+
+        self.assertEqual(usage["model"], "model-without-token-usage")
+        self.assertEqual(usage["input_tokens"], 10)
+        self.assertEqual(usage["output_tokens"], 5)
+        self.assertEqual(usage["total_tokens"], 15)
+        self.assertEqual(usage["token_count_source"], "estimated_from_chars")
+
+    def test_llm_metadata_config_drops_api_keys(self):
+        from flowcept.instrumentation.flowcept_agent_task import _extract_llm_metadata
+
+        class MinimalLLMConfig:
+            def model_dump(self):
+                return {
+                    "model": "gpt-test",
+                    "openai_api_key": "secret-key",
+                    "nested": {"api_key": "secret-key-2"},
+                }
+
+        metadata = _extract_llm_metadata(MinimalLLMConfig())
+
+        self.assertEqual(metadata["config"]["model"], "gpt-test")
+        self.assertNotIn("openai_api_key", metadata["config"])
+        self.assertNotIn("api_key", metadata["config"]["nested"])
+
+    def test_flowcept_llm_records_provider_call_as_ai_model_invocation(self):
+        import inspect
+
+        from flowcept.commons.vocabulary import PROV_AGENT
+        from flowcept.instrumentation.flowcept_agent_task import FlowceptLLM
+
+        src = inspect.getsource(FlowceptLLM._our_call)
+
+        self.assertIn("subtype=PROV_AGENT.AI_MODEL_INVOCATION", src)
+        self.assertEqual(PROV_AGENT.AI_MODEL_INVOCATION.value, "ai_model_invocation")
+
+    def test_run_chat_wraps_graph_in_flowcept_context(self):
+        """Each LangGraph execution is wrapped in a Flowcept context to get its own workflow_id."""
+        import inspect
+        from flowcept.agents.chat_orchestration import chat_orchestrator_service as svc
+
+        src = inspect.getsource(svc.run_chat)
+        # Must use Flowcept context manager, not manual WorkflowObject
+        self.assertEqual(svc.CHAT_WORKFLOW_NAME, "Flowcept LangGraph Chat")
+        self.assertNotIn("WorkflowObject", src)
+        self.assertIn("start_persistence=True", src)
+        self.assertIn("save_workflow=True", src)
+
+    def test_build_graph_does_not_accept_workflow_id(self):
+        """workflow_id is not threaded through _build_graph — Flowcept.current_workflow_id is used instead."""
+        import inspect
+        from flowcept.agents.chat_orchestration import chat_orchestrator_service as svc
+
+        sig = inspect.signature(svc._build_graph)
+        self.assertNotIn("workflow_id", sig.parameters)
+
+
+class TestContextManager(unittest.TestCase):
+
+    def test_workflow_schema_updates_on_new_activity(self):
+        """Schema cache updates when a finished task with a new activity_id arrives."""
+        from flowcept.agents.mcp.context_manager import FlowceptAgentContextManager
+        from flowcept.commons.vocabulary import Status
+
+        cm = FlowceptAgentContextManager()
+        wf_id = "test-wf-schema"
+
+        # Task with activity_id "train" — finished, has both used and generated.
+        task1 = {
+            "type": "task",
+            "task_id": "t1",
+            "workflow_id": wf_id,
+            "activity_id": "train",
+            "used": {"lr": 0.01},
+            "generated": {"loss": 0.5},
+            "ended_at": 1.0,
+            "status": Status.FINISHED,
+        }
+        cm.message_handler(task1)
+        assert wf_id in cm.context.workflow_schema_cache
+        cache_after_first = cm.context.workflow_schema_cache[wf_id]
+        assert cache_after_first is not None
+
+        # Same activity_id again — schema cache should NOT update again.
+        task2 = dict(task1, task_id="t2", used={"lr": 0.001}, generated={"loss": 0.4})
+        cm.message_handler(task2)
+        assert cm.context.workflow_schema_cache[wf_id] is cache_after_first
+
+        # New activity_id "evaluate" — schema cache SHOULD update.
+        task3 = {
+            "type": "task",
+            "task_id": "t3",
+            "workflow_id": wf_id,
+            "activity_id": "evaluate",
+            "used": {"model": "best"},
+            "generated": {"accuracy": 0.95},
+            "ended_at": 2.0,
+            "status": Status.FINISHED,
+        }
+        cm.message_handler(task3)
+        assert cm.context.workflow_schema_cache[wf_id] is not cache_after_first
+
+    def test_workflow_finish_triggers_schema_persist(self):  # noqa: D102
+        """A workflow message with status=FINISHED triggers persist_workflow_schema_snapshot."""
+        from unittest.mock import patch
+        from flowcept.agents.mcp.context_manager import FlowceptAgentContextManager
+        from flowcept.commons.vocabulary import Status
+
+        cm = FlowceptAgentContextManager()
+        wf_id = "test-wf-finish"
+
+        # Seed schema cache so persist has something to work with.
+        cm.context.workflow_schema_cache[wf_id] = {"dynamic_schema": {}, "value_examples": {}, "current_fields": []}
+
+        wf_msg = {"type": "workflow", "workflow_id": wf_id, "status": Status.FINISHED}
+        with patch.object(cm, "persist_workflow_schema_snapshot") as mock_persist:
+            cm.message_handler(wf_msg)
+            mock_persist.assert_called_once_with(wf_id)
diff --git a/tests/api/db_api_test.py b/tests/api/db_api_test.py
index 4f785c58..ae0b8a1a 100644
--- a/tests/api/db_api_test.py
+++ b/tests/api/db_api_test.py
@@ -5,7 +5,8 @@
 from flowcept.commons.flowcept_dataclasses.task_object import TaskObject
 from flowcept.commons.daos.docdb_dao.docdb_dao_base import DocumentDBDAO
 from flowcept import BlobObject, Flowcept, WorkflowObject, AgentObject
-from flowcept.configs import MONGO_ENABLED
+from flowcept.commons.vocabulary import Status
+from flowcept.configs import MONGO_ENABLED, LMDB_ENABLED
 from flowcept.flowceptor.telemetry_capture import TelemetryCapture
 
 
@@ -86,14 +87,26 @@ def test_flowcept_agent_instantiation(self):
         agent_name = "InstantiatedAgent"
 
         with Flowcept(agent_id=agent_id, agent_name=agent_name, save_workflow=False, start_persistence=False):
-            pass
+            agent_msgs = [msg for msg in Flowcept.buffer if msg.get("type") == "agent"]
 
-        agent_obj = Flowcept.db.get_agent_object(agent_id=agent_id)
-        assert agent_obj is not None
-        assert agent_obj.name == agent_name
-        assert agent_obj.agent_id == agent_id
-        assert agent_obj.registered_at is not None
+        assert len(agent_msgs) == 1
+        assert agent_msgs[0]["agent_id"] == agent_id
+        assert agent_msgs[0]["name"] == agent_name
+        assert agent_msgs[0]["registered_at"] is not None
+
+    def test_flowcept_agent_name_generates_agent_id(self):
+        agent_name = "GeneratedIdAgent"
+
+        with Flowcept(agent_name=agent_name, save_workflow=False, start_persistence=False) as fc:
+            agent_id = fc.agent_id
+            agent_msgs = [msg for msg in Flowcept.buffer if msg.get("type") == "agent"]
+
+        assert agent_id is not None
+        assert len(agent_msgs) == 1
+        assert agent_msgs[0]["agent_id"] == agent_id
+        assert agent_msgs[0]["name"] == agent_name
 
+    def test_workflow_dao_update_fields(self):
         wf2_id = str(uuid4())
         print(wf2_id)
 
@@ -148,13 +161,39 @@ def test_workflow_to_dict_redacts_sensitive_settings(self):
         assert "redis-pass" not in str(wf_dict)
         assert "agent-key" not in str(wf_dict)
 
+    def test_workflow_dynamic_schema_snapshot_roundtrip(self):
+        workflow_id = str(uuid4())
+        wf = WorkflowObject()
+        wf.workflow_id = workflow_id
+        wf.name = "schema snapshot workflow"
+        wf.custom_metadata = {"owner": "existing"}
+        assert Flowcept.db.insert_or_update_workflow(wf)
+
+        snapshot = {
+            "dynamic_schema": {"step_a": {"i": ["used.input_value"], "o": ["generated.output_value"]}},
+            "value_examples": {"input_value": {"t": "int", "v": [1]}},
+            "current_fields": ["workflow_id", "activity_id", "used.input_value", "generated.output_value"],
+        }
+
+        assert Flowcept.db.save_workflow_domain_data_schema(workflow_id, snapshot)
+
+        loaded = Flowcept.db.get_workflow_domain_data_schema(workflow_id)
+        wf_obj = Flowcept.db.get_workflow_object(workflow_id)
+
+        assert loaded == snapshot
+        assert wf_obj.workflow_domain_data_schema == snapshot
+        assert wf_obj.name == "schema snapshot workflow"
+        assert wf_obj.custom_metadata["owner"] == "existing"
+        assert "dynamic_schema_snapshot" not in wf_obj.custom_metadata
+
     @unittest.skipIf(not MONGO_ENABLED, "MongoDB is disabled")
     def test_save_blob(self):
         import pickle
 
         obj = pickle.dumps(OurObject())
 
-        obj_id = Flowcept.db.save_or_update_object(object=obj, save_data_in_collection=True)
+        blob_obj = Flowcept.db._insert_or_update_object(BlobObject(), object=obj, save_data_in_collection=True)
+        obj_id = blob_obj.object_id
         print(obj_id)
 
         obj_docs = Flowcept.db.query(filter={"object_id": obj_id}, collection="objects")
@@ -165,7 +204,7 @@ def test_save_blob(self):
     def test_blob_object_query_and_get(self):
         payload = b"blob-content"
         with Flowcept(workflow_name="blob_demo"):
-            obj_id = Flowcept.db.save_or_update_object(
+            obj_id = Flowcept.insert_or_update_object(
                 object=payload,
                 task_id="task_blob_1",
                 object_type="artifact",
@@ -190,35 +229,36 @@ def test_blob_object_query_and_get(self):
             assert blob.version == 0
 
     @unittest.skipIf(not MONGO_ENABLED, "MongoDB is disabled")
-    def test_save_blob_emits_object_metadata_message(self):
-        object_messages = []
-        with Flowcept(workflow_name="blob_message_demo", start_persistence=False):
-            with patch.object(Flowcept, "emit_message", side_effect=object_messages.append):
-                obj_id = Flowcept.db.save_or_update_object(
-                    object=b"blob-message-content",
-                    task_id="task_blob_message",
-                    object_type="artifact",
-                    custom_metadata={"owner": "tests"},
-                    save_data_in_collection=True,
-                )
-
-        assert len(object_messages) == 1
-        object_msg = object_messages[0]
-        assert object_msg["object_id"] == obj_id
-        assert object_msg["object_type"] == "artifact"
-        assert object_msg["task_id"] == "task_blob_message"
-        assert object_msg["workflow_id"] is not None
-        assert object_msg["custom_metadata"]["owner"] == "tests"
-        assert "data" not in object_msg
+    def test_insert_object_emits_message_with_timing(self):
+        with Flowcept(workflow_name="blob_message_demo", start_persistence=False) as f:
+            obj_id = Flowcept.insert_or_update_object(
+                object=b"blob-message-content",
+                task_id="task_blob_message",
+                object_type="artifact",
+                custom_metadata={"owner": "tests"},
+                save_data_in_collection=True,
+            )
+            msgs = list(f.get_buffer())
+
+        object_msgs = [m for m in msgs if m.get("type") == "object"]
+        assert len(object_msgs) == 1
+        msg = object_msgs[0]
+        assert msg["object_id"] == obj_id
+        assert msg["object_type"] == "artifact"
+        assert msg["task_id"] == "task_blob_message"
+        assert msg["workflow_id"] is not None
+        assert msg["custom_metadata"]["owner"] == "tests"
+        assert "data" not in msg
+        assert "created_at" in msg
+        assert "updated_at" in msg
 
     @unittest.skipIf(not MONGO_ENABLED, "MongoDB is disabled")
     def test_blob_object_version_control(self):
         obj_id = str(uuid4())
         payload_v0 = b"v0"
-        Flowcept.db.save_or_update_object(
+        Flowcept.db._insert_or_update_object(
+            BlobObject(object_id=obj_id, object_type="artifact"),
             object=payload_v0,
-            object_id=obj_id,
-            object_type="artifact",
             save_data_in_collection=True,
         )
         blob_v0 = Flowcept.db.get_blob_object(obj_id)
@@ -227,10 +267,9 @@ def test_blob_object_version_control(self):
         assert doc_v0["data"] == payload_v0
 
         payload_v1 = b"v1"
-        Flowcept.db.save_or_update_object(
+        Flowcept.db._insert_or_update_object(
+            BlobObject(object_id=obj_id, object_type="artifact"),
             object=payload_v1,
-            object_id=obj_id,
-            object_type="artifact",
             save_data_in_collection=True,
         )
         blob_v1 = Flowcept.db.get_blob_object(obj_id)
@@ -243,7 +282,7 @@ def test_blob_object_store_in_gridfs(self):
         with Flowcept(workflow_name="blob_gridfs_test"):
             expected_wf_id = Flowcept.current_workflow_id
             payload = b"gridfs-content-v0"
-            obj_id = Flowcept.db.save_or_update_object(
+            obj_id = Flowcept.insert_or_update_object(
                 object=payload,
                 task_id="task_gridfs_1",
                 object_type="artifact",
@@ -266,7 +305,7 @@ def test_blob_object_store_in_gridfs_update(self):
             expected_wf_id = Flowcept.current_workflow_id
             obj_id = str(uuid4())
             payload_v0 = b"gridfs-content-v0"
-            Flowcept.db.save_or_update_object(
+            Flowcept.insert_or_update_object(
                 object=payload_v0,
                 object_id=obj_id,
                 object_type="artifact",
@@ -278,7 +317,7 @@ def test_blob_object_store_in_gridfs_update(self):
             assert retrieved_v0 == payload_v0
 
             payload_v1 = b"gridfs-content-v1"
-            Flowcept.db.save_or_update_object(
+            Flowcept.insert_or_update_object(
                 object=payload_v1,
                 object_id=obj_id,
                 object_type="artifact",
@@ -299,17 +338,17 @@ def test_blob_object_store_in_gridfs_update(self):
     def test_blob_fingerprint_and_equality_in_object(self):
         with Flowcept(workflow_name="blob_fingerprint_test"):
             payload = b"equal-payload"
-            obj_id_a = Flowcept.db.save_or_update_object(
+            obj_id_a = Flowcept.insert_or_update_object(
                 object=payload,
                 object_type="artifact",
                 save_data_in_collection=True,
             )
-            obj_id_b = Flowcept.db.save_or_update_object(
+            obj_id_b = Flowcept.insert_or_update_object(
                 object=payload,
                 object_type="artifact",
                 save_data_in_collection=True,
             )
-            obj_id_c = Flowcept.db.save_or_update_object(
+            obj_id_c = Flowcept.insert_or_update_object(
                 object=b"different-payload",
                 object_type="artifact",
                 save_data_in_collection=True,
@@ -327,17 +366,17 @@ def test_blob_fingerprint_and_equality_in_object(self):
     def test_blob_fingerprint_and_equality_gridfs(self):
         with Flowcept(workflow_name="blob_fingerprint_gridfs_test"):
             payload = b"gridfs-equal-payload"
-            obj_id_a = Flowcept.db.save_or_update_object(
+            obj_id_a = Flowcept.insert_or_update_object(
                 object=payload,
                 object_type="artifact",
                 save_data_in_collection=False,
             )
-            obj_id_b = Flowcept.db.save_or_update_object(
+            obj_id_b = Flowcept.insert_or_update_object(
                 object=payload,
                 object_type="artifact",
                 save_data_in_collection=False,
             )
-            obj_id_c = Flowcept.db.save_or_update_object(
+            obj_id_c = Flowcept.insert_or_update_object(
                 object=b"gridfs-different-payload",
                 object_type="artifact",
                 save_data_in_collection=False,
@@ -355,7 +394,7 @@ def test_blob_fingerprint_and_equality_gridfs(self):
     def test_ml_model_aliases(self):
         payload = b"model-bytes"
         with Flowcept(workflow_name="ml_model_alias_test"):
-            obj_id = Flowcept.db.save_or_update_ml_model(
+            obj_id = Flowcept.insert_or_update_ml_model(
                 object=payload,
                 task_id="task_model_1",
                 save_data_in_collection=True,
@@ -378,7 +417,7 @@ def test_ml_model_aliases(self):
     def test_dataset_aliases(self):
         payload = b"dataset-bytes"
         with Flowcept(workflow_name="dataset_alias_test"):
-            obj_id = Flowcept.db.save_or_update_dataset(
+            obj_id = Flowcept.insert_or_update_dataset(
                 object=payload,
                 task_id="task_dataset_1",
                 save_data_in_collection=True,
@@ -401,7 +440,7 @@ def test_dataset_aliases(self):
     def test_save_object_defaults_workflow_id_from_current_workflow(self):
         with Flowcept(workflow_name="blob_default_wf_test"):
             current_wf_id = Flowcept.current_workflow_id
-            obj_id = Flowcept.db.save_or_update_object(
+            obj_id = Flowcept.insert_or_update_object(
                 object=b"default-wf-content",
                 task_id="task_default_wf",
                 object_type="artifact",
@@ -411,11 +450,34 @@ def test_save_object_defaults_workflow_id_from_current_workflow(self):
         blob = Flowcept.db.get_blob_object(obj_id)
         assert blob.workflow_id == current_wf_id
 
+    @unittest.skipIf(not MONGO_ENABLED, "MongoDB is disabled")
+    def test_object_stores_created_at_without_control_version(self):
+        with Flowcept(workflow_name="blob_timestamps"):
+            obj_id = Flowcept.insert_or_update_object(
+                object=b"payload",
+                object_type="artifact",
+                save_data_in_collection=True,
+            )
+            doc = Flowcept.db.query(filter={"object_id": obj_id}, collection="objects")[0]
+            assert "created_at" in doc
+            assert "updated_at" in doc
+            created_at_v0 = doc["created_at"]
+
+            Flowcept.insert_or_update_object(
+                object=b"payload-v1",
+                object_id=obj_id,
+                object_type="artifact",
+                save_data_in_collection=True,
+            )
+            doc_v1 = Flowcept.db.query(filter={"object_id": obj_id}, collection="objects")[0]
+            assert doc_v1["created_at"] == created_at_v0
+            assert doc_v1["updated_at"] >= created_at_v0
+
     @unittest.skipIf(not MONGO_ENABLED, "MongoDB is disabled")
     def test_control_version_first_insert(self):
         with Flowcept(workflow_name="blob_control_first_insert"):
             payload = b"cv-v1"
-            obj_id = Flowcept.db.save_or_update_object(
+            obj_id = Flowcept.insert_or_update_object(
                 object=payload,
                 task_id="task_cv_1",
                 object_type="artifact",
@@ -438,13 +500,13 @@ def test_control_version_update_and_history_in_object(self):
         with Flowcept(workflow_name="blob_control_update_in_object"):
             payload_v1 = b"cv-in-object-v1"
             payload_v2 = b"cv-in-object-v2"
-            obj_id = Flowcept.db.save_or_update_object(
+            obj_id = Flowcept.insert_or_update_object(
                 object=payload_v1,
                 object_type="artifact",
                 save_data_in_collection=True,
                 control_version=True,
             )
-            Flowcept.db.save_or_update_object(
+            Flowcept.insert_or_update_object(
                 object=payload_v2,
                 object_id=obj_id,
                 object_type="artifact",
@@ -468,13 +530,13 @@ def test_control_version_update_and_history_gridfs(self):
         with Flowcept(workflow_name="blob_control_update_gridfs"):
             payload_v1 = b"cv-gridfs-v1"
             payload_v2 = b"cv-gridfs-v2"
-            obj_id = Flowcept.db.save_or_update_object(
+            obj_id = Flowcept.insert_or_update_object(
                 object=payload_v1,
                 object_type="artifact",
                 save_data_in_collection=False,
                 control_version=True,
             )
-            Flowcept.db.save_or_update_object(
+            Flowcept.insert_or_update_object(
                 object=payload_v2,
                 object_id=obj_id,
                 object_type="artifact",
@@ -491,12 +553,12 @@ def test_control_version_update_and_history_gridfs(self):
     @unittest.skipIf(not MONGO_ENABLED, "MongoDB is disabled")
     def test_get_object_history(self):
         with Flowcept(workflow_name="blob_list_versions"):
-            obj_id = Flowcept.db.save_or_update_object(
+            obj_id = Flowcept.insert_or_update_object(
                 object=b"lv-v1",
                 save_data_in_collection=True,
                 control_version=True,
             )
-            Flowcept.db.save_or_update_object(
+            Flowcept.insert_or_update_object(
                 object=b"lv-v2",
                 object_id=obj_id,
                 save_data_in_collection=True,
@@ -511,7 +573,7 @@ def test_get_object_history(self):
     @unittest.skipIf(not MONGO_ENABLED, "MongoDB is disabled")
     def test_control_version_retry_on_cas_mismatch(self):
         with Flowcept(workflow_name="blob_cas_retry"):
-            obj_id = Flowcept.db.save_or_update_object(
+            obj_id = Flowcept.insert_or_update_object(
                 object=b"cas-v1",
                 save_data_in_collection=True,
                 control_version=True,
@@ -527,7 +589,7 @@ def flaky_update(*args, **kwargs):
                 return original(*args, **kwargs)
 
             with patch.object(dao, "_update_with_optional_transaction", side_effect=flaky_update):
-                Flowcept.db.save_or_update_object(
+                Flowcept.insert_or_update_object(
                     object=b"cas-v2",
                     object_id=obj_id,
                     save_data_in_collection=True,
@@ -565,7 +627,7 @@ def test_tasks_recursive(self):
                 ],
             },
         }
-        d = Flowcept.db._dao().get_tasks_recursive("e9a3b567-cb56-4884-ba14-f137c0260191", mapping=mapping)
+        Flowcept.db._dao().get_tasks_recursive("e9a3b567-cb56-4884-ba14-f137c0260191", mapping=mapping)
 
     @unittest.skipIf(not MONGO_ENABLED, "MongoDB is disabled")
     def test_dump(self):
@@ -589,3 +651,150 @@ def test_dump(self):
         Flowcept.db._dao().delete_tasks_with_filter(_filter)
         c1 = Flowcept.db._dao().count_tasks()
         assert c0 == c1
+
+    def test_dashboard_crud_both_db_paths(self):
+        """Dashboard CRUD works on both MongoDBDAO and LMDBDAO."""
+        from flowcept.commons.daos.docdb_dao.mongodb_dao import MongoDBDAO
+        from flowcept.commons.daos.docdb_dao.lmdb_dao import LMDBDAO
+
+        dashboard_id = str(uuid4())
+        doc = {
+            "dashboard_id": dashboard_id,
+            "dashboard_type": "common_workflow",
+            "name": "test-dash",
+            "charts": [],
+            "layout": [],
+        }
+
+        if MONGO_ENABLED:
+            dao = MongoDBDAO()
+            assert dao.save_dashboard(doc)
+            result = dao.get_dashboard(dashboard_id)
+            assert result is not None
+            assert result["name"] == "test-dash"
+            all_docs = dao.list_dashboards()
+            assert any(d["dashboard_id"] == dashboard_id for d in all_docs)
+            filtered = dao.list_dashboards(filter={"dashboard_type": "common_workflow"})
+            assert any(d["dashboard_id"] == dashboard_id for d in filtered)
+            assert dao.delete_dashboard(dashboard_id)
+            assert dao.get_dashboard(dashboard_id) is None
+            dao.close()
+
+        if LMDB_ENABLED:
+            dao = LMDBDAO()
+            assert dao.save_dashboard(doc)
+            result = dao.get_dashboard(dashboard_id)
+            assert result is not None
+            assert result["name"] == "test-dash"
+            all_docs = dao.list_dashboards()
+            assert any(d["dashboard_id"] == dashboard_id for d in all_docs)
+            filtered = dao.list_dashboards(filter={"dashboard_type": "common_workflow"})
+            assert any(d["dashboard_id"] == dashboard_id for d in filtered)
+            assert dao.delete_dashboard(dashboard_id)
+            assert dao.get_dashboard(dashboard_id) is None
+            dao.close()
+
+    def test_dbapi_analytics_methods(self):
+        """DBAPI exposes task_summary, derive_campaigns, derive_agents, telemetry_timeseries."""
+        if not Flowcept.services_alive():
+            import pytest
+            pytest.skip("No live services.")
+        db = Flowcept.db
+        summary = db.task_summary({})
+        assert isinstance(summary, dict)
+        assert "count" in summary
+        assert "status_counts" in summary
+        assert "activity_stats" in summary
+        assert "time_range" in summary
+
+        campaigns = db.derive_campaigns()
+        assert isinstance(campaigns, list)
+
+        agents = db.derive_agents()
+        assert isinstance(agents, list)
+
+        rows = db.telemetry_timeseries({}, fields=["started_at"], x_field="started_at", limit=10)
+        assert isinstance(rows, list)
+
+    def test_dbapi_get_dao_instance(self):
+        """DBAPI.get_dao_instance() returns the DocumentDBDAO singleton."""
+        if not Flowcept.services_alive():
+            import pytest
+            pytest.skip("No live services.")
+        from flowcept.flowcept_api.db_api import DBAPI
+        dao = DBAPI.get_dao_instance()
+        assert isinstance(dao, DocumentDBDAO)
+        dashboard_id = str(uuid4())
+        doc = {"dashboard_id": dashboard_id, "name": "test", "charts": []}
+        assert dao.save_dashboard(doc) is True
+        fetched = dao.get_dashboard(dashboard_id)
+        assert fetched is not None
+        assert fetched["dashboard_id"] == dashboard_id
+        listed = dao.list_dashboards()
+        assert any(d["dashboard_id"] == dashboard_id for d in listed)
+        assert dao.delete_dashboard(dashboard_id) is True
+        assert dao.get_dashboard(dashboard_id) is None
+
+    def test_dbapi_resolve_chart_data(self):
+        """DBAPI.resolve_chart_data returns rows and count for basic specs."""
+        if not Flowcept.services_alive():
+            import pytest
+            pytest.skip("No live services.")
+        from flowcept.flowcept_api.db_api import DBAPI
+        db = DBAPI()
+        result = db.resolve_chart_data({"source": "tasks", "filter": {}})
+        assert isinstance(result, dict)
+        assert "rows" in result and "count" in result
+        assert isinstance(result["rows"], list)
+        assert isinstance(result["count"], int)
+
+        grouped = db.resolve_chart_data({
+            "source": "tasks",
+            "group_by": "status",
+            "metrics": [{"field": "", "agg": "count"}],
+        })
+        assert isinstance(grouped, dict)
+        assert "rows" in grouped and "count" in grouped
+
+    def test_docdb_dao_utils(self):
+        """Shared DAO helpers in docdb_dao_utils are importable and correct."""
+        import pytest
+        from flowcept.commons.daos.docdb_dao.docdb_dao_utils import (
+            to_epoch,
+            get_nested,
+        )
+        # epoch-ms → epoch-sec
+        assert to_epoch(1_000_000_000_000) == pytest.approx(1_000_000_000.0)
+        # already epoch-sec
+        assert to_epoch(1_000_000_000.0) == pytest.approx(1_000_000_000.0)
+        # ISO string (Unix 1000000000 = 2001-09-09T01:46:40Z)
+        iso_result = to_epoch("2001-09-09T01:46:40+00:00")
+        assert iso_result is not None
+        assert abs(iso_result - 1_000_000_000.0) < 60  # within 1 minute of expected
+        # None passthrough
+        assert to_epoch(None) is None
+        # dot-notated nested field
+        assert get_nested({"a": {"b": 1}}, "a.b") == 1
+        assert get_nested({"a": {"b": 1}}, "a.c") is None
+        assert get_nested({"a": 1}, "a.b") is None
+
+    def test_workflow_is_finished(self):
+        # A freshly constructed WorkflowObject (as sent through the MQ) is never finished.
+        wf = WorkflowObject()
+        assert not wf.workflow_is_finished(), (
+            "WorkflowObject.to_dict() never sets status, so workflow_is_finished() "
+            "must return False for a plain workflow message — if this fails, "
+            "the MQ publish path now sets status=FINISHED and the dead-logic is resolved."
+        )
+
+        # Only an explicit status=FINISHED makes it finished.
+        wf_finished = WorkflowObject.from_dict({"status": Status.FINISHED})
+        assert wf_finished.workflow_is_finished()
+
+        # Raw string value (as stored in DB docs) also matches because Status is a str enum.
+        wf_finished_str = WorkflowObject.from_dict({"status": "FINISHED"})
+        assert wf_finished_str.workflow_is_finished()
+
+        # Any other status is not finished.
+        wf_running = WorkflowObject.from_dict({"status": "RUNNING"})
+        assert not wf_running.workflow_is_finished()
diff --git a/tests/api/flowcept_api_test.py b/tests/api/flowcept_api_test.py
index e7d08db3..819a5d6e 100644
--- a/tests/api/flowcept_api_test.py
+++ b/tests/api/flowcept_api_test.py
@@ -93,7 +93,7 @@ def test_continuous_run(self):
             while True:
                 n = np.random.rand()
                 o1 = sum_one_(x=n)
-                o2 = mult_two_(**o1)
+                mult_two_(**o1)
                 sleep(10)
 
     def test_simple_all_consumers(self):
@@ -137,3 +137,66 @@ def test_runtime_query(self):
                 tasks = Flowcept.db.get_tasks_from_current_workflow()
                 assert len(tasks) == (i+1)
         assert len(Flowcept.db.get_tasks_from_current_workflow()) == N
+
+
+class RabbitMQDaoTest(unittest.TestCase):
+    """Direct publish/subscribe tests for MQDaoRabbitMQ.
+
+    Skipped automatically when MQ_TYPE != 'rabbitmq' so the suite stays green
+    on Redis/Kafka configurations.
+    """
+
+    def setUp(self):
+        from flowcept.configs import MQ_TYPE
+
+        if MQ_TYPE != "rabbitmq":
+            self.skipTest(f"MQ_TYPE={MQ_TYPE!r}; skipping RabbitMQ-specific tests.")
+
+    def test_rabbitmq_liveness(self):
+        """MQDaoRabbitMQ.liveness_test() returns True when broker is reachable."""
+        from flowcept.commons.daos.mq_dao.mq_dao_rabbitmq import MQDaoRabbitMQ
+
+        dao = MQDaoRabbitMQ()
+        assert dao.liveness_test(), "RabbitMQ broker is not reachable."
+
+    def test_rabbitmq_publish_subscribe(self):
+        """Messages published by MQDaoRabbitMQ are received by a subscribed consumer."""
+        from threading import Thread
+        from flowcept.commons.daos.mq_dao.mq_dao_rabbitmq import MQDaoRabbitMQ
+
+        received = []
+        n_messages = 3
+
+        producer = MQDaoRabbitMQ()
+        consumer = MQDaoRabbitMQ()
+        consumer.subscribe()
+
+        def _listen():
+            def _handler(msg):
+                received.append(msg)
+                return len(received) < n_messages
+
+            consumer.message_listener(_handler)
+
+        t = Thread(target=_listen, daemon=True)
+        t.start()
+        sleep(0.3)  # allow consumer to bind before publishing
+
+        for i in range(n_messages):
+            producer.send_message({"seq": i, "data": f"msg_{i}"})
+
+        t.join(timeout=10)
+        assert len(received) == n_messages, f"Expected {n_messages} msgs, got {len(received)}"
+        assert {m["seq"] for m in received} == set(range(n_messages))
+
+    @unittest.skipIf(not MONGO_ENABLED, "MongoDB is disabled")
+    def test_rabbitmq_full_workflow(self):
+        """A decorated task flowing through RabbitMQ persists correctly to MongoDB."""
+        assert Flowcept.services_alive()
+        with Flowcept(workflow_name="test_rabbitmq_workflow"):
+            sum_one(42)
+
+        assert assert_by_querying_tasks_until(
+            {"workflow_id": Flowcept.current_workflow_id},
+            condition_to_evaluate=lambda docs: len(docs) == 1,
+        )
diff --git a/tests/instrumentation_tests/flowcept_explicit_tasks_test.py b/tests/instrumentation_tests/flowcept_explicit_tasks_test.py
index be273991..331f8748 100644
--- a/tests/instrumentation_tests/flowcept_explicit_tasks_test.py
+++ b/tests/instrumentation_tests/flowcept_explicit_tasks_test.py
@@ -45,6 +45,23 @@ def test_explicit_task_custom_metadata_non_serializable_is_sanitized(self):
         assert isinstance(value, str)
         assert value.startswith("object_instance_id_")
 
+    def test_explicit_task_can_opt_out_of_telemetry_capture(self):
+        with Flowcept(start_persistence=False):
+            with FlowceptTask(activity_id="default_telemetry", used={"a": 1}) as task_ctx:
+                task_ctx.end(generated={"b": 2})
+            with FlowceptTask(activity_id="no_telemetry", used={"a": 2}, capture_telemetry=False) as task_ctx:
+                task_ctx.end(generated={"b": 3})
+
+            tasks = [msg for msg in Flowcept.buffer if isinstance(msg, dict) and msg.get("type") == "task"]
+
+        default_task = next(task for task in tasks if task["activity_id"] == "default_telemetry")
+        no_telemetry_task = next(task for task in tasks if task["activity_id"] == "no_telemetry")
+        if configs.TELEMETRY_ENABLED:
+            assert "telemetry_at_start" in default_task
+            assert "telemetry_at_end" in default_task
+        assert "telemetry_at_start" not in no_telemetry_task
+        assert "telemetry_at_end" not in no_telemetry_task
+
     @pytest.mark.safeoffline
     def test_custom_tasks(self):
         if not configs.DUMP_BUFFER_ENABLED:
@@ -53,7 +70,7 @@ def test_custom_tasks(self):
         flowcept = Flowcept(start_persistence=False, save_workflow=True, workflow_name="MyFirstWorkflow").start()
 
         agent1 = str(uuid.uuid4())
-        t1 = FlowceptTask(activity_id="super_func1", used={"x":1}, agent_id=agent1, tags=["tag1"]).send()
+        FlowceptTask(activity_id="super_func1", used={"x":1}, agent_id=agent1, tags=["tag1"]).send()
 
         with FlowceptTask(activity_id="super_func2", used={"y": 1}, agent_id=agent1, tags=["tag2"]) as t2:
             sleep(0.5)
@@ -72,12 +89,37 @@ def test_custom_tasks(self):
             read_args["workflow_id"] = workflow_id
 
         flowcept_messages = Flowcept.read_buffer_file(**read_args)
-        assert len(flowcept_messages) == 4
+        # 1 workflow start + 3 tasks + 1 workflow end = 5
+        assert len(flowcept_messages) == 5
 
+    @pytest.mark.safeoffline
+    def test_workflow_start_end_fields(self):
+        """Workflow messages must carry started_at on start and ended_at+status=FINISHED on stop."""
+        if not configs.DUMP_BUFFER_ENABLED:
+            self.skipTest("Skipping: project.dump_buffer.enabled is false.")
+
+        flowcept = Flowcept(start_persistence=False, save_workflow=True).start()
+        workflow_id = Flowcept.current_workflow_id
+        flowcept.stop()
+
+        read_args = {"file_path": configs.DUMP_BUFFER_PATH}
+        if configs.APPEND_WORKFLOW_ID_TO_PATH or configs.APPEND_ID_TO_PATH:
+            read_args["consolidate"] = True
+            read_args["workflow_id"] = workflow_id
+
+        messages = Flowcept.read_buffer_file(**read_args)
+        wf_messages = [m for m in messages if m.get("type") == "workflow"]
+
+        start_msg = next((m for m in wf_messages if "started_at" in m and "ended_at" not in m), None)
+        end_msg = next((m for m in wf_messages if "ended_at" in m), None)
+
+        assert start_msg is not None, "No workflow start message with started_at found."
+        assert end_msg is not None, "No workflow end message with ended_at found."
+        assert end_msg.get("status") == Status.FINISHED, "Workflow end message must have status=FINISHED."
 
     @pytest.mark.safeoffline
     def test_data_files(self):
-        with Flowcept() as f:
+        with Flowcept():
             used_args = {"a": 1}
             with FlowceptTask(used=used_args) as t:
                 repo_root = Path(__file__).resolve().parents[2]
diff --git a/tests/instrumentation_tests/ml_tests/dl_trainer.py b/tests/instrumentation_tests/ml_tests/dl_trainer.py
index 61e28548..623ba6e3 100644
--- a/tests/instrumentation_tests/ml_tests/dl_trainer.py
+++ b/tests/instrumentation_tests/ml_tests/dl_trainer.py
@@ -208,7 +208,7 @@ def model_fit(
         test_data, _ = batch
         result = test_info.copy()
 
-        best_obj_id = Flowcept.db.save_or_update_torch_model(model, task_id=task_id, workflow_id=workflow_id, custom_metadata=result)
+        best_obj_id = Flowcept.insert_or_update_torch_model(model, task_id=task_id, workflow_id=workflow_id, custom_metadata=result)
         result.update(
             {
                 "best_obj_id": best_obj_id,
diff --git a/tests/instrumentation_tests/ml_tests/ml_decorator_test.py b/tests/instrumentation_tests/ml_tests/ml_decorator_test.py
index 4c953d2f..3490c6d2 100644
--- a/tests/instrumentation_tests/ml_tests/ml_decorator_test.py
+++ b/tests/instrumentation_tests/ml_tests/ml_decorator_test.py
@@ -6,7 +6,7 @@
 
 from torch import nn
 
-from flowcept import Flowcept
+from flowcept import BlobObject, Flowcept
 from flowcept.configs import MONGO_ENABLED
 from tests.instrumentation_tests.ml_tests.dl_trainer import ModelTrainer, MyNet
 
@@ -15,7 +15,8 @@ class MLDecoratorTests(unittest.TestCase):
     @unittest.skipIf(not MONGO_ENABLED, "MongoDB is disabled")
     def test_torch_save_n_load(self):
         model = nn.Module()
-        model_id = Flowcept.db.save_or_update_torch_model(model)
+        blob_obj = Flowcept.db._insert_or_update_torch_model(model, BlobObject())
+        model_id = blob_obj.object_id
         new_model = nn.Module()
         doc = Flowcept.db.load_torch_model(model=new_model, object_id=model_id)
         print(doc)
diff --git a/tests/instrumentation_tests/ml_tests/single_layer_perceptron_test.py b/tests/instrumentation_tests/ml_tests/single_layer_perceptron_test.py
index 19ea33ac..a056d8f5 100644
--- a/tests/instrumentation_tests/ml_tests/single_layer_perceptron_test.py
+++ b/tests/instrumentation_tests/ml_tests/single_layer_perceptron_test.py
@@ -4,7 +4,6 @@
 import random
 
 import pytest
-from uuid import uuid4
 
 pytest.importorskip("torch")
 
@@ -92,7 +91,7 @@ def get_dataset(n_samples, split_ratio):
     y_train, y_val = y[:n_train], y[n_train:]
     dataset_task_id = get_current_context_task_id()
     custom_metadata = {"n_samples": n_samples, "split_ratio": split_ratio}
-    dataset_object_id = Flowcept.db.save_or_update_dataset(
+    dataset_object_id = Flowcept.insert_or_update_dataset(
         object={
             "x_train": x_train,
             "y_train": y_train,
@@ -132,13 +131,12 @@ def submit_gridsearch_job(
     source_agent_id=None,
 ):
     """Simulate submitting a training job to an HPC system."""
-    from uuid import uuid4
     configs = [
-        {"epochs": 2, "learning_rate": 0.01, "n_input_neurons": 1},
-        {"epochs": 4, "learning_rate": 0.03, "n_input_neurons": 1},
-        {"epochs": 6, "learning_rate": 0.08, "n_input_neurons": 2},
-        {"epochs": 10, "learning_rate": 0.12, "n_input_neurons": 2},
-        {"epochs": 14, "learning_rate": 0.20, "n_input_neurons": 2},
+        {"config_id": "cfg_1", "epochs": 2, "learning_rate": 0.01, "n_input_neurons": 1},
+        {"config_id": "cfg_2", "epochs": 4, "learning_rate": 0.03, "n_input_neurons": 1},
+        {"config_id": "cfg_3", "epochs": 6, "learning_rate": 0.08, "n_input_neurons": 2},
+        {"config_id": "cfg_4", "epochs": 10, "learning_rate": 0.12, "n_input_neurons": 2},
+        {"config_id": "cfg_5", "epochs": 14, "learning_rate": 0.20, "n_input_neurons": 2},
     ]
     configs = configs[:n_configs]
     assert len(configs) == n_configs
@@ -195,7 +193,7 @@ def train_and_validate(
             }
             if config_id is not None:
                 custom_metadata["config_id"] = config_id
-            torch_model_object_id = Flowcept.db.save_or_update_torch_model(
+            torch_model_object_id = Flowcept.insert_or_update_torch_model(
                 model=model,
                 object_id=torch_model_object_id,
                 task_id=current_task_id,
@@ -203,7 +201,7 @@ def train_and_validate(
                 control_version=True,
             )
             if not torch_only:
-                ml_model_object_id = Flowcept.db.save_or_update_ml_model(
+                ml_model_object_id = Flowcept.insert_or_update_ml_model(
                     object=model.state_dict(),
                     object_id=ml_model_object_id,
                     task_id=current_task_id,
@@ -332,7 +330,7 @@ def run_gridsearch_experiment(campaign_id=None):
                 y_val=y_val,
                 dataset_id=dataset_id,
                 checkpoint_check=2,
-                config_id=f"cfg_{idx}",
+                config_id=cfg["config_id"],
                 torch_only=True,
             )
             results.append({"torch_model_object_id": result.get("torch_model_object_id")})
diff --git a/tests/misc_tests/log_test.py b/tests/misc_tests/log_test.py
index 532076ec..2582e83c 100644
--- a/tests/misc_tests/log_test.py
+++ b/tests/misc_tests/log_test.py
@@ -1,9 +1,8 @@
 import logging
-import os.path
 import unittest
 
 from flowcept.commons.flowcept_logger import FlowceptLogger
-from flowcept.configs import PROJECT_NAME, LOG_FILE_LEVEL, LOG_FILE_PATH
+from flowcept.configs import PROJECT_NAME
 
 
 class TestLog(unittest.TestCase):
diff --git a/tests/misc_tests/singleton_test.py b/tests/misc_tests/singleton_test.py
index 82ba47cb..a47f73a0 100644
--- a/tests/misc_tests/singleton_test.py
+++ b/tests/misc_tests/singleton_test.py
@@ -1,19 +1,17 @@
 import unittest
 
-from flowcept import Flowcept
 from flowcept.commons.daos.docdb_dao.docdb_dao_base import DocumentDBDAO
 from flowcept.commons.daos.docdb_dao.lmdb_dao import LMDBDAO
 from flowcept.commons.daos.docdb_dao.mongodb_dao import MongoDBDAO
 from flowcept.commons.flowcept_logger import FlowceptLogger
 from flowcept.configs import MONGO_ENABLED
-from flowcept.flowcept_api.db_api import DBAPI
 
 
 class TestSingleton(unittest.TestCase):
     def test_singleton(self):
         logger = FlowceptLogger()
         try:
-            dao_err = DocumentDBDAO()
+            DocumentDBDAO()
         except Exception as e:
             logger.debug("This exception is expected because we can't instantiate this: " + str(e))
 
diff --git a/tests/report/report_service_test.py b/tests/report/report_service_test.py
index 6a9f0c2f..2a8a2953 100644
--- a/tests/report/report_service_test.py
+++ b/tests/report/report_service_test.py
@@ -1,4 +1,7 @@
 import json
+import os
+import subprocess
+import sys
 import tempfile
 import unittest
 from pathlib import Path
@@ -405,6 +408,48 @@ def test_generate_report_from_jsonl(self):
             assert output.exists()
             assert stats["input_mode"] == "jsonl"
 
+    def test_generate_report_defaults_to_buffer_file(self):
+        with tempfile.TemporaryDirectory() as td:
+            jsonl_path = Path(td) / "flowcept_buffer.jsonl"
+            with jsonl_path.open("w", encoding="utf-8") as f:
+                for rec in _sample_records():
+                    rec_copy = dict(rec)
+                    if isinstance(rec_copy.get("data"), (bytes, bytearray)):
+                        rec_copy["data"] = "bytes-redacted"
+                    f.write(json.dumps(rec_copy) + "\n")
+            output = Path(td) / "card.md"
+            with patch("flowcept.configs.DUMP_BUFFER_PATH", str(jsonl_path)):
+                stats = Flowcept.generate_report(output_path=str(output))
+            assert output.exists()
+            assert stats["input_mode"] == "jsonl"
+
+    def test_start_here_runs_without_settings_file(self):
+        repo_root = Path(__file__).resolve().parents[2]
+        env = os.environ.copy()
+        with tempfile.TemporaryDirectory() as td:
+            for _k in (
+                "FLOWCEPT_SETTINGS_PATH",
+                "FLOWCEPT_USE_DEFAULT",
+                "LMDB_ENABLED",
+                "MONGO_ENABLED",
+                "MQ_ENABLED",
+                "DB_FLUSH_MODE",
+            ):
+                env.pop(_k, None)
+            env["HOME"] = td
+            env["PYTHONPATH"] = str(repo_root / "src")
+            result = subprocess.run(
+                [sys.executable, str(repo_root / "examples/start_here.py")],
+                cwd=td,
+                env=env,
+                capture_output=True,
+                text=True,
+                check=False,
+            )
+            assert result.returncode == 0, result.stderr
+            assert (Path(td) / "flowcept_buffer.jsonl").exists()
+            assert (Path(td) / "WORKFLOW_CARD.md").exists()
+
     def test_generate_report_input_validation(self):
         with self.assertRaises(ValueError):
             Flowcept.generate_report(
diff --git a/tests/test_utils/__init__.py b/tests/test_utils/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/tests/test_utils/test_llm_utils.py b/tests/test_utils/test_llm_utils.py
new file mode 100644
index 00000000..8b8468bd
--- /dev/null
+++ b/tests/test_utils/test_llm_utils.py
@@ -0,0 +1,116 @@
+"""Utilities for scoring LLM responses against expected text in integration tests.
+
+Uses fact-recall scoring: what fraction of expected's content words are present in
+actual (case-insensitive, 5-char prefix matching for morphological variants).
+
+This metric is more appropriate than TF-IDF cosine for LLM responses that contain
+markdown tables, UUIDs, or verbose formatting: it does not penalise actual for having
+more text, and correctly detects missing key facts.
+
+sklearn is NOT required.  Falls back gracefully if unavailable.
+"""
+
+from __future__ import annotations
+
+import re
+
+_UUID_RE = re.compile(r"\b[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}\b", re.I)
+_HEX_FRAG_RE = re.compile(r"\b[0-9a-f]{8,}\b", re.I)
+_MD_NOISE_RE = re.compile(r"[|`*#_\-]{2,}")
+
+_STOP_WORDS = {
+    "the", "a", "an", "is", "was", "are", "were", "be", "been", "have", "has", "had",
+    "do", "does", "did", "will", "would", "shall", "should", "may", "might", "must",
+    "can", "could", "to", "of", "in", "on", "at", "by", "for", "with", "about", "from",
+    "it", "its", "and", "or", "but", "if", "than", "that", "this", "these", "those",
+    "which", "who", "whose", "what", "how", "when", "where", "why", "via", "vs",
+    "two", "one", "some", "any", "all", "each", "per", "ran", "run", "not", "no",
+    "so", "as", "up", "out", "also", "into", "during", "same", "more", "most", "just",
+    "too", "very", "still",
+}
+
+
+def _clean_tokenize(text: str) -> set:
+    """Strip UUIDs, markdown noise, then return a set of lowercase word tokens."""
+    text = _UUID_RE.sub(" ", text)
+    text = _HEX_FRAG_RE.sub(" ", text)
+    text = _MD_NOISE_RE.sub(" ", text)
+    return set(re.findall(r"\b\w+\b", text.lower()))
+
+
+def fact_recall(actual: str, expected: str) -> float:
+    """Fraction of expected's content words present in actual (0.0–1.0).
+
+    Content words are extracted from *expected* by removing stop words and
+    short tokens (< 3 chars).  Presence in *actual* is tested via 5-char
+    prefix matching so that morphological variants like ``coordinates`` /
+    ``coordinated`` or ``submit`` / ``submitted`` match correctly.
+
+    Parameters
+    ----------
+    actual : str
+        LLM response to evaluate.
+    expected : str
+        Reference text with the key facts the response should contain.
+
+    Returns
+    -------
+    float
+        Score in [0.0, 1.0].  Returns 0.0 when expected has no content words.
+    """
+    exp_words = [
+        w for w in _clean_tokenize(expected)
+        if len(w) >= 3 and w not in _STOP_WORDS
+    ]
+    if not exp_words:
+        return 0.0
+
+    act_tokens = _clean_tokenize(actual)
+
+    def _present(word: str) -> bool:
+        if word in act_tokens:
+            return True
+        prefix = word[:5] if len(word) >= 5 else word
+        return any(t.startswith(prefix) for t in act_tokens)
+
+    found = sum(1 for w in exp_words if _present(w))
+    return found / len(exp_words)
+
+
+def cosine_similarity(text_a: str, text_b: str) -> float:
+    """Return TF-IDF cosine similarity between two strings (0.0–1.0).
+
+    Kept for backward compatibility; ``score_response`` now uses
+    ``fact_recall`` instead.  Returns 0.0 on empty input or if sklearn is
+    unavailable.
+    """
+    try:
+        from sklearn.feature_extraction.text import TfidfVectorizer
+        from sklearn.metrics.pairwise import cosine_similarity as _sk_cos
+    except ImportError:
+        return 0.0
+
+    a = _UUID_RE.sub(" ", text_a)
+    b = _UUID_RE.sub(" ", text_b)
+    if not a.strip() or not b.strip():
+        return 0.0
+    try:
+        matrix = TfidfVectorizer().fit_transform([a, b])
+        return float(_sk_cos(matrix[0:1], matrix[1:2])[0][0])
+    except Exception:
+        return 0.0
+
+
+def score_response(actual: str, expected: str, threshold: float) -> bool:
+    """Return True if the fact-recall score of *actual* against *expected* meets *threshold*.
+
+    Parameters
+    ----------
+    actual : str
+        LLM response to evaluate.
+    expected : str
+        Reference text from the test YAML.
+    threshold : float
+        Minimum score required (0.0–1.0).
+    """
+    return fact_recall(actual, expected) >= threshold
diff --git a/tests/webservice/chat_query_tests.yaml b/tests/webservice/chat_query_tests.yaml
new file mode 100644
index 00000000..a37757ae
--- /dev/null
+++ b/tests/webservice/chat_query_tests.yaml
@@ -0,0 +1,265 @@
+# Path-agnostic chat endpoint integration cases.
+#
+# Every question in this file must pass through both paths:
+#   /api/v1/chat -> LangGraph -> MCP -> DB tools
+#   /api/v1/chat -> LangGraph -> MCP -> runtime in-memory tools
+#
+# Tests vary only the HTTP chat context field `tool_context` (`db` vs `df`).
+# Do not add DB-only or DF-only questions without explicit maintainer approval.
+
+- user_query: "What was the complete workflow execution lineage including all activities around the train_and_validate task that achieved the best validation accuracy?"
+  expected_response: "call_hpc_agent submit_gridsearch_job get_dataset train_and_validate select_best_model."
+  score_threshold: 0.65
+
+- user_query: "For configuration cfg_1, what parameters were used and what agent submitted them?"
+  expected_response: "cfg_1 config_id epochs 2 learning_rate 0.01 n_input_neurons 1 submit_gridsearch_job HPCAgent."
+  score_threshold: 0.72
+
+- user_query: "What input fields were used by the train_and_validate tasks?"
+  expected_response: "train_and_validate n_input_neurons epochs x_train y_train x_val y_val dataset_id checkpoint_check learning_rate config_id torch_only job_id."
+  score_threshold: 0.72
+
+- user_query: "Which agent and task submitted the work items for train_and_validate?"
+  expected_response: "HPCAgent submit_gridsearch_job."
+  score_threshold: 0.70
+
+- user_query: "How many tasks ran across all workflows in the campaign?"
+  expected_response: "nine 9 tasks."
+  score_threshold: 0.65
+
+- user_query: "What learning rates and epoch counts were evaluated?"
+  expected_response: "learning_rate 0.01 0.03 0.08 0.12 0.20 epochs 2 4 6 10 14."
+  score_threshold: 0.72
+
+- user_query: "What agents participated in the workflow and what activities did they run?"
+  expected_response: "HPCAgent submit_gridsearch_job Orchestrator call_hpc_agent select_best_model."
+  score_threshold: 0.72
+
+- user_query: "Plot a bar chart showing the number of tasks per activity in the workflow."
+  expected_response: "bar chart activity_id task count train_and_validate 5."
+  score_threshold: 0.55
+
+- user_query: "List the workflows in the campaign."
+  expected_response: "workflow_id name Perceptron GridSearch."
+  score_threshold: 0.72
+
+- user_query: "Which configuration achieved the highest validation accuracy?"
+  expected_response: "highest validation accuracy 1.0 cfg_2 cfg_3 cfg_4 cfg_5 train_and_validate."
+  score_threshold: 0.60
+
+- user_query: "What was the lowest validation accuracy recorded and which configuration produced it?"
+  expected_response: "lowest validation accuracy 0.125 cfg_1 train_and_validate."
+  score_threshold: 0.60
+
+- user_query: "What is the average validation accuracy for configurations with more than 5 epochs?"
+  expected_response: "average validation accuracy 1.0 epochs greater than 5."
+  score_threshold: 0.65
+
+- user_query: "What is the name and start time of the workflow?"
+  expected_response: "workflow name Perceptron GridSearch utc timestamp."
+  score_threshold: 0.60
+
+# T30: richer response cases — table, chart+table+summary
+- user_query: "List all tasks with their activity_id and status as a markdown table."
+  expected_response: "activity_id status FINISHED train_and_validate."
+  score_threshold: 0.65
+  case_id: "table"
+
+- user_query: "Display a bar chart of activity_id distribution and list the data in a table."
+  expected_response: "train_and_validate 5 activity_id bar chart."
+  score_threshold: 0.50
+  case_id: "db_table_plot_summary"
+  tool_contexts: ["db"]
+  tool_expected: "make_chart"
+
+- user_query: "Display a bar chart of activity_id distribution and list the data in a table."
+  expected_response: "train_and_validate 5 activity_id bar chart."
+  score_threshold: 0.50
+  case_id: "df_table_plot_summary"
+  tool_contexts: ["df"]
+  tool_expected: "generate_plot_code"
+
+# T32: full provenance questionnaire — all 34 unique questions from agent_sandbox/questions.csv.
+# Answers are drawn from the gridsearch fixture (single_layer_perceptron_test.py).
+# Dataset: 120 samples, split_ratio=0.8, x shape (120,2), binary labels 0/1.
+# Model: SingleLayerPerceptron (SGD, BCELoss), 2–3 params depending on n_input_neurons (1 or 2).
+# No GPU telemetry; no distributed training; user/machine info from workflow.enrich().
+
+# --- Workflow control-flow ---
+- user_query: "How many activities are present in the whole workflow?"
+  expected_response: "5 activities workflow."
+  score_threshold: 0.70
+  case_id: "t32_activity_count"
+
+- user_query: "What is the final status of the workflow?"
+  expected_response: "finished status workflow."
+  score_threshold: 0.65
+  case_id: "t32_workflow_status"
+
+- user_query: "What is the wall-clock execution time to completion of the workflow?"
+  expected_response: "seconds workflow."
+  score_threshold: 0.75
+  case_id: "t32_wall_clock_time"
+
+- user_query: "What was the specific execution order of the tasks?"
+  expected_response: "call_hpc_agent submit_gridsearch_job get_dataset train_and_validate select_best_model."
+  score_threshold: 0.65
+  case_id: "t32_execution_order"
+
+# DF path cannot compute per-task durations from the in-memory DataFrame; db-only.
+- user_query: "What was the bottleneck during the workflow (activity taking the longest)?"
+  expected_response: "train_and_validate longest bottleneck."
+  score_threshold: 0.55
+  case_id: "t32_bottleneck"
+  tool_contexts: ["db"]
+
+# --- Workflow scheduling / hardware ---
+- user_query: "What hardware was used in the workflow?"
+  expected_response: "cpu machine hardware platform processor."
+  score_threshold: 0.45
+  case_id: "t32_hardware"
+
+- user_query: "Who is responsible for this workflow (person or username or entity)?"
+  expected_response: "user responsible workflow."
+  score_threshold: 0.50
+  case_id: "t32_responsible_user"
+
+# The gridsearch fixture uses HPCAgent/submit_gridsearch_job, so agents may infer HPC/distributed.
+- user_query: "Has the model been trained in a distributed setting?"
+  expected_response: "training distributed setting."
+  score_threshold: 0.45
+  case_id: "t32_distributed"
+
+# --- Workflow dataflow ---
+- user_query: "List all the parameters of the first activity of the workflow."
+  expected_response: "call_hpc_agent activity parameters."
+  score_threshold: 0.55
+  case_id: "t32_first_activity_params"
+
+- user_query: "List all parameters for all activities in the workflow."
+  expected_response: "n_samples split_ratio learning_rate epochs n_input_neurons dataset_id val_accuracy config_id."
+  score_threshold: 0.60
+  case_id: "t32_all_activity_params"
+
+- user_query: "What significant input artifacts are involved in the generation of the finetuned model?"
+  expected_response: "dataset epochs learning input artifacts."
+  score_threshold: 0.65
+  case_id: "t32_input_artifacts"
+
+# --- Workflow telemetry ---
+- user_query: "What was the total energy consumption in kilowatt-hours of the GPU(s) during the workflow?"
+  expected_response: "gpu energy not."
+  score_threshold: 0.60
+  case_id: "t32_gpu_energy_kwh"
+
+- user_query: "What was the total power consumption in Watts of the GPU(s) during the workflow?"
+  expected_response: "gpu power not."
+  score_threshold: 0.60
+  case_id: "t32_gpu_power_watts"
+
+- user_query: "What is the total energy use for completing the workflow?"
+  expected_response: "energy not."
+  score_threshold: 0.65
+  case_id: "t32_total_energy"
+
+# --- Data artifacts ---
+- user_query: "List all workflow input files with size larger than 100Mb."
+  expected_response: "files 100."
+  score_threshold: 0.80
+  case_id: "t32_files_larger_100mb"
+
+- user_query: "List all different object types in the workflow."
+  expected_response: "dataset ml_model object_type objects."
+  score_threshold: 0.55
+  case_id: "t32_file_types"
+
+- user_query: "Identify the largest output of the workflow (by file size)."
+  expected_response: "ml_model dataset object largest."
+  score_threshold: 0.45
+  case_id: "t32_largest_output"
+
+- user_query: "What is the science domain of the dataset?"
+  expected_response: "not available science domain dataset."
+  score_threshold: 0.40
+  case_id: "t32_dataset_science_domain"
+
+- user_query: "Does the dataset have a predetermined train-test split?"
+  expected_response: "split ratio train test."
+  score_threshold: 0.55
+  case_id: "t32_train_test_split"
+
+- user_query: "How many samples are present in the whole dataset?"
+  expected_response: "120 samples dataset."
+  score_threshold: 0.75
+  case_id: "t32_dataset_sample_count"
+
+- user_query: "What is the semantic format (e.g. strings; ints; bounding boxes) of the ground truth (if present)?"
+  expected_response: "ground truth not."
+  score_threshold: 0.60
+  case_id: "t32_ground_truth_format"
+
+- user_query: "What is the specific task for which the dataset was created?"
+  expected_response: "not available task dataset."
+  score_threshold: 0.40
+  case_id: "t32_dataset_task"
+
+- user_query: "What is the size in byte of one sample?"
+  expected_response: "bytes sample features shape."
+  score_threshold: 0.40
+  case_id: "t32_sample_size_bytes"
+
+- user_query: "What is the total size of the whole dataset?"
+  expected_response: "size dataset bytes samples."
+  score_threshold: 0.40
+  case_id: "t32_dataset_total_size"
+
+# --- ML model ---
+- user_query: "What are the designed uses for this model?"
+  expected_response: "not available designed uses model."
+  score_threshold: 0.40
+  case_id: "t32_model_designed_uses"
+
+- user_query: "What distinct epoch counts were used in the finetuning configurations?"
+  expected_response: "epochs 2 4 6 10 14 configurations training."
+  score_threshold: 0.60
+  case_id: "t32_epochs"
+
+- user_query: "How many model parameters (weights) does the model have?"
+  expected_response: "params parameters 2 3 model."
+  score_threshold: 0.55
+  case_id: "t32_model_params"
+
+- user_query: "What is the science domain of the model?"
+  expected_response: "not available science domain model."
+  score_threshold: 0.40
+  case_id: "t32_model_science_domain"
+
+- user_query: "What is the task solved by this model (regression or classification or forecast etc.)?"
+  expected_response: "not available task model."
+  score_threshold: 0.40
+  case_id: "t32_model_task"
+
+- user_query: "What is the intended use of this model?"
+  expected_response: "not available intended use model."
+  score_threshold: 0.40
+  case_id: "t32_model_intended_use"
+
+- user_query: "What is the size of the final model in Mb?"
+  expected_response: "model size mb small."
+  score_threshold: 0.40
+  case_id: "t32_model_size_mb"
+
+- user_query: "What technique was used to fine-tune the model? (e.g. LoRa; GAN...)"
+  expected_response: "not available technique fine-tune."
+  score_threshold: 0.40
+  case_id: "t32_finetuning_technique"
+
+- user_query: "What is the computational throughput of the model?"
+  expected_response: "not available throughput computational."
+  score_threshold: 0.40
+  case_id: "t32_throughput"
+
+- user_query: "Are the performance shown in the pretrained version improved in the finetuning?"
+  expected_response: "no pretrained scratch trained from."
+  score_threshold: 0.45
+  case_id: "t32_pretrained_improvement"
diff --git a/tests/webservice/conftest.py b/tests/webservice/conftest.py
new file mode 100644
index 00000000..4e1c2531
--- /dev/null
+++ b/tests/webservice/conftest.py
@@ -0,0 +1,108 @@
+"""Session-level fixtures for webservice integration tests."""
+
+from __future__ import annotations
+
+import time
+from uuid import uuid4
+
+import pytest
+
+from flowcept import Flowcept
+from flowcept.commons.flowcept_logger import FlowceptLogger
+from flowcept.configs import MONGO_ENABLED
+
+
+def _wait_for_tasks(workflow_id: str, min_count: int, timeout: float = 60.0) -> bool:
+    deadline = time.time() + timeout
+    while time.time() < deadline:
+        count = len(Flowcept.db.task_query(filter={"workflow_id": workflow_id}) or [])
+        if count >= min_count:
+            return True
+        time.sleep(0.5)
+    return False
+
+
+def _wait_for_objects(workflow_id: str, min_count: int, timeout: float = 60.0) -> bool:
+    from flowcept.flowcept_api.db_api import DBAPI
+
+    deadline = time.time() + timeout
+    while time.time() < deadline:
+        count = len(DBAPI().blob_object_query(filter={"workflow_id": workflow_id}) or [])
+        if count >= min_count:
+            return True
+        time.sleep(0.5)
+    return False
+
+
+def _wait_for_agents(workflow_id: str, min_count: int, timeout: float = 60.0) -> bool:
+    from flowcept.commons.daos.docdb_dao.mongodb_dao import MongoDBDAO
+
+    deadline = time.time() + timeout
+    while time.time() < deadline:
+        count = len(MongoDBDAO().agent_query(filter={"workflow_id": workflow_id}) or [])
+        if count >= min_count:
+            return True
+        time.sleep(0.5)
+    return False
+
+
+@pytest.fixture(scope="session")
+def gridsearch_run_data():
+    """Run the Perceptron GridSearch experiment once and yield its artifacts.
+
+    Skips automatically when:
+    - MongoDB is disabled.
+    - Flowcept infrastructure services (MQ/KVDB/Mongo) are not alive.
+    - The LLM agent is not configured (api_key / service_provider missing).
+
+    Yields
+    ------
+    dict
+        Keys: ``workflow_id``, ``tasks``, ``configs``, ``results``, ``selected``,
+        ``campaign_id``.
+    Cleanup: deletes the campaign and all its data after the session ends.
+    """
+    logger = FlowceptLogger()
+
+    if not MONGO_ENABLED:
+        pytest.skip("MongoDB is disabled; gridsearch fixture requires Mongo.")
+    if not Flowcept.services_alive():
+        logger.warning("Skipping gridsearch session fixture: one or more services not ready (see ERROR logs above).")
+        pytest.skip("One or more services not ready.")
+
+    from tests.instrumentation_tests.ml_tests.single_layer_perceptron_test import run_gridsearch_experiment
+
+    campaign_id = f"chat-test-gs-{uuid4()}"
+    run_data = run_gridsearch_experiment(campaign_id=campaign_id)
+    run_data["campaign_id"] = campaign_id
+
+    workflow_id = run_data["workflow_id"]
+    # Wait for all tasks to land in MongoDB before any chat test reads them.
+    min_tasks = len(run_data.get("configs", [])) + 3  # train tasks + setup tasks
+    ok = _wait_for_tasks(workflow_id, min_count=min_tasks)
+    if not ok:
+        count = len(Flowcept.db.task_query(filter={"workflow_id": workflow_id}) or [])
+        logger.warning(f"gridsearch fixture: only {count} tasks persisted after timeout.")
+
+    # Wait for blob objects (dataset + ml_model checkpoints) — needed by DF-path object queries.
+    ok = _wait_for_objects(workflow_id, min_count=2)
+    if not ok:
+        from flowcept.flowcept_api.db_api import DBAPI
+
+        count = len(DBAPI().blob_object_query(filter={"workflow_id": workflow_id}) or [])
+        logger.warning(f"gridsearch fixture: only {count} objects persisted after timeout.")
+
+    # Wait for agents (HPCAgent + Orchestrator) — needed by list_agents tool calls.
+    ok = _wait_for_agents(workflow_id, min_count=2)
+    if not ok:
+        from flowcept.commons.daos.docdb_dao.mongodb_dao import MongoDBDAO
+
+        count = len(MongoDBDAO().agent_query(filter={"workflow_id": workflow_id}) or [])
+        logger.warning(f"gridsearch fixture: only {count} agents persisted after timeout.")
+
+    yield run_data
+
+    try:
+        Flowcept.db.delete_campaign_data(campaign_id)
+    except Exception as exc:
+        logger.warning(f"gridsearch fixture cleanup failed for campaign {campaign_id}: {exc}")
diff --git a/tests/webservice/test_imports.py b/tests/webservice/test_imports.py
deleted file mode 100644
index dca9c0bd..00000000
--- a/tests/webservice/test_imports.py
+++ /dev/null
@@ -1,7 +0,0 @@
-"""Basic import smoke test for webservice package."""
-
-
-def test_webservice_imports():
-    from flowcept.webservice.main import app
-
-    assert app is not None
diff --git a/tests/webservice/test_webservice_api.py b/tests/webservice/test_webservice_api.py
deleted file mode 100644
index a9d844b6..00000000
--- a/tests/webservice/test_webservice_api.py
+++ /dev/null
@@ -1,908 +0,0 @@
-"""Webservice API tests with a mocked DBAPI dependency."""
-
-from __future__ import annotations
-
-from pathlib import Path
-from unittest.mock import patch
-
-from fastapi.testclient import TestClient
-
-from flowcept.commons.flowcept_dataclasses.blob_object import BlobObject
-from flowcept.commons.flowcept_dataclasses.workflow_object import WorkflowObject
-from flowcept.webservice.deps import get_db_api
-from flowcept.webservice.main import create_app
-from flowcept.webservice.services.dashboard_store import get_dashboard_store
-
-
-class FakeDB:
-    """Simple fake DBAPI for endpoint tests."""
-
-    def __init__(self):
-        self.workflows = [
-            {"workflow_id": "wf-1", "user": "alice", "campaign_id": "c1", "name": "run-a", "utc_timestamp": 200},
-            {"workflow_id": "wf-2", "user": "bob", "campaign_id": "c2", "name": "run-b", "utc_timestamp": 100},
-        ]
-        self.tasks = [
-            {"task_id": "t2", "workflow_id": "wf-1", "status": "running", "started_at": 20},
-            {"task_id": "t1", "workflow_id": "wf-1", "status": "finished", "started_at": 10},
-            {"task_id": "t3", "workflow_id": "wf-2", "status": "finished", "started_at": 30},
-        ]
-        self.agents = []
-        self.objects = [
-            {
-                "object_id": "o1",
-                "workflow_id": "wf-1",
-                "task_id": "t1",
-                "object_type": "dataset",
-                "version": 1,
-                "custom_metadata": {"k": "v1"},
-                "data": b"payload-1",
-                "created_at": "2025-01-02T00:00:00",
-            },
-            {
-                "object_id": "o2",
-                "workflow_id": "wf-2",
-                "task_id": "t3",
-                "object_type": "ml_model",
-                "version": 2,
-                "custom_metadata": {"k": "v2", "loss": 0.42},
-                "data": b"payload-2",
-                "created_at": "2025-01-01T00:00:00",
-            },
-            {
-                "object_id": "o3",
-                "workflow_id": "wf-1",
-                "task_id": "t2",
-                "object_type": "ml_model",
-                "version": 3,
-                "custom_metadata": {"k": "v3", "loss": 0.11},
-                "data": b"payload-2",
-                "created_at": "2025-01-01T00:00:00",
-            },
-        ]
-
-    @staticmethod
-    def _nested_get(item, field):
-        value = item
-        for part in field.split("."):
-            if not isinstance(value, dict):
-                return None
-            value = value.get(part)
-        return value
-
-    @classmethod
-    def _matches_filter(cls, item, filter_doc):
-        if not filter_doc:
-            return True
-
-        for key, value in filter_doc.items():
-            if key == "$and":
-                return all(cls._matches_filter(item, clause) for clause in value)
-            if key == "$or":
-                return any(cls._matches_filter(item, clause) for clause in value)
-
-            field_value = cls._nested_get(item, key)
-            if isinstance(value, dict):
-                for op, expected in value.items():
-                    if op == "$exists":
-                        exists = field_value is not None
-                        if bool(expected) != exists:
-                            return False
-                    elif op == "$eq":
-                        if field_value != expected:
-                            return False
-                    elif op == "$ne":
-                        if field_value == expected:
-                            return False
-                    elif op == "$in":
-                        if field_value not in expected:
-                            return False
-                    elif op == "$nin":
-                        if field_value in expected:
-                            return False
-                    elif op == "$gt":
-                        if field_value is None or not field_value > expected:
-                            return False
-                    elif op == "$gte":
-                        if field_value is None or not field_value >= expected:
-                            return False
-                    elif op == "$lt":
-                        if field_value is None or not field_value < expected:
-                            return False
-                    elif op == "$lte":
-                        if field_value is None or not field_value <= expected:
-                            return False
-                    else:
-                        raise ValueError(f"Unsupported fake operator in test DB: {op}")
-            else:
-                if field_value != value:
-                    return False
-        return True
-
-    def workflow_query(self, filter):
-        return [wf for wf in self.workflows if self._matches_filter(wf, filter)]
-
-    def get_workflow_object(self, workflow_id):
-        for wf in self.workflows:
-            if wf["workflow_id"] == workflow_id:
-                return WorkflowObject.from_dict(wf)
-        return None
-
-    def query(self, **kwargs):
-        collection = kwargs.get("collection")
-        filter_ = kwargs.get("filter") or {}
-        limit = kwargs.get("limit", 0)
-        projection = kwargs.get("projection")
-        sort = kwargs.get("sort")
-
-        if collection == "workflows":
-            rs = [wf for wf in self.workflows if self._matches_filter(wf, filter_)]
-            if sort:
-                for field, order in reversed(sort):
-                    rs = sorted(rs, key=lambda item: self._nested_get(item, field), reverse=(order == -1))
-            if projection:
-                rs = [{k: v for k, v in row.items() if k in projection} for row in rs]
-            return rs[:limit] if limit else rs
-
-        if collection == "objects":
-            rs = [obj for obj in self.objects if self._matches_filter(obj, filter_)]
-            if sort:
-                for field, order in reversed(sort):
-                    rs = sorted(rs, key=lambda item: self._nested_get(item, field), reverse=(order == -1))
-            if projection:
-                rs = [{k: v for k, v in row.items() if k in projection} for row in rs]
-            return rs[:limit] if limit else rs
-
-        if collection == "tasks":
-            rs = [task for task in self.tasks if self._matches_filter(task, filter_)]
-            if sort:
-                for field, order in reversed(sort):
-                    rs = sorted(rs, key=lambda item: self._nested_get(item, field), reverse=(order == -1))
-            if projection:
-                rs = [{k: v for k, v in row.items() if k in projection} for row in rs]
-            return rs[:limit] if limit else rs
-
-        if collection == "agents":
-            rs = [ag for ag in self.agents if self._matches_filter(ag, filter_)]
-            if sort:
-                for field, order in reversed(sort):
-                    rs = sorted(rs, key=lambda item: self._nested_get(item, field), reverse=(order == -1))
-            if projection:
-                rs = [{k: v for k, v in row.items() if k in projection} for row in rs]
-            return rs[:limit] if limit else rs
-
-        return []
-
-    def delete_agents_with_filter(self, filter):
-        self.agents = [ag for ag in self.agents if not self._matches_filter(ag, filter)]
-        return True
-
-    def agent_query(
-        self,
-        filter,
-        projection=None,
-        limit=0,
-        sort=None,
-    ):
-        rs = [ag for ag in self.agents if self._matches_filter(ag, filter or {})]
-        if sort:
-            for field, order in reversed(sort):
-                rs = sorted(rs, key=lambda item: item.get(field), reverse=(order == -1))
-        if projection:
-            rs = [{k: v for k, v in row.items() if k in projection} for row in rs]
-        return rs[:limit] if limit else rs
-
-    def task_query(
-        self,
-        filter,
-        projection=None,
-        limit=0,
-        sort=None,
-        aggregation=None,
-        remove_json_unserializables=True,
-    ):
-        rs = [task for task in self.tasks if self._matches_filter(task, filter or {})]
-
-        if sort:
-            for field, order in reversed(sort):
-                rs = sorted(rs, key=lambda item: item.get(field), reverse=(order == -1))
-
-        if projection:
-            rs = [{k: v for k, v in row.items() if k in projection} for row in rs]
-
-        return rs[:limit] if limit else rs
-
-    def blob_object_query(self, filter):
-        return [obj for obj in self.objects if self._matches_filter(obj, filter or {})]
-
-    def get_blob_object(self, object_id, version=None):
-        if version is None:
-            for obj in self.objects:
-                if obj["object_id"] == object_id:
-                    return BlobObject.from_dict(obj)
-            raise ValueError(f"Object not found for object_id={object_id}.")
-
-        for obj in self.objects:
-            if obj["object_id"] == object_id and obj["version"] == version:
-                return BlobObject.from_dict(obj)
-
-        raise ValueError(f"Object not found for object_id={object_id}, version={version}.")
-
-    def get_object_history(self, object_id):
-        return [
-            {"object_id": object_id, "version": 2, "created_at": "2025-01-02T00:00:00"},
-            {"object_id": object_id, "version": 1, "created_at": "2025-01-01T00:00:00"},
-        ]
-
-
-def build_client() -> tuple[TestClient, FakeDB]:
-    app = create_app()
-    fake_db = FakeDB()
-    app.dependency_overrides[get_db_api] = lambda: fake_db
-    return TestClient(app), fake_db
-
-
-class FakeDashboardStore:
-    """Small in-memory dashboard store for route contract tests."""
-
-    def __init__(self):
-        self.docs = {}
-
-    def save(self, dashboard):
-        self.docs[dashboard["dashboard_id"]] = dashboard
-        return True
-
-    def get(self, dashboard_id):
-        return self.docs.get(dashboard_id)
-
-    def list(self):
-        return list(self.docs.values())
-
-    def list_by_type(self, dashboard_type):
-        return [doc for doc in self.docs.values() if doc.get("dashboard_type") == dashboard_type]
-
-    def delete(self, dashboard_id):
-        return self.docs.pop(dashboard_id, None) is not None
-
-
-def test_info_endpoint():
-    from flowcept.version import __version__
-
-    client, _ = build_client()
-    rs = client.get("/api/v1/info")
-    assert rs.status_code == 200
-    assert rs.json() == {"service": "flowcept", "version": __version__}
-
-
-def test_root_and_openapi_endpoints():
-    client, _ = build_client()
-
-    root = client.get("/")
-    assert root.status_code == 200
-    if root.headers["content-type"].startswith("application/json"):
-        # No built UI assets present: root exposes the API status payload.
-        assert root.json()["service"] == "flowcept-webservice"
-    else:
-        # Built UI assets present: root serves the SPA index page.
-        assert "text/html" in root.headers["content-type"]
-
-    assert client.get("/openapi.json").status_code == 200
-    assert client.get("/docs").status_code == 200
-    assert client.get("/redoc").status_code == 200
-
-
-def test_health_endpoints():
-    client, _ = build_client()
-    assert client.get("/api/v1/health/live").json() == {"status": "ok"}
-    assert client.get("/api/v1/health/ready").json() == {"status": "ready"}
-
-
-def test_workflows_list_get_and_query():
-    client, _ = build_client()
-
-    rs = client.get("/api/v1/workflows", params={"limit": 10})
-    assert rs.status_code == 200
-    items = rs.json()["items"]
-    assert [item["workflow_id"] for item in items] == ["wf-1", "wf-2"]
-
-    rs = client.get("/api/v1/workflows", params={"user": "alice", "limit": 5})
-    assert rs.status_code == 200
-    body = rs.json()
-    assert body["count"] == 1
-    assert body["items"][0]["workflow_id"] == "wf-1"
-
-    rs = client.get("/api/v1/workflows/wf-1")
-    assert rs.status_code == 200
-    assert rs.json()["workflow_id"] == "wf-1"
-
-    rs = client.post(
-        "/api/v1/workflows/query",
-        json={"filter": {"campaign_id": "c2"}, "limit": 10, "projection": ["workflow_id"]},
-    )
-    assert rs.status_code == 200
-    assert rs.json()["count"] == 1
-
-
-def test_workflow_card_download_route():
-    client, _ = build_client()
-
-    def _fake_generate_report(**kwargs):
-        output = kwargs["output_path"]
-        Path(output).write_text("# Workflow Card\n\nworkflow: wf-1\n", encoding="utf-8")
-        return {"output": output}
-
-    with patch("flowcept.webservice.routers.workflows.Flowcept.generate_report", side_effect=_fake_generate_report):
-        rs = client.post("/api/v1/workflows/wf-1/reports/workflow-card/download")
-
-    assert rs.status_code == 200
-    assert rs.headers["content-type"].startswith("text/markdown")
-    assert 'attachment; filename="workflow_card_wf-1.md"' == rs.headers["content-disposition"]
-    assert "# Workflow Card" in rs.text
-
-
-def test_workflow_card_pdf_download_route():
-    client, _ = build_client()
-
-    def _fake_generate_report(**kwargs):
-        output = kwargs["output_path"]
-        Path(output).write_bytes(b"%PDF-1.4\n%%EOF")
-        return {"output": output}
-
-    with patch("flowcept.webservice.services.reports.generate_report", side_effect=_fake_generate_report):
-        rs = client.get("/api/v1/workflows/wf-1/workflow_card", params={"format": "pdf"})
-
-    assert rs.status_code == 200
-    assert rs.headers["content-type"].startswith("application/pdf")
-    assert rs.headers["content-disposition"] == 'attachment; filename="workflow_card_wf-1.pdf"'
-    assert rs.content.startswith(b"%PDF-1.4")
-
-
-def test_workflow_card_route_is_named_workflow_card():
-    client, _ = build_client()
-
-    openapi = client.get("/openapi.json")
-    assert openapi.status_code == 200
-    schema = openapi.json()
-    paths = schema["paths"]
-    assert "/api/v1/workflows/{workflow_id}/workflow_card" in paths
-    assert "/api/v1/workflows/{workflow_id}/provenance_card" not in paths
-
-
-def test_workflows_errors():
-    client, _ = build_client()
-
-    rs = client.get("/api/v1/workflows/does-not-exist")
-    assert rs.status_code == 404
-
-    rs = client.get("/api/v1/workflows", params={"filter_json": "not-json"})
-    assert rs.status_code == 400
-
-    rs = client.post("/api/v1/workflows/does-not-exist/reports/workflow-card/download")
-    assert rs.status_code == 404
-
-
-def test_workflow_card_download_generation_error():
-    client, _ = build_client()
-
-    with patch(
-        "flowcept.webservice.routers.workflows.Flowcept.generate_report",
-        side_effect=RuntimeError("report generation failed"),
-    ):
-        rs = client.post("/api/v1/workflows/wf-1/reports/workflow-card/download")
-
-    assert rs.status_code == 500
-    assert "Could not generate workflow card" in rs.json()["detail"]
-
-
-def test_tasks_list_get_by_workflow_and_query():
-    client, _ = build_client()
-
-    rs = client.get("/api/v1/tasks", params={"workflow_id": "wf-1", "limit": 10})
-    assert rs.status_code == 200
-    assert rs.json()["count"] == 2
-    assert [item["task_id"] for item in rs.json()["items"]] == ["t2", "t1"]
-
-    rs = client.get("/api/v1/tasks/t1")
-    assert rs.status_code == 200
-    assert rs.json()["task_id"] == "t1"
-
-    rs = client.get("/api/v1/tasks/by_workflow/wf-2")
-    assert rs.status_code == 200
-    assert rs.json()["count"] == 1
-
-    rs = client.post(
-        "/api/v1/tasks/query",
-        json={
-            "filter": {"workflow_id": "wf-1"},
-            "sort": [{"field": "started_at", "order": -1}],
-            "projection": ["task_id", "started_at"],
-            "limit": 10,
-        },
-    )
-    assert rs.status_code == 200
-    items = rs.json()["items"]
-    assert items[0]["started_at"] >= items[1]["started_at"]
-
-
-def test_tasks_errors_and_validation():
-    client, _ = build_client()
-
-    rs = client.get("/api/v1/tasks/")
-    assert rs.status_code == 404
-
-    rs = client.get("/api/v1/tasks/missing")
-    assert rs.status_code == 404
-
-    rs = client.get("/api/v1/tasks", params={"filter_json": "[]"})
-    assert rs.status_code == 400
-
-    rs = client.post(
-        "/api/v1/tasks/query",
-        json={
-            "filter": {},
-            "projection": ["task_id", "workflow_id"],
-            "aggregation": [{"operator": "max", "field": "started_at"}],
-            "limit": 10,
-        },
-    )
-    assert rs.status_code == 400
-
-
-def test_objects_list_get_version_history_and_query():
-    client, _ = build_client()
-
-    rs = client.get("/api/v1/objects", params={"workflow_id": "wf-1", "limit": 10})
-    assert rs.status_code == 200
-    assert rs.json()["count"] == 2
-    assert "data" not in rs.json()["items"][0]
-
-    rs = client.get("/api/v1/objects", params={"limit": 10})
-    assert rs.status_code == 200
-    assert [item["object_id"] for item in rs.json()["items"]] == ["o1", "o2", "o3"]
-
-    rs = client.get("/api/v1/objects/o1")
-    assert rs.status_code == 200
-    assert rs.json()["object_id"] == "o1"
-    assert "data" not in rs.json()
-
-    rs = client.get("/api/v1/objects/o1", params={"include_data": True})
-    assert rs.status_code == 200
-    assert isinstance(rs.json()["data"], str)
-
-    rs = client.get("/api/v1/objects/o2/versions/2", params={"include_data": True})
-    assert rs.status_code == 200
-    assert rs.json()["version"] == 2
-
-    rs = client.get("/api/v1/objects/o1/download")
-    assert rs.status_code == 200
-    assert rs.content == b"payload-1"
-
-    rs = client.get("/api/v1/objects/o2/versions/2/download")
-    assert rs.status_code == 200
-    assert rs.content == b"payload-2"
-
-    rs = client.get("/api/v1/objects/o2/history", params={"limit": 1})
-    assert rs.status_code == 200
-    assert rs.json()["count"] == 1
-
-    rs = client.post(
-        "/api/v1/objects/query",
-        json={
-            "filter": {},
-            "projection": ["object_id", "version"],
-            "sort": [{"field": "version", "order": -1}],
-            "limit": 1,
-            "include_data": False,
-        },
-    )
-    assert rs.status_code == 200
-    body = rs.json()
-    assert body["count"] == 1
-    assert set(body["items"][0].keys()) <= {"object_id", "version"}
-
-
-def test_objects_errors_and_validation():
-    client, _ = build_client()
-
-    rs = client.get("/api/v1/objects/unknown")
-    assert rs.status_code == 404
-
-    rs = client.get("/api/v1/objects/o1/versions/99")
-    assert rs.status_code == 404
-
-    rs = client.get("/api/v1/objects", params={"filter_json": "not-json"})
-    assert rs.status_code == 400
-
-    rs = client.post("/api/v1/objects/query", json={"filter": {}, "limit": 5001})
-    assert rs.status_code == 422
-
-
-def test_datasets_routes():
-    client, _ = build_client()
-
-    rs = client.get("/api/v1/datasets")
-    assert rs.status_code == 200
-    assert rs.json()["count"] == 1
-    assert rs.json()["items"][0]["object_type"] == "dataset"
-
-    rs = client.get("/api/v1/datasets/o1")
-    assert rs.status_code == 200
-    assert rs.json()["object_type"] == "dataset"
-
-    rs = client.get("/api/v1/datasets/o1/versions/1")
-    assert rs.status_code == 200
-    assert rs.json()["version"] == 1
-
-    rs = client.get("/api/v1/datasets/o1/download")
-    assert rs.status_code == 200
-    assert rs.content == b"payload-1"
-
-    rs = client.post("/api/v1/datasets/query", json={"filter": {}, "limit": 10})
-    assert rs.status_code == 200
-    assert rs.json()["count"] == 1
-    assert rs.json()["items"][0]["object_type"] == "dataset"
-
-    rs = client.get("/api/v1/datasets/o2")
-    assert rs.status_code == 404
-
-
-def test_models_routes():
-    client, _ = build_client()
-
-    rs = client.get("/api/v1/models")
-    assert rs.status_code == 200
-    assert rs.json()["count"] == 2
-    assert rs.json()["items"][0]["object_type"] == "ml_model"
-
-    rs = client.get("/api/v1/models/o2")
-    assert rs.status_code == 200
-    assert rs.json()["object_type"] == "ml_model"
-
-    rs = client.get("/api/v1/models/o2/versions/2")
-    assert rs.status_code == 200
-    assert rs.json()["version"] == 2
-
-    rs = client.get("/api/v1/models/o2/download")
-    assert rs.status_code == 200
-    assert rs.content == b"payload-2"
-
-    rs = client.post("/api/v1/models/query", json={"filter": {}, "limit": 10})
-    assert rs.status_code == 200
-    assert rs.json()["count"] == 2
-    assert rs.json()["items"][0]["object_type"] == "ml_model"
-
-    rs = client.get("/api/v1/models/o1")
-    assert rs.status_code == 404
-
-
-def test_unified_scoped_query_models_supports_exists_and_nested_sort():
-    client, _ = build_client()
-
-    rs = client.post(
-        "/api/v1/query/models",
-        json={
-            "filter": {
-                "workflow_id": "wf-1",
-                "custom_metadata.loss": {"$exists": True},
-            },
-            "sort": [{"field": "custom_metadata.loss", "order": 1}],
-            "projection": ["object_id", "object_type", "custom_metadata"],
-            "limit": 1,
-        },
-    )
-    assert rs.status_code == 200
-    body = rs.json()
-    assert body["count"] == 1
-    assert body["items"][0]["object_id"] == "o3"
-    assert body["items"][0]["object_type"] == "ml_model"
-    assert body["items"][0]["custom_metadata"]["loss"] == 0.11
-
-
-def test_unified_scoped_query_workflows_scope():
-    client, _ = build_client()
-    rs = client.post(
-        "/api/v1/query/workflows",
-        json={
-            "filter": {"campaign_id": "c1"},
-            "projection": ["workflow_id", "campaign_id"],
-            "limit": 10,
-        },
-    )
-    assert rs.status_code == 200
-    body = rs.json()
-    assert body["count"] == 1
-    assert body["items"][0]["workflow_id"] == "wf-1"
-
-
-def test_unified_scoped_query_tasks_scope():
-    client, _ = build_client()
-    rs = client.post(
-        "/api/v1/query/tasks",
-        json={
-            "filter": {"workflow_id": "wf-1"},
-            "sort": [{"field": "started_at", "order": -1}],
-            "projection": ["task_id", "started_at"],
-            "limit": 1,
-        },
-    )
-    assert rs.status_code == 200
-    body = rs.json()
-    assert body["count"] == 1
-    assert body["items"][0]["task_id"] == "t2"
-
-
-def test_unified_scoped_query_objects_scope():
-    client, _ = build_client()
-    rs = client.post(
-        "/api/v1/query/objects",
-        json={
-            "filter": {"object_type": "dataset"},
-            "projection": ["object_id", "object_type"],
-            "limit": 10,
-        },
-    )
-    assert rs.status_code == 200
-    body = rs.json()
-    assert body["count"] == 1
-    assert body["items"][0]["object_id"] == "o1"
-    assert body["items"][0]["object_type"] == "dataset"
-
-
-def test_unified_scoped_query_datasets_scope_enforces_type():
-    client, _ = build_client()
-    rs = client.post(
-        "/api/v1/query/datasets",
-        json={
-            "filter": {"object_type": "ml_model"},
-            "limit": 10,
-        },
-    )
-    assert rs.status_code == 200
-    assert rs.json()["count"] == 0
-
-
-def test_unified_scoped_query_rejects_unsupported_operator():
-    client, _ = build_client()
-    rs = client.post(
-        "/api/v1/query/objects",
-        json={
-            "filter": {"task_id": {"$where": "this.task_id == 't1'"}},
-            "limit": 10,
-        },
-    )
-    assert rs.status_code == 400
-    assert "Unsupported filter operator" in rs.json()["detail"]
-
-
-def test_dashboard_routes_accept_charts_contract():
-    app = create_app()
-    store = FakeDashboardStore()
-    app.dependency_overrides[get_dashboard_store] = lambda: store
-    client = TestClient(app)
-
-    spec = {
-        "name": "dashboard",
-        "context": {"workflow_id": "wf-1"},
-        "charts": [
-            {
-                "chart_id": "c1",
-                "type": "chart",
-                "data": {"source": "tasks", "filter": {"workflow_id": "wf-1"}},
-            }
-        ],
-        "layout": [{"chart_id": "c1", "x": 0, "y": 0, "w": 6, "h": 4}],
-    }
-
-    rs = client.post("/api/v1/dashboards", json=spec)
-    assert rs.status_code == 201
-    body = rs.json()
-    assert body["charts"][0]["chart_id"] == "c1"
-    assert body["layout"][0]["chart_id"] == "c1"
-
-
-def test_agents_and_dataflow_routes():
-    client, fake_db = build_client()
-
-    fake_db.tasks = [
-        {
-            "task_id": "t1",
-            "workflow_id": "wf-1",
-            "status": "finished",
-            "started_at": 10,
-            "agent_id": "agent-1",
-            "source_agent_id": "orchestrator",
-            "used": {"x": 1},
-            "generated": {"y": 2},
-        },
-        {
-            "task_id": "t2",
-            "workflow_id": "wf-1",
-            "status": "running",
-            "started_at": 20,
-            "agent_id": "agent-2",
-            "used": {"y": 2},
-            "generated": {"z": 3},
-        },
-    ]
-    fake_db.agents = [
-        {"agent_id": "agent-1", "name": "Agent 1", "registered_at": 10},
-        {"agent_id": "agent-2", "name": "Agent 2", "registered_at": 20},
-    ]
-
-    rs = client.get("/api/v1/agents")
-    assert rs.status_code == 200
-    agents = rs.json()["items"]
-    assert len(agents) == 2
-    agent_map = {a["agent_id"]: a for a in agents}
-    assert "agent-1" in agent_map
-    assert "agent-2" in agent_map
-
-    rs = client.get("/api/v1/agents/agent-1")
-    assert rs.status_code == 200
-    assert rs.json()["agent"]["agent_id"] == "agent-1"
-
-    rs = client.get("/api/v1/workflows/wf-1/dataflow")
-    assert rs.status_code == 200
-    dataflow = rs.json()
-    task_nodes = [n for n in dataflow["nodes"] if n["kind"] == "task"]
-    assert len(task_nodes) == 2
-    for node in task_nodes:
-        stats = node["stats"]
-        assert "agent_id" in stats
-        assert "source_agent_id" in stats
-        if node["id"] == "task:t1":
-            assert stats["agent_id"] == "agent-1"
-            assert stats["source_agent_id"] == "orchestrator"
-
-
-def test_dataflow_label_fallback():
-    from flowcept import configs
-
-    original_max = getattr(configs, "WEBSERVER_MAX_LABEL_LENGTH", 30)
-
-    client, fake_db = build_client()
-    fake_db.tasks = [
-        {
-            "task_id": "t1",
-            "workflow_id": "wf-1",
-            "status": "finished",
-            "started_at": 10,
-            "used": {
-                "short_key": 1,
-                "a_very_long_input_key_that_exceeds_ten_characters": 2,
-            },
-            "generated": {
-                "another_extremely_long_output_key_name_that_exceeds_ten": 3,
-            },
-        }
-    ]
-
-    try:
-        configs.WEBSERVER_MAX_LABEL_LENGTH = 10
-        rs = client.get("/api/v1/workflows/wf-1/dataflow")
-        assert rs.status_code == 200
-        dataflow = rs.json()
-
-        # Verify the chunks have fallback labels
-        chunks = [n for n in dataflow["nodes"] if n["kind"] == "chunk"]
-        assert len(chunks) == 2
-
-        # Since the labels are longer than 10 characters, they must fall back to "inputs (2)" and "outputs (1)"
-        input_chunk = next(n for n in chunks if n["stats"]["kind"] == "input")
-        output_chunk = next(n for n in chunks if n["stats"]["kind"] == "output")
-
-        assert input_chunk["label"] == "inputs (2)"
-        assert output_chunk["label"] == "outputs (1)"
-
-    finally:
-        configs.WEBSERVER_MAX_LABEL_LENGTH = original_max
-
-
-def test_dataflow_label_no_positional_args():
-    """Chunk labels must not expose raw arg_N positional-argument keys."""
-    client, fake_db = build_client()
-    fake_db.tasks = [
-        {
-            "task_id": "t1",
-            "workflow_id": "wf-1",
-            "status": "finished",
-            "started_at": 10,
-            "used": {"arg_0": 1, "arg_1": 2},
-            "generated": {"result": 42},
-        }
-    ]
-    rs = client.get("/api/v1/workflows/wf-1/dataflow")
-    assert rs.status_code == 200
-    dataflow = rs.json()
-    chunks = [n for n in dataflow["nodes"] if n["kind"] == "chunk"]
-    assert len(chunks) == 2
-    input_chunk = next(n for n in chunks if n["stats"]["kind"] == "input")
-    # "arg_0, arg_1" is not a useful label; should fall back to count form
-    assert "arg_" not in input_chunk["label"]
-    # Named output keys should still render as-is
-    output_chunk = next(n for n in chunks if n["stats"]["kind"] == "output")
-    assert "result" in output_chunk["label"]
-
-
-def test_delete_empty_agents():
-    client, fake_db = build_client()
-    fake_db.agents = [
-        {"agent_id": "agent-active", "name": "Active Agent", "registered_at": 10},
-        {"agent_id": "agent-empty", "name": "Empty Agent", "registered_at": 20},
-    ]
-    fake_db.tasks = [
-        {
-            "task_id": "t1",
-            "workflow_id": "wf-1",
-            "status": "finished",
-            "started_at": 10,
-            "agent_id": "agent-active",
-        }
-    ]
-
-    rs = client.delete("/api/v1/agents/cleanup/empty")
-    assert rs.status_code == 200
-    body = rs.json()
-    assert body["deleted_count"] == 1
-
-    # Verify agent-empty is deleted, and agent-active remains
-    agents = fake_db.agents
-    assert len(agents) == 1
-    assert agents[0]["agent_id"] == "agent-active"
-
-
-def test_dataflow_delegation_edge():
-    client, fake_db = build_client()
-
-    # case 1: task t2 has both source_agent_id and agent_id -> delegation edge should be created
-    fake_db.tasks = [
-        {
-            "task_id": "t1",
-            "workflow_id": "wf-1",
-            "status": "finished",
-            "started_at": 10,
-            "agent_id": "orchestrator",
-            "used": {"x": 1},
-        },
-        {
-            "task_id": "t2",
-            "workflow_id": "wf-1",
-            "status": "finished",
-            "started_at": 20,
-            "agent_id": "agent-1",
-            "source_agent_id": "orchestrator",
-            "used": {"y": 2},
-        },
-    ]
-    rs = client.get("/api/v1/workflows/wf-1/dataflow")
-    assert rs.status_code == 200
-    edges = rs.json()["edges"]
-    delegation_edges = [e for e in edges if e["relation"] == "delegation"]
-    assert len(delegation_edges) == 1
-    assert delegation_edges[0]["source"] == "task:t1"
-    assert delegation_edges[0]["target"] == "task:t2"
-
-    # case 2: task t2 has source_agent_id but NO agent_id -> delegation edge should NOT be created
-    fake_db.tasks = [
-        {
-            "task_id": "t1",
-            "workflow_id": "wf-1",
-            "status": "finished",
-            "started_at": 10,
-            "agent_id": "orchestrator",
-            "used": {"x": 1},
-        },
-        {
-            "task_id": "t2",
-            "workflow_id": "wf-1",
-            "status": "finished",
-            "started_at": 20,
-            "source_agent_id": "orchestrator",
-            "used": {"y": 2},
-        },
-    ]
-    rs = client.get("/api/v1/workflows/wf-1/dataflow")
-    assert rs.status_code == 200
-    edges = rs.json()["edges"]
-    delegation_edges = [e for e in edges if e["relation"] == "delegation"]
-    assert len(delegation_edges) == 0
diff --git a/tests/webservice/test_webservice_integration.py b/tests/webservice/test_webservice_integration.py
index 45fb29b0..d4e72417 100644
--- a/tests/webservice/test_webservice_integration.py
+++ b/tests/webservice/test_webservice_integration.py
@@ -14,9 +14,12 @@
 from flowcept import Flowcept, FlowceptTask, WorkflowObject
 from flowcept.commons.daos.docdb_dao.docdb_dao_base import DocumentDBDAO
 from flowcept.commons.flowcept_dataclasses.task_object import TaskObject
+from flowcept.commons.flowcept_logger import FlowceptLogger
 from flowcept.configs import MONGO_ENABLED
 from flowcept.webservice.main import create_app
 
+logger = FlowceptLogger()
+
 
 pytestmark = pytest.mark.skipif(not MONGO_ENABLED, reason="MongoDB is disabled")
 
@@ -30,6 +33,35 @@ def _wait_for(condition, timeout_sec: float = 20.0, interval_sec: float = 0.25)
     return False
 
 
+def test_webservice_static_contract_routes():
+    """Basic route contracts that do not need seeded provenance data."""
+    from flowcept.version import __version__
+
+    client = TestClient(create_app())
+
+    rs = client.get("/api/v1/info")
+    assert rs.status_code == 200
+    assert rs.json() == {"service": "flowcept", "version": __version__}
+
+    assert client.get("/api/v1/health/live").json() == {"status": "ok"}
+    assert client.get("/api/v1/health/ready").json()["status"] == "ready"
+
+    root = client.get("/")
+    assert root.status_code == 200
+    if root.headers["content-type"].startswith("application/json"):
+        assert root.json()["service"] == "flowcept-webservice"
+    else:
+        assert "text/html" in root.headers["content-type"]
+
+    openapi = client.get("/openapi.json")
+    assert openapi.status_code == 200
+    paths = openapi.json()["paths"]
+    assert "/api/v1/workflows/{workflow_id}/workflow_card" in paths
+    assert "/api/v1/workflows/{workflow_id}/provenance_card" not in paths
+    assert client.get("/docs").status_code == 200
+    assert client.get("/redoc").status_code == 200
+
+
 @pytest.fixture
 def db_cleanup(request):
     """Track ids a test inserts and delete them from MongoDB/LMDB afterwards, even on failure.
@@ -49,6 +81,7 @@ def db_cleanup(request):
             pass
 
     from flowcept.configs import LMDB_ENABLED
+
     initial_lmdb_agents = set()
     if LMDB_ENABLED and hasattr(dao, "_agents_db"):
         try:
@@ -104,6 +137,18 @@ def db_cleanup(request):
         DocumentDBDAO._instance.close()
 
 
+@pytest.fixture(scope="module")
+def mcp_server_instance():
+    """Run one MCP HTTP server per test process; reset context per test as needed."""
+    from flowcept.agents.mcp import mcp_server as agent_module
+
+    agent = agent_module.FlowceptMCPServer().start()
+    try:
+        yield agent
+    finally:
+        agent.stop()
+
+
 def test_webservice_end_to_end_with_flowcept_and_blob_apis(db_cleanup):
     """End-to-end: real workflow + blob objects, then exercise the read APIs."""
     if not Flowcept.services_alive():
@@ -118,20 +163,20 @@ def test_webservice_end_to_end_with_flowcept_and_blob_apis(db_cleanup):
             task.end(generated={"y": 2})
 
         workflow_id = Flowcept.current_workflow_id
-        generic_obj_id = Flowcept.db.save_or_update_object(
+        generic_obj_id = Flowcept.insert_or_update_object(
             object=b"generic-blob-payload",
             object_type="artifact",
             save_data_in_collection=True,
             custom_metadata={"kind": "generic"},
         )
 
-        dataset_obj_id = Flowcept.db.save_or_update_dataset(
+        dataset_obj_id = Flowcept.insert_or_update_dataset(
             object=b"dataset-blob-payload",
             save_data_in_collection=True,
             custom_metadata={"split": "train"},
         )
 
-        model_obj_id = Flowcept.db.save_or_update_ml_model(
+        model_obj_id = Flowcept.insert_or_update_ml_model(
             object=b"model-blob-payload",
             save_data_in_collection=True,
             custom_metadata={"framework": "sklearn"},
@@ -355,6 +400,10 @@ def test_webservice_campaigns_agents_stats_and_prov_card(db_cleanup):
     rs = client.get(f"/api/v1/workflows/{workflow_id}/workflow_card", params={"format": "pdf"})
     assert rs.status_code == 200
     assert rs.headers["content-type"].startswith("application/pdf")
+    assert rs.headers["content-disposition"] == f'attachment; filename="workflow_card_{workflow_id}.pdf"'
+
+    rs = client.get(f"/api/v1/workflows/non-existent-{uuid4()}/workflow_card", params={"format": "markdown"})
+    assert rs.status_code == 404
 
     # Cleanup singleton client handles for test isolation.
     if DocumentDBDAO._instance is not None:
@@ -376,7 +425,7 @@ def test_webservice_object_versioning_and_unified_query(db_cleanup):
         with FlowceptTask(activity_id="emit", used={"x": 1}) as task:
             task.end(generated={"y": 1})
         for version in range(2):
-            Flowcept.db.save_or_update_object(
+            Flowcept.insert_or_update_object(
                 object=f"payload-v{version}".encode(),
                 object_id=obj_id,
                 object_type="ml_model",
@@ -446,9 +495,36 @@ def test_webservice_object_versioning_and_unified_query(db_cleanup):
     assert rs.status_code == 200
     assert rs.json()["count"] >= 1
 
+    rs = client.get("/api/v1/tasks/")
+    assert rs.status_code == 404
+
+    rs = client.get("/api/v1/tasks", params={"filter_json": "[]"})
+    assert rs.status_code == 400
+
+    rs = client.post(
+        "/api/v1/tasks/query",
+        json={
+            "filter": {},
+            "projection": ["task_id", "workflow_id"],
+            "aggregation": [{"operator": "max", "field": "started_at"}],
+            "limit": 10,
+        },
+    )
+    assert rs.status_code == 400
+
     rs = client.post(f"/api/v1/workflows/{workflow_id}/reports/workflow-card/download")
     assert rs.status_code == 200
     assert rs.headers["content-type"].startswith("text/markdown")
+    assert rs.headers["content-disposition"] == f'attachment; filename="workflow_card_{workflow_id}.md"'
+
+    rs = client.get(f"/api/v1/workflows/non-existent-{uuid4()}")
+    assert rs.status_code == 404
+
+    rs = client.get("/api/v1/workflows", params={"filter_json": "not-json"})
+    assert rs.status_code == 400
+
+    rs = client.post(f"/api/v1/workflows/non-existent-{uuid4()}/reports/workflow-card/download")
+    assert rs.status_code == 404
 
     if DocumentDBDAO._instance is not None:
         DocumentDBDAO._instance.close()
@@ -740,13 +816,16 @@ def test_prov_tools_shared_core(db_cleanup):
     if not Flowcept.services_alive():
         pytest.skip("Flowcept services are not alive (MQ/KVDB/Mongo).")
 
-    from flowcept.agents.tools.prov_tools import (
+    from flowcept.agents.data_query_tools.db_query_tools import (
         get_task_summary,
         list_campaigns,
-        make_chart,
         query_tasks,
         query_workflows,
     )
+    from flowcept.agents.data_query_tools.dashboard_tools import (
+        make_chart,
+        get_dashboard,
+    )
 
     campaign_id = f"ws-campaign-{uuid4()}"
     db_cleanup["campaigns"].append(campaign_id)
@@ -785,6 +864,10 @@ def test_prov_tools_shared_core(db_cleanup):
     assert result.result["rows"]
     assert result.result["chart"]["chart_id"] == "chat-c1"
 
+    # get_dashboard returns 404 for unknown id (no real dashboard needed).
+    result = get_dashboard("nonexistent-dashboard-id")
+    assert result.code == 404
+
     # Disallowed filter operators are rejected by the shared core.
     result = query_tasks(filter={"$where": "1"}, limit=10)
     assert result.code >= 400
@@ -808,50 +891,253 @@ def test_chat_endpoint_unavailable_without_llm():
     assert "LLM" in rs.json()["detail"] or "llm" in rs.json()["detail"]
 
 
-def test_chat_endpoint_real_llm_tool_roundtrip(db_cleanup):
-    """Real LLM chat round-trip: the model must call a query tool and answer (env-gated)."""
-    from flowcept.commons.flowcept_logger import FlowceptLogger
+def _load_chat_query_cases():
+    """Load path-agnostic chat integration questions."""
+    import pathlib
+    import yaml
+
+    yaml_path = pathlib.Path(__file__).parent / "chat_query_tests.yaml"
+    cases = yaml.safe_load(yaml_path.read_text())
+    assert cases, "No chat query cases found in chat_query_tests.yaml"
+    return cases
+
+
+def _chat_response_score(actual: str, expected: str) -> float:
+    """Return a simple token-overlap score for path-agnostic chat answer checks."""
+    import re
+
+    def _tokens(text: str) -> set[str]:
+        tokens = set()
+        for raw_token in re.findall(r"[a-zA-Z0-9_.]+", text.lower()):
+            token = raw_token.strip(".")
+            tokens.add(token)
+            tokens.update(part for part in token.split(".") if part)
+        return {token for token in tokens if token}
+
+    actual_tokens = _tokens(actual)
+    expected_tokens = _tokens(expected)
+    if not expected_tokens:
+        return 1.0
+    return len(actual_tokens & expected_tokens) / len(expected_tokens)
+
+
+def _load_gridsearch_context_into_mcp(gridsearch_run_data, mcp_server_instance):
+    """Load workflow + task + object messages into MCP context for schema and runtime-memory paths."""
+    from flowcept.agents.mcp.mcp_client import run_tool
+    from flowcept.commons.utils import normalize_docs, sanitize_json_like
+    from flowcept.flowcept_api.db_api import DBAPI
+
+    tasks = gridsearch_run_data["tasks"] or []
+    assert tasks, "gridsearch_run_data contains no tasks."
+    workflow_id = gridsearch_run_data["workflow_id"]
+    workflow_obj = Flowcept.db.get_workflow_object(workflow_id)
+    assert workflow_obj is not None
+    # normalize_docs converts BSON ObjectId → str before sanitize_json_like, which does not handle ObjectId
+    objects = normalize_docs(DBAPI().blob_object_query(filter={"workflow_id": workflow_id}) or [])
+    messages = sanitize_json_like([workflow_obj.to_dict(), *tasks, *objects], mongo_safe_keys=True)
+    loaded_result = run_tool("load_buffer_messages", kwargs={"messages": messages})[0]
+    assert '"code": 201' in loaded_result
+    loaded = run_tool(
+        "run_df_query",
+        kwargs={"query": "result = len(df)", "plot": False, "context_kind": "tasks"},
+    )[0]
+    assert "Current df is empty or null" not in loaded
+
+
+@pytest.mark.llm
+@pytest.mark.parametrize(
+    ("tool_context", "expected_tool_names"),
+    [
+        (
+            "db",
+            {
+                "query_tasks",
+                "query_workflows",
+                "get_task_summary",
+                "list_campaigns",
+                "list_agents",
+                "highlight_lineage",
+                "make_chart",
+                "query_objects",
+            },
+        ),
+        (
+            "df",
+            {
+                "generate_result_df",
+                "generate_plot_code",
+                "extract_or_fix_python_code",
+                "get_workflow_context",
+                "run_df_query",
+                "list_agents",
+                "generate_objects_df",
+            },
+        ),
+    ],
+)
+def test_chat_endpoint_real_llm_queries(gridsearch_run_data, mcp_server_instance, tool_context, expected_tool_names):
+    """Every YAML chat question works through HTTP -> LangGraph -> MCP for both tool contexts."""
     from flowcept.configs import AGENT
 
     api_key = AGENT.get("api_key")
-    if not api_key or api_key == "?":
-        FlowceptLogger().warning("Skipping real-LLM chat test because agent.api_key is not set.")
+    if not api_key or api_key in ("?", "your-api-key-here"):
         pytest.skip("agent.api_key is not set.")
     if not AGENT.get("service_provider") or AGENT.get("service_provider") == "?":
-        FlowceptLogger().warning("Skipping real-LLM chat test because agent.service_provider is not set.")
         pytest.skip("agent.service_provider is not set.")
-    if not Flowcept.services_alive():
-        pytest.skip("Flowcept services are not alive (MQ/KVDB/Mongo).")
-
-    campaign_id = f"ws-campaign-{uuid4()}"
-    db_cleanup["campaigns"].append(campaign_id)
-    with Flowcept(campaign_id=campaign_id, workflow_name=f"ws-chat-wf-{uuid4()}"):
-        workflow_id = Flowcept.current_workflow_id
-        for i in range(3):
-            with FlowceptTask(activity_id="chat_seed", used={"i": i}) as task:
-                task.end(generated={"o": i})
 
-    ok = _wait_for(lambda: len(Flowcept.db.task_query(filter={"workflow_id": workflow_id}) or []) >= 3)
-    assert ok, "Timed out waiting for persisted tasks."
+    campaign_id = gridsearch_run_data["campaign_id"]
+    workflow_id = gridsearch_run_data["workflow_id"]
 
     app = create_app()
     client = TestClient(app)
+    _load_gridsearch_context_into_mcp(gridsearch_run_data, mcp_server_instance)
+
+    import os
+
+    case_id_filter = {c.strip() for c in os.environ.get("CHAT_TEST_CASE_IDS", "").split(",") if c.strip()}
+
+    for case in _load_chat_query_cases():
+        # Skip cases restricted to a different tool_context.
+        allowed_contexts = case.get("tool_contexts", ["db", "df"])
+        if tool_context not in allowed_contexts:
+            continue
+        # Skip cases not in the explicit case_id filter (when set).
+        case_id = case.get("case_id")
+        if case_id_filter and case_id not in case_id_filter:
+            continue
+
+        # Attempt each question up to MAX_ATTEMPTS times; retry on HTTP errors or
+        # score misses (transient rate-limiting can degrade LLM response quality).
+        MAX_ATTEMPTS = 2
+        rs = body = actual = tool_trace = score = None
+        for attempt in range(MAX_ATTEMPTS):
+            rs = client.post(
+                "/api/v1/chat",
+                json={
+                    "messages": [{"role": "user", "content": case["user_query"]}],
+                    "context": {"campaign_id": campaign_id, "workflow_id": workflow_id, "tool_context": tool_context},
+                    "stream": False,
+                },
+            )
+            if rs.status_code != 200:
+                if attempt < MAX_ATTEMPTS - 1:
+                    logger.warning(
+                        f"HTTP {rs.status_code} on attempt {attempt + 1} for {case['user_query']!r}; retrying."
+                    )
+                    continue
+                break
+            body = rs.json()
+            actual = body.get("message", "")
+            tool_trace = body.get("tool_trace") or []
+            score = _chat_response_score(actual, case["expected_response"])
+            if score >= case["score_threshold"]:
+                break
+            if attempt < MAX_ATTEMPTS - 1:
+                logger.warning(
+                    f"Score {score:.2f} < {case['score_threshold']:.2f} on attempt {attempt + 1} "
+                    f"for {case['user_query']!r}; retrying."
+                )
+        assert rs.status_code == 200, f"HTTP error for query: {case['user_query']!r}; body={rs.text}"
+        assert actual, f"Empty response for query: {case['user_query']!r}"
+        assert tool_trace, f"LLM made no tool call for query: {case['user_query']!r}"
+        assert score >= case["score_threshold"], (
+            f"Low answer score for {tool_context} query {case['user_query']!r}: "
+            f"score={score:.2f}, threshold={case['score_threshold']:.2f}\n"
+            f"Expected: {case['expected_response']}\nActual: {actual}"
+        )
+        assert any(
+            event.get("name") in expected_tool_names or event.get("tool_name") in expected_tool_names
+            for event in tool_trace
+        ), f"Expected MCP {tool_context} tool path for query {case['user_query']!r}; trace={tool_trace!r}"
+
+        # Optional structured-response assertions.
+        tool_expected = case.get("tool_expected")
+        if tool_expected == "make_chart":
+            cards = body.get("cards") or []
+            assert cards, f"Expected card event for make_chart in query {case['user_query']!r}"
+        elif tool_expected == "generate_plot_code":
+            assert any(
+                e.get("name") == "generate_plot_code" for e in tool_trace
+            ), f"Expected generate_plot_code in tool_trace for query {case['user_query']!r}; trace={tool_trace!r}"
+
+    if DocumentDBDAO._instance is not None:
+        DocumentDBDAO._instance.close()
+
+
+@pytest.mark.llm
+def test_chat_endpoint_records_ai_model_usage_tasks(gridsearch_run_data, db_cleanup, mcp_server_instance):
+    """A chat request creates a Flowcept workflow with AI model invocation provenance."""
+    from flowcept.agents.chat_orchestration.chat_orchestrator_service import CHAT_WORKFLOW_NAME
+    from flowcept.commons.vocabulary import PROV_AGENT
+
+    services = Flowcept.services_status()
+    if not all(v == "ok" for v in services.values()):
+        pytest.skip(f"Flowcept services are not alive: {services}")
+    if services.get("llm") != "ok":
+        pytest.skip(f"LLM provider is not configured or not alive: {services}")
+
+    workflow_id = gridsearch_run_data["workflow_id"]
+    before = {wf["workflow_id"] for wf in Flowcept.db.workflow_query(filter={"name": CHAT_WORKFLOW_NAME}) or []}
+
+    client = TestClient(create_app())
+    mcp_server_instance.reset_context()
     rs = client.post(
         "/api/v1/chat",
         json={
-            "messages": [{"role": "user", "content": "How many tasks ran in this workflow?"}],
+            "messages": [{"role": "user", "content": "How many tasks are in this workflow? Use the query_tasks tool."}],
             "context": {"workflow_id": workflow_id},
             "stream": False,
         },
     )
-    assert rs.status_code == 200
-    body = rs.json()
-    assert body["message"]
-    assert any("3" in str(part) for part in (body["message"], body.get("tool_trace", [])))
-    assert body.get("tool_trace"), "Expected the LLM to call at least one tool."
 
-    if DocumentDBDAO._instance is not None:
-        DocumentDBDAO._instance.close()
+    assert rs.status_code == 200, rs.text
+    assert rs.json().get("message")
+    assert rs.json().get("tool_trace")
+
+    def _new_chat_workflow_ids():
+        workflows = Flowcept.db.workflow_query(filter={"name": CHAT_WORKFLOW_NAME}) or []
+        return [wf["workflow_id"] for wf in workflows if wf["workflow_id"] not in before]
+
+    ok = _wait_for(lambda: len(_new_chat_workflow_ids()) >= 1)
+    assert ok, "Timed out waiting for chat workflow to be persisted."
+    chat_workflow_id = _new_chat_workflow_ids()[0]
+    db_cleanup["workflows"].append(chat_workflow_id)
+
+    ok = _wait_for(
+        lambda: len(
+            Flowcept.db.task_query(
+                filter={
+                    "workflow_id": chat_workflow_id,
+                    "subtype": PROV_AGENT.AI_MODEL_INVOCATION.value,
+                }
+            )
+            or []
+        )
+        >= 1
+    )
+    assert ok, "Timed out waiting for AI model invocation task to be persisted."
+
+    llm_tasks = (
+        Flowcept.db.task_query(
+            filter={"workflow_id": chat_workflow_id, "subtype": PROV_AGENT.AI_MODEL_INVOCATION.value},
+        )
+        or []
+    )
+    llm_task = llm_tasks[0]
+    assert llm_task["subtype"] == PROV_AGENT.AI_MODEL_INVOCATION.value
+    assert "telemetry_at_start" not in llm_task
+    assert "telemetry_at_end" not in llm_task
+    usage = llm_task["custom_metadata"]["llm_usage"]
+    assert usage["model"]
+    assert usage["input_chars"] > 0
+    assert usage["output_tokens"] is None or usage["output_tokens"] > 0
+    assert "provider_response_metadata" in usage
+    assert any(task["custom_metadata"]["llm_usage"]["output_chars"] > 0 for task in llm_tasks)
+
+    tool_tasks = Flowcept.db.task_query(
+        filter={"workflow_id": chat_workflow_id, "subtype": PROV_AGENT.AGENT_TOOL.value},
+    )
+    assert tool_tasks, "The forced DB query should record at least one agent tool task."
 
 
 def test_recursive_delete_workflow_and_campaign(db_cleanup):
@@ -869,13 +1155,13 @@ def test_recursive_delete_workflow_and_campaign(db_cleanup):
     with Flowcept(campaign_id=campaign_id, workflow_name=f"del-wf1-{uuid4()}"):
         with FlowceptTask(activity_id="del_task", used={"x": 1}) as t1:
             t1.end(generated={"y": 1})
-        Flowcept.db.save_or_update_object(object=b"blob1", object_type="artifact", save_data_in_collection=True)
+        Flowcept.insert_or_update_object(object=b"blob1", object_type="artifact", save_data_in_collection=True)
         wf1_id = Flowcept.current_workflow_id
 
     with Flowcept(campaign_id=campaign_id, workflow_name=f"del-wf2-{uuid4()}"):
         with FlowceptTask(activity_id="del_task", used={"x": 2}) as t2:
             t2.end(generated={"y": 2})
-        Flowcept.db.save_or_update_object(object=b"blob2", object_type="artifact", save_data_in_collection=True)
+        Flowcept.insert_or_update_object(object=b"blob2", object_type="artifact", save_data_in_collection=True)
         wf2_id = Flowcept.current_workflow_id
 
     assert wf1_id and wf2_id
@@ -1036,18 +1322,25 @@ def test_agent_telemetry_timeseries(db_cleanup):
     )
 
 
-def test_file_dashboard_store_roundtrip(tmp_path):
-    """FileDashboardStore (non-Mongo fallback) persists real JSON files."""
-    from flowcept.webservice.services.dashboard_store import FileDashboardStore
+def test_lmdb_dashboard_roundtrip(tmp_path, monkeypatch):
+    """LMDB dashboard CRUD persists and retrieves dashboard documents."""
+    from flowcept.configs import LMDB_ENABLED
 
-    store = FileDashboardStore(directory=str(tmp_path))
-    doc = {"dashboard_id": "d1", "name": "local", "charts": [], "layout": []}
-    assert store.save(doc)
-    assert store.get("d1")["name"] == "local"
-    assert any(d["dashboard_id"] == "d1" for d in store.list())
-    assert store.delete("d1")
-    assert store.get("d1") is None
-    assert store.delete("d1") is False
+    if not LMDB_ENABLED:
+        pytest.skip("LMDB not enabled.")
+    from flowcept.commons.daos.docdb_dao.lmdb_dao import LMDBDAO
+    import flowcept.configs as _fc_configs
+
+    monkeypatch.setitem(_fc_configs.LMDB_SETTINGS, "path", str(tmp_path / "lmdb"))
+    dao = LMDBDAO()
+    doc = {"dashboard_id": "d1", "dashboard_type": "common_workflow", "name": "local", "charts": [], "layout": []}
+    assert dao.save_dashboard(doc)
+    assert dao.get_dashboard("d1")["name"] == "local"
+    assert any(d["dashboard_id"] == "d1" for d in dao.list_dashboards())
+    assert dao.list_dashboards(filter={"dashboard_type": "common_workflow"})
+    assert dao.delete_dashboard("d1")
+    assert dao.get_dashboard("d1") is None
+    dao.close()
 
 
 def test_webservice_dataflow_graph(db_cleanup):
@@ -1073,6 +1366,7 @@ def test_webservice_dataflow_graph(db_cleanup):
 
     # Coarse level (default): per-task input/output chunk entities (PROV Entity vs Activity).
     from flowcept import configs
+
     original_max = getattr(configs, "WEBSERVER_MAX_LABEL_LENGTH", 30)
     try:
         configs.WEBSERVER_MAX_LABEL_LENGTH = 300
@@ -1114,7 +1408,8 @@ def test_webservice_dataflow_graph(db_cleanup):
     # submit_gridsearch_job outputs configs list under the key "configs" (not "arg_0")
     submit_node = next(n for n in task_nodes if n["label"] == "submit_gridsearch_job")
     submit_output_chunks = [
-        c for c in chunk_nodes
+        c
+        for c in chunk_nodes
         if any(e["source"] == submit_node["id"] and e["target"] == c["id"] for e in body["edges"])
     ]
     assert submit_output_chunks, "submit_gridsearch_job must have output chunks"
@@ -1147,7 +1442,7 @@ def test_webservice_dataflow_graph(db_cleanup):
 
 
 def _parse_sse(text: str) -> list:
-    """Parse a raw SSE response body into a list of {event, data} dicts.
+    r"""Parse a raw SSE response body into a list of {event, data} dicts.
 
     SSE separates events with \\r\\n\\r\\n (CRLF) or \\n\\n; normalise first.
     """
@@ -1161,9 +1456,9 @@ def _parse_sse(text: str) -> list:
         ev: dict = {}
         for line in block.split("\n"):
             if line.startswith("event:"):
-                ev["event"] = line[len("event:"):].strip()
+                ev["event"] = line[len("event:") :].strip()
             elif line.startswith("data:"):
-                raw = line[len("data:"):].strip()
+                raw = line[len("data:") :].strip()
                 try:
                     ev["data"] = json.loads(raw)
                 except json.JSONDecodeError:
@@ -1227,7 +1522,12 @@ def test_chat_highlight_lineage_sse(db_cleanup):
         rs = client.post(
             "/api/v1/chat",
             json={
-                "messages": [{"role": "user", "content": f"Highlight the lineage of task {step_a_id} in the dataflow graph using the highlight_lineage tool."}],
+                "messages": [
+                    {
+                        "role": "user",
+                        "content": f"Highlight the lineage of task {step_a_id} in the dataflow graph using the highlight_lineage tool.",
+                    }
+                ],
                 "context": {"workflow_id": wf_id},
                 "stream": True,
             },
@@ -1277,10 +1577,7 @@ def test_node_positions_endpoint(db_cleanup):
     # 2. Save positions
     pos_data = {
         "graph_type": "dataflow",
-        "positions": {
-            "node-1": {"x": 12.5, "y": 45.6},
-            "node-2": {"x": 78.9, "y": 101.2}
-        }
+        "positions": {"node-1": {"x": 12.5, "y": 45.6}, "node-2": {"x": 78.9, "y": 101.2}},
     }
     rs = client.post(f"/api/v1/workflows/{workflow_id}/node_positions", json=pos_data)
     assert rs.status_code == 200
@@ -1300,6 +1597,7 @@ def test_agents_without_tasks_are_not_returned(db_cleanup):
         pytest.skip("Flowcept services are not alive.")
 
     from flowcept.commons.flowcept_dataclasses.agent_object import AgentObject
+
     empty_agent_id = f"empty-agent-{uuid4()}"
 
     agent = AgentObject()
@@ -1314,4 +1612,3 @@ def test_agents_without_tasks_are_not_returned(db_cleanup):
     assert rs.status_code == 200
     items = rs.json()["items"]
     assert not any(item["agent_id"] == empty_agent_id for item in items)
-
diff --git a/ui/src/api/types.ts b/ui/src/api/types.ts
index 775ad3c0..4047d68e 100644
--- a/ui/src/api/types.ts
+++ b/ui/src/api/types.ts
@@ -77,6 +77,7 @@ export interface Campaign {
 export interface AgentSummary {
   agent_id: string;
   name?: string;
+  workflow_id?: string;
   registered_at?: number | string | null;
   task_count: number;
   activities: string[];
diff --git a/ui/src/components/charts/TelemetryChart.tsx b/ui/src/components/charts/TelemetryChart.tsx
index 5f00cc62..86c9b4eb 100644
--- a/ui/src/components/charts/TelemetryChart.tsx
+++ b/ui/src/components/charts/TelemetryChart.tsx
@@ -30,6 +30,15 @@ function normalize(vals: number[]): number[] {
   return vals.map((v) => (v - min) / (max - min));
 }
 
+export function TelemetryEmptyMessage() {
+  return (
+    <div className="text-fg-muted py-8 text-center text-xs">
+      Tasks were found but no telemetry values are present. Ensure{" "}
+      <code className="text-xs">telemetry_capture.enable: true</code> in your Flowcept settings.
+    </div>
+  );
+}
+
 export function TelemetryChart({ filter }: { filter: Record<string, unknown> }) {
   const [visibleMetrics, setVisibleMetrics] = useState<Set<string>>(new Set(METRIC_KEYS));
   const [selectedMetric, setSelectedMetric] = useState<string>(METRIC_KEYS[0]);
@@ -165,10 +174,7 @@ export function TelemetryChart({ filter }: { filter: Record<string, unknown> })
             No tasks matched this filter.
           </div>
         ) : (
-          <div className="text-fg-muted py-8 text-center text-xs">
-            Tasks were found but no telemetry values are present.
-            Ensure <code className="text-xs">telemetry_capture.enable: true</code> in your Flowcept settings.
-          </div>
+          <TelemetryEmptyMessage />
         )}
       </div>
 
diff --git a/ui/src/components/chat/ChatPanel.tsx b/ui/src/components/chat/ChatPanel.tsx
index 9e62cfdb..32fe0d42 100644
--- a/ui/src/components/chat/ChatPanel.tsx
+++ b/ui/src/components/chat/ChatPanel.tsx
@@ -6,6 +6,7 @@ import { fetchEventSource } from "@microsoft/fetch-event-source";
 import { Bot, ChevronDown, Eraser, Maximize2, Minimize2, Send, Wrench } from "lucide-react";
 import type { PanelImperativeHandle } from "react-resizable-panels";
 import { API_BASE } from "../../api/client";
+import { chatContext, type ChatToolContext } from "../../lib/chatContext";
 import { useChatStore, type ChatMsg } from "../../stores/chatStore";
 import { useHighlightStore } from "../../stores/highlightStore";
 import { EChart } from "../charts/EChart";
@@ -20,16 +21,6 @@ function contextHint(pathname: string): string {
   return "Queries are scoped to the page you're viewing.";
 }
 
-function routeContext(pathname: string): Record<string, string> {
-  const wf = pathname.match(/\/workflows\/([^/?]+)/);
-  if (wf) return { workflow_id: decodeURIComponent(wf[1]) };
-  const camp = pathname.match(/\/campaigns\/([^/?]+)/);
-  if (camp) return { campaign_id: decodeURIComponent(camp[1]) };
-  const dash = pathname.match(/\/dashboards\/([^/?]+)/);
-  if (dash) return { dashboard_id: decodeURIComponent(dash[1]) };
-  return {};
-}
-
 interface ChatPanelProps {
   panelHandle?: PanelImperativeHandle | null;
 }
@@ -38,6 +29,7 @@ export function ChatPanel({ panelHandle }: ChatPanelProps) {
   const { busy, messages, setBusy, push, appendPart, reset } = useChatStore();
   const [input, setInput] = useState("");
   const [isMaximized, setIsMaximized] = useState(false);
+  const [toolContext, setToolContext] = useState<ChatToolContext>("db");
   const pathname = useRouterState({ select: (s) => s.location.pathname });
   const scrollRef = useRef<HTMLDivElement>(null);
 
@@ -76,7 +68,7 @@ export function ChatPanel({ panelHandle }: ChatPanelProps) {
         headers: { "Content-Type": "application/json" },
         body: JSON.stringify({
           messages: apiMessages,
-          context: routeContext(pathname),
+          context: chatContext(pathname, toolContext),
           stream: true,
           allow_dashboard_edit: pathname.startsWith("/dashboards/"),
         }),
@@ -123,6 +115,15 @@ export function ChatPanel({ panelHandle }: ChatPanelProps) {
             <Bot size={15} /> Flowcept Agent
           </span>
           <div className="flex items-center gap-2">
+            <select
+              value={toolContext}
+              onChange={(e) => setToolContext(e.target.value as ChatToolContext)}
+              title="Choose whether chat queries persisted DB records or the streaming in-memory context"
+              className="bg-surface-2 rounded border border-border px-1.5 py-1 text-[11px] text-fg-muted outline-none hover:text-fg"
+            >
+              <option value="db">DB queries</option>
+              <option value="df">Runtime in-memory queries</option>
+            </select>
             <button onClick={reset} title="Clear conversation" className="text-fg-muted hover:text-fg">
               <Eraser size={14} />
             </button>
diff --git a/ui/src/lib/aiUsage.ts b/ui/src/lib/aiUsage.ts
new file mode 100644
index 00000000..c512eb3d
--- /dev/null
+++ b/ui/src/lib/aiUsage.ts
@@ -0,0 +1,75 @@
+import type { Task } from "../api/types";
+import { taskDuration } from "./format";
+
+export const AI_MODEL_INVOCATION_SUBTYPE = "ai_model_invocation";
+
+export interface AiModelUsageRow {
+  task_id: string;
+  model?: string;
+  input_tokens?: number;
+  output_tokens?: number;
+  total_tokens?: number;
+  input_tokens_label: string;
+  output_tokens_label: string;
+  total_tokens_label: string;
+  token_count_source?: string;
+  provider_request_id?: string;
+  prompt_preview: string;
+  response_preview: string;
+  duration: number | null;
+  started_at?: Task["started_at"];
+  task: Task;
+}
+
+function asRecord(value: unknown): Record<string, unknown> {
+  return value && typeof value === "object" && !Array.isArray(value) ? (value as Record<string, unknown>) : {};
+}
+
+function asNumber(value: unknown): number | undefined {
+  return typeof value === "number" ? value : undefined;
+}
+
+function asString(value: unknown): string | undefined {
+  return typeof value === "string" ? value : undefined;
+}
+
+function tokenLabel(value: number | undefined, source: string | undefined): string {
+  if (value === undefined) return "—";
+  return source === "estimated_from_chars" ? `≈${value}` : String(value);
+}
+
+function preview(value: unknown, maxLength = 140): string {
+  const text = typeof value === "string" ? value : value == null ? "" : JSON.stringify(value);
+  const compact = text.replace(/\s+/g, " ").trim();
+  return compact.length > maxLength ? `${compact.slice(0, maxLength)}…` : compact;
+}
+
+export function getAiModelUsageRows(tasks: Task[]): AiModelUsageRow[] {
+  return tasks
+    .filter((task) => task.subtype === AI_MODEL_INVOCATION_SUBTYPE)
+    .map((task) => {
+      const metadata = asRecord(task.custom_metadata);
+      const usage = asRecord(metadata.llm_usage);
+      const inputTokens = asNumber(usage.input_tokens ?? usage.llm_input_tokens);
+      const outputTokens = asNumber(usage.output_tokens ?? usage.llm_output_tokens);
+      const totalTokens = asNumber(usage.total_tokens ?? usage.llm_total_tokens);
+      const tokenCountSource = asString(usage.token_count_source);
+      return {
+        task_id: task.task_id,
+        model: asString(usage.model ?? usage.llm_model),
+        input_tokens: inputTokens,
+        output_tokens: outputTokens,
+        total_tokens: totalTokens,
+        input_tokens_label: tokenLabel(inputTokens, tokenCountSource),
+        output_tokens_label: tokenLabel(outputTokens, tokenCountSource),
+        total_tokens_label: tokenLabel(totalTokens, tokenCountSource),
+        token_count_source: tokenCountSource,
+        provider_request_id: asString(usage.provider_request_id),
+        prompt_preview: preview(asRecord(task.used).prompt),
+        response_preview: preview(asRecord(task.generated).response),
+        duration: taskDuration(task),
+        started_at: task.started_at,
+        task,
+      };
+    });
+}
diff --git a/ui/src/lib/chatContext.ts b/ui/src/lib/chatContext.ts
new file mode 100644
index 00000000..e89d8614
--- /dev/null
+++ b/ui/src/lib/chatContext.ts
@@ -0,0 +1,15 @@
+export type ChatToolContext = "db" | "df";
+
+export function routeContext(pathname: string): Record<string, string> {
+  const wf = pathname.match(/\/workflows\/([^/?]+)/);
+  if (wf) return { workflow_id: decodeURIComponent(wf[1]) };
+  const camp = pathname.match(/\/campaigns\/([^/?]+)/);
+  if (camp) return { campaign_id: decodeURIComponent(camp[1]) };
+  const dash = pathname.match(/\/dashboards\/([^/?]+)/);
+  if (dash) return { dashboard_id: decodeURIComponent(dash[1]) };
+  return {};
+}
+
+export function chatContext(pathname: string, toolContext: ChatToolContext = "db"): Record<string, string> {
+  return { ...routeContext(pathname), tool_context: toolContext };
+}
diff --git a/ui/src/routes/agents.index.tsx b/ui/src/routes/agents.index.tsx
index cff74958..6a169619 100644
--- a/ui/src/routes/agents.index.tsx
+++ b/ui/src/routes/agents.index.tsx
@@ -53,6 +53,11 @@ function AgentsPage() {
                   {a.agent_id}
                 </div>
               )}
+              {a.workflow_id && (
+                <div className="text-[10px] text-fg-muted mt-0.5 pl-6">
+                  workflow: <span className="font-mono">{a.workflow_id}</span>
+                </div>
+              )}
             </div>
             <div className="text-fg-muted mt-2 space-y-1 text-xs">
               <div>
diff --git a/ui/src/routes/workflows.$workflowId.tsx b/ui/src/routes/workflows.$workflowId.tsx
index 5016a338..bad47612 100644
--- a/ui/src/routes/workflows.$workflowId.tsx
+++ b/ui/src/routes/workflows.$workflowId.tsx
@@ -15,7 +15,7 @@ import { DataflowView } from "../components/charts/DataflowView";
 import { CoarseDataflowView } from "../components/charts/CoarseDataflowView";
 import { GanttChart } from "../components/charts/GanttChart";
 import { StatusStrip } from "../components/charts/StatusStrip";
-import { TelemetryChart } from "../components/charts/TelemetryChart";
+import { TelemetryChart, TelemetryEmptyMessage } from "../components/charts/TelemetryChart";
 import { JsonTree } from "../components/JsonTree";
 import { Markdown } from "../components/markdown/Markdown";
 import { DataTable } from "../components/tables/DataTable";
@@ -23,11 +23,12 @@ import { TaskDrawer } from "../components/tasks/TaskDrawer";
 import { ActivityDrawer } from "../components/tasks/ActivityDrawer";
 import { apiDelete, apiPost } from "../api/client";
 import { fmtDuration, fmtTs, shortId, statusColor, taskDuration, toEpochSec, type TimeValue } from "../lib/format";
+import { getAiModelUsageRows, type AiModelUsageRow } from "../lib/aiUsage";
 import { ChartRenderer } from "../components/dashboard/ChartRenderer";
 import { chart, dashboardSpec, type DashboardSpec } from "../components/dashboard/spec";
 import { useInspectorStore } from "../stores/inspectorStore";
 
-const TABS = ["tasks", "agents", "graph", "timeline", "telemetry", "card", "artifacts", "dashboard", "raw"] as const;
+const TABS = ["tasks", "agents", "ai", "graph", "timeline", "telemetry", "card", "artifacts", "dashboard", "raw"] as const;
 
 export const Route = createFileRoute("/workflows/$workflowId")({
   component: WorkflowDetail,
@@ -279,7 +280,7 @@ function WorkflowDetail() {
                 search.tab === t ? "border-accent text-fg border-b-2" : "text-fg-muted hover:text-fg"
               }`}
             >
-              {t === "card" ? "Workflow Card" : t === "dashboard" ? "Dashboard" : t === "graph" ? "Graphs" : t}
+              {t === "card" ? "Workflow Card" : t === "dashboard" ? "Dashboard" : t === "graph" ? "Graphs" : t === "ai" ? "AI Model Usage" : t}
             </button>
           ))}
         </div>
@@ -327,6 +328,13 @@ function WorkflowDetail() {
 
       {search.tab === "agents" && <WorkflowAgentsTab workflowId={workflowId} />}
 
+      {search.tab === "ai" && (
+        <AiModelUsageTab
+          tasks={taskItems}
+          onTaskClick={(taskId) => navigate({ search: (s) => ({ ...s, task: taskId }) })}
+        />
+      )}
+
       {search.tab === "graph" && <GraphTab tasks={taskItems} workflowId={workflowId} />}
 
       {search.tab === "timeline" && (
@@ -341,7 +349,7 @@ function WorkflowDetail() {
       {search.tab === "telemetry" && (
         <div className="card p-4">
           {taskItems.length > 0 && !taskItems.some((t) => t.telemetry_at_start || t.telemetry_at_end) ? (
-            <p className="text-fg-muted text-sm">Telemetry capture was disabled for this workflow.</p>
+            <TelemetryEmptyMessage />
           ) : (
             <TelemetryChart filter={{ workflow_id: workflowId }} />
           )}
@@ -447,6 +455,115 @@ function ArtifactsTab({ workflowId }: { workflowId: string }) {
   );
 }
 
+const AI_USAGE_COLS: ColumnDef<AiModelUsageRow, any>[] = [
+  {
+    id: "status",
+    header: "Status",
+    size: 90,
+    cell: ({ row }) => {
+      const status = row.original.task.status ?? "—";
+      return (
+        <span className="inline-flex items-center gap-2">
+          <span className="inline-block h-2 w-2 rounded-full" style={{ background: statusColor(status) }} />
+          <span>{status}</span>
+        </span>
+      );
+    },
+  },
+  {
+    id: "model",
+    header: "Model",
+    size: 180,
+    cell: ({ row }) => row.original.model ?? "—",
+  },
+  {
+    id: "total_tokens",
+    header: "Tokens",
+    size: 90,
+    cell: ({ row }) => row.original.total_tokens_label,
+  },
+  {
+    id: "input_output_tokens",
+    header: "In / Out",
+    size: 100,
+    cell: ({ row }) => `${row.original.input_tokens_label} / ${row.original.output_tokens_label}`,
+  },
+  {
+    id: "prompt",
+    header: "Prompt",
+    size: 220,
+    cell: ({ row }) => <span title="Click row to inspect the full prompt">{row.original.prompt_preview || "—"}</span>,
+  },
+  {
+    id: "response",
+    header: "Response",
+    size: 220,
+    cell: ({ row }) => <span title="Click row to inspect the full response">{row.original.response_preview || "—"}</span>,
+  },
+  {
+    id: "task_id",
+    header: "Task",
+    size: 130,
+    cell: ({ row }) => <span className="font-mono text-accent">{shortId(row.original.task_id, 12)}</span>,
+  },
+  {
+    id: "started_at",
+    header: "Started",
+    size: 150,
+    cell: ({ row }) => fmtTs(row.original.started_at),
+  },
+  {
+    id: "duration",
+    header: "Duration",
+    size: 100,
+    cell: ({ row }) => fmtDuration(row.original.duration),
+  },
+];
+
+function AiModelUsageTab({ tasks, onTaskClick }: { tasks: Task[]; onTaskClick: (taskId: string) => void }) {
+  const rows = useMemo(() => getAiModelUsageRows(tasks), [tasks]);
+  const totals = useMemo(
+    () => ({
+      calls: rows.length,
+      input_tokens: rows.reduce((sum, row) => sum + (row.input_tokens ?? 0), 0),
+      output_tokens: rows.reduce((sum, row) => sum + (row.output_tokens ?? 0), 0),
+      total_tokens: rows.reduce((sum, row) => sum + (row.total_tokens ?? 0), 0),
+    }),
+    [rows],
+  );
+
+  if (!rows.length) {
+    return <div className="card p-4 text-sm text-fg-muted">No AI model invocation tasks found for this workflow.</div>;
+  }
+
+  return (
+    <div className="space-y-3">
+      <div className="grid gap-3 sm:grid-cols-4">
+        <MetricCard label="LLM calls" value={String(totals.calls)} />
+        <MetricCard label="input tokens" value={String(totals.input_tokens)} />
+        <MetricCard label="output tokens" value={String(totals.output_tokens)} />
+        <MetricCard label="total tokens" value={String(totals.total_tokens)} />
+      </div>
+      <div className="card p-4">
+        <DataTable data={rows} columns={AI_USAGE_COLS} onRowClick={(row) => onTaskClick(row.task_id)} />
+      </div>
+      <div className="card p-4">
+        <div className="mb-2 text-xs font-semibold uppercase tracking-wide text-fg-muted">Raw AI model invocation tasks</div>
+        <JsonTree data={rows.map((row) => row.task)} name="ai_model_invocations" />
+      </div>
+    </div>
+  );
+}
+
+function MetricCard({ label, value }: { label: string; value: string }) {
+  return (
+    <div className="card p-4">
+      <div className="text-xs uppercase tracking-wide text-fg-muted">{label}</div>
+      <div className="mt-1 text-lg font-semibold">{value}</div>
+    </div>
+  );
+}
+
 function GraphTab({ tasks, workflowId }: { tasks: Task[]; workflowId: string }) {
   const [graphType, setGraphType] = useState<"activity" | "task" | "provenance">("activity");
   const [provMode, setProvMode] = useState<"coarse" | "fine">("coarse");
diff --git a/ui/tests/aiUsage.test.ts b/ui/tests/aiUsage.test.ts
new file mode 100644
index 00000000..d1e39df8
--- /dev/null
+++ b/ui/tests/aiUsage.test.ts
@@ -0,0 +1,69 @@
+import { describe, expect, it } from "vitest";
+import { getAiModelUsageRows } from "../src/lib/aiUsage";
+import type { Task } from "../src/api/types";
+
+describe("getAiModelUsageRows", () => {
+  it("extracts normalized LLM usage rows from ai_model_invocation tasks", () => {
+    const tasks: Task[] = [
+      {
+        task_id: "task-1",
+        subtype: "ai_model_invocation",
+        activity_id: "llm_interaction",
+        started_at: 10,
+        ended_at: 12,
+        custom_metadata: {
+          llm_usage: {
+            model: "gpt-oss-120b",
+            input_tokens: 100,
+            output_tokens: 12,
+            total_tokens: 112,
+            token_count_source: "provider",
+            finish_reason: "stop",
+            provider_request_id: "chatcmpl-1",
+          },
+        },
+        used: { prompt: "What happened in this workflow?".repeat(10) },
+        generated: { response: "The workflow finished successfully.".repeat(10) },
+      },
+      { task_id: "task-2", subtype: "agent_tool" },
+    ];
+
+    const rows = getAiModelUsageRows(tasks);
+
+    expect(rows).toHaveLength(1);
+    expect(rows[0]).toMatchObject({
+      task_id: "task-1",
+      model: "gpt-oss-120b",
+      input_tokens: 100,
+      output_tokens: 12,
+      total_tokens: 112,
+      provider_request_id: "chatcmpl-1",
+      token_count_source: "provider",
+    });
+    expect(rows[0].prompt_preview.length).toBeLessThanOrEqual(143);
+    expect(rows[0].response_preview.length).toBeLessThanOrEqual(143);
+    expect(rows[0].duration).toBe(2);
+  });
+
+  it("marks estimated token counts when providers do not report usage", () => {
+    const rows = getAiModelUsageRows([
+      {
+        task_id: "task-1",
+        subtype: "ai_model_invocation",
+        custom_metadata: {
+          llm_usage: {
+            model: "local-model",
+            input_tokens: 10,
+            output_tokens: 5,
+            total_tokens: 15,
+            token_count_source: "estimated_from_chars",
+          },
+        },
+      },
+    ]);
+
+    expect(rows[0].input_tokens_label).toBe("≈10");
+    expect(rows[0].output_tokens_label).toBe("≈5");
+    expect(rows[0].total_tokens_label).toBe("≈15");
+  });
+});
diff --git a/ui/tests/chatContext.test.ts b/ui/tests/chatContext.test.ts
new file mode 100644
index 00000000..07051703
--- /dev/null
+++ b/ui/tests/chatContext.test.ts
@@ -0,0 +1,16 @@
+import { describe, expect, it } from "vitest";
+import { chatContext, routeContext } from "../src/lib/chatContext";
+
+describe("chatContext", () => {
+  it("defaults chat tool context to db", () => {
+    expect(chatContext("/workflows/wf-1")).toEqual({ workflow_id: "wf-1", tool_context: "db" });
+  });
+
+  it("can request streaming in-memory queries with df context", () => {
+    expect(chatContext("/campaigns/camp-1", "df")).toEqual({ campaign_id: "camp-1", tool_context: "df" });
+  });
+
+  it("keeps route context reusable without tool context", () => {
+    expect(routeContext("/dashboards/main")).toEqual({ dashboard_id: "main" });
+  });
+});