diff --git a/frontend/src/generated/core/api.schemas.ts b/frontend/src/generated/core/api.schemas.ts index 165e42ff1e50..0355024a3771 100644 --- a/frontend/src/generated/core/api.schemas.ts +++ b/frontend/src/generated/core/api.schemas.ts @@ -1085,9 +1085,10 @@ export const TargetTypeEnumApi = { * `monthly` - Monthly * `yearly` - Yearly */ -export type FrequencyEnumApi = (typeof FrequencyEnumApi)[keyof typeof FrequencyEnumApi] +export type SubscriptionFrequencyEnumApi = + (typeof SubscriptionFrequencyEnumApi)[keyof typeof SubscriptionFrequencyEnumApi] -export const FrequencyEnumApi = { +export const SubscriptionFrequencyEnumApi = { Daily: 'daily', Weekly: 'weekly', Monthly: 'monthly', @@ -1131,7 +1132,7 @@ export interface SubscriptionApi { dashboard_export_insights?: number[] target_type: TargetTypeEnumApi target_value: string - frequency: FrequencyEnumApi + frequency: SubscriptionFrequencyEnumApi /** * @minimum -2147483648 * @maximum 2147483647 @@ -1196,7 +1197,7 @@ export interface PatchedSubscriptionApi { dashboard_export_insights?: number[] target_type?: TargetTypeEnumApi target_value?: string - frequency?: FrequencyEnumApi + frequency?: SubscriptionFrequencyEnumApi /** * @minimum -2147483648 * @maximum 2147483647 diff --git a/posthog/templates/email/evaluation_report.html b/posthog/templates/email/evaluation_report.html new file mode 100644 index 000000000000..16424875cf08 --- /dev/null +++ b/posthog/templates/email/evaluation_report.html @@ -0,0 +1,19 @@ +{% extends "email/base.html" %} + +{% block heading %}{% endblock %} + +{% block section %} + +{% comment %} +report_body is markdown rendered by markdown-it-py with html=False, so raw HTML in +the markdown source is escaped. Content originates from our own LLM agent via +structured tool outputs (not user input), and is delivered via email only. +{% endcomment %} +{# nosemgrep: python.flask.security.xss.audit.template-unescaped-with-safe.template-unescaped-with-safe #} +{{ report_body|safe }} + +
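+{% comment %}
+Illustrative only (assumed upstream, not part of this template): report_body is
+rendered by markdown-it-py roughly as
+  MarkdownIt("commonmark", {"html": False}).render(report_markdown)
+so any raw HTML in the markdown source arrives here already escaped.
+{% endcomment %}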
+ +{% endblock %} diff --git a/posthog/temporal/llm_analytics/__init__.py b/posthog/temporal/llm_analytics/__init__.py index 91a8d754ce81..15dd98396ef8 100644 --- a/posthog/temporal/llm_analytics/__init__.py +++ b/posthog/temporal/llm_analytics/__init__.py @@ -1,3 +1,17 @@ +from posthog.temporal.llm_analytics.eval_reports.activities import ( + deliver_report_activity, + fetch_count_triggered_eval_reports_activity, + fetch_due_eval_reports_activity, + prepare_report_context_activity, + run_eval_report_agent_activity, + store_report_run_activity, + update_next_delivery_date_activity, +) +from posthog.temporal.llm_analytics.eval_reports.workflow import ( + CheckCountTriggeredReportsWorkflow, + GenerateAndDeliverEvalReportWorkflow, + ScheduleAllEvalReportsWorkflow, +) from posthog.temporal.llm_analytics.metrics import EvalsMetricsInterceptor # noqa: F401 from posthog.temporal.llm_analytics.run_evaluation import ( RunEvaluationWorkflow, @@ -64,6 +78,10 @@ BatchTraceSummarizationCoordinatorWorkflow, DailyTraceClusteringWorkflow, TraceClusteringCoordinatorWorkflow, + # Evaluation reports + ScheduleAllEvalReportsWorkflow, + CheckCountTriggeredReportsWorkflow, + GenerateAndDeliverEvalReportWorkflow, # Keep sentiment workflow registered here temporarily so orphaned workflows on general-purpose queue can complete ClassifySentimentWorkflow, # Keep eval workflow registered here temporarily so orphaned workflows on general-purpose queue can complete @@ -84,6 +102,14 @@ perform_clustering_compute_activity, generate_cluster_labels_activity, emit_cluster_events_activity, + # Evaluation report activities + fetch_due_eval_reports_activity, + fetch_count_triggered_eval_reports_activity, + prepare_report_context_activity, + run_eval_report_agent_activity, + store_report_run_activity, + deliver_report_activity, + update_next_delivery_date_activity, # Keep sentiment activity registered here temporarily so orphaned workflows on general-purpose queue can complete classify_sentiment_activity, # Keep eval activities registered here temporarily so orphaned workflows on general-purpose queue can complete diff --git a/posthog/temporal/llm_analytics/eval_reports/activities.py b/posthog/temporal/llm_analytics/eval_reports/activities.py new file mode 100644 index 000000000000..6edcab3bd04d --- /dev/null +++ b/posthog/temporal/llm_analytics/eval_reports/activities.py @@ -0,0 +1,397 @@ +"""Activities for evaluation reports workflow.""" + +import datetime as dt + +import temporalio.activity +from structlog import get_logger + +from posthog.sync import database_sync_to_async +from posthog.temporal.common.heartbeat import Heartbeater +from posthog.temporal.llm_analytics.eval_reports.types import ( + CheckCountTriggeredReportsWorkflowInputs, + DeliverReportInput, + FetchDueEvalReportsOutput, + PrepareReportContextInput, + PrepareReportContextOutput, + RunEvalReportAgentInput, + RunEvalReportAgentOutput, + ScheduleAllEvalReportsWorkflowInputs, + StoreReportRunInput, + StoreReportRunOutput, + UpdateNextDeliveryDateInput, +) + +logger = get_logger(__name__) + + +@temporalio.activity.defn +async def fetch_due_eval_reports_activity( + inputs: ScheduleAllEvalReportsWorkflowInputs, +) -> FetchDueEvalReportsOutput: + """Return a list of time-based evaluation report IDs that are due for delivery.""" + now_with_buffer = dt.datetime.now(tz=dt.UTC) + dt.timedelta(minutes=inputs.buffer_minutes) + + @database_sync_to_async(thread_sensitive=False) + def get_report_ids() -> list[str]: + from 
products.llm_analytics.backend.models.evaluation_reports import EvaluationReport + + return [ + str(pk) + for pk in EvaluationReport.objects.filter( + next_delivery_date__lte=now_with_buffer, + enabled=True, + deleted=False, + ) + .exclude(frequency=EvaluationReport.Frequency.EVERY_N) + .values_list("id", flat=True) + ] + + report_ids = await get_report_ids() + await logger.ainfo(f"Found {len(report_ids)} due evaluation reports") + return FetchDueEvalReportsOutput(report_ids=report_ids) + + +@temporalio.activity.defn +async def fetch_count_triggered_eval_reports_activity( + inputs: CheckCountTriggeredReportsWorkflowInputs, +) -> FetchDueEvalReportsOutput: + """Check count-based reports and return those whose eval count exceeds the threshold.""" + + @database_sync_to_async(thread_sensitive=False) + def check_reports() -> list[str]: + from posthog.hogql.parser import parse_select + from posthog.hogql.query import execute_hogql_query + + from posthog.models import Team + + from products.llm_analytics.backend.models.evaluation_reports import EvaluationReport, EvaluationReportRun + + now = dt.datetime.now(tz=dt.UTC) + due: list[str] = [] + + reports = EvaluationReport.objects.filter( + frequency=EvaluationReport.Frequency.EVERY_N, + enabled=True, + deleted=False, + trigger_threshold__isnull=False, + ).select_related("evaluation") + + for report in reports: + # Cooldown: skip if last delivery was too recent + if report.last_delivered_at: + cooldown_delta = dt.timedelta(minutes=report.cooldown_minutes) + if (now - report.last_delivered_at) < cooldown_delta: + continue + + # Daily cap: skip if too many runs today + today_start = now.replace(hour=0, minute=0, second=0, microsecond=0) + today_runs = EvaluationReportRun.objects.filter( + report=report, + created_at__gte=today_start, + ).count() + if today_runs >= report.daily_run_cap: + continue + + # Count evals since last delivery (or start_date if first run) + since = report.last_delivered_at or report.start_date + since_str = since.strftime("%Y-%m-%d %H:%M:%S.%f") + + team = Team.objects.get(id=report.team_id) + query = parse_select( + f""" + SELECT count() as total + FROM events + WHERE event = '$ai_evaluation' + AND properties.$ai_evaluation_id = '{report.evaluation_id}' + AND timestamp >= '{since_str}' + """ + ) + result = execute_hogql_query(query=query, team=team) + rows = result.results or [] + count = rows[0][0] if rows else 0 + + if count >= report.trigger_threshold: + due.append(str(report.id)) + + return due + + report_ids = await check_reports() + await logger.ainfo(f"Found {len(report_ids)} count-triggered evaluation reports ready") + return FetchDueEvalReportsOutput(report_ids=report_ids) + + +def _find_nth_eval_timestamp( + team_id: int, + evaluation_id: str, + n: int, + before: dt.datetime, +) -> dt.datetime: + """Find the timestamp of the Nth-most-recent eval result. + + Returns the timestamp so the report window covers exactly the last N evals. + Falls back to 24h ago if there are fewer than N results. 
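+
+    Worked example (illustrative): with n=3 and eval timestamps t1 < t2 < t3 <
+    t4 < t5, all before `before`, the inner query keeps {t5, t4, t3} and min()
+    returns t3, so the window [t3, before] covers exactly the last three evals.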
+ """ + from posthog.hogql.parser import parse_select + from posthog.hogql.query import execute_hogql_query + + from posthog.models import Team + + team = Team.objects.get(id=team_id) + before_str = before.strftime("%Y-%m-%d %H:%M:%S.%f") + query = parse_select( + f""" + SELECT min(ts) FROM ( + SELECT timestamp as ts + FROM events + WHERE event = '$ai_evaluation' + AND properties.$ai_evaluation_id = '{evaluation_id}' + AND timestamp <= '{before_str}' + ORDER BY timestamp DESC + LIMIT {int(n)} + ) + """ + ) + result = execute_hogql_query(query=query, team=team) + rows = result.results or [] + if rows and rows[0][0] is not None: + ts = rows[0][0] + if isinstance(ts, dt.datetime): + if ts.tzinfo is None: + return ts.replace(tzinfo=dt.UTC) + return ts + # Fallback: 24h ago + return before - dt.timedelta(days=1) + + +@temporalio.activity.defn +async def prepare_report_context_activity( + inputs: PrepareReportContextInput, +) -> PrepareReportContextOutput: + """Load evaluation from Postgres and calculate time windows.""" + + @database_sync_to_async(thread_sensitive=False) + def prepare() -> PrepareReportContextOutput: + from products.llm_analytics.backend.models.evaluation_reports import EvaluationReport + + report = EvaluationReport.objects.select_related("evaluation").get(id=inputs.report_id) + evaluation = report.evaluation + now = dt.datetime.now(tz=dt.UTC) + + # Period end is now, period start depends on context + period_end = now + freq_deltas = { + "hourly": dt.timedelta(hours=1), + "daily": dt.timedelta(days=1), + "weekly": dt.timedelta(weeks=1), + } + + if inputs.manual: + # Manual "Generate now": always look back one full frequency period + # so the user always gets a meaningful report regardless of last delivery. + if report.frequency == "every_n": + # For count-triggered reports, sample the most recent N evals so + # "Generate now" always produces something useful even if the + # threshold hasn't been crossed yet. + period_start = _find_nth_eval_timestamp( + team_id=report.team_id, + evaluation_id=str(evaluation.id), + n=report.trigger_threshold or 100, + before=now, + ) + else: + period_start = now - freq_deltas.get(report.frequency, dt.timedelta(days=1)) + elif report.last_delivered_at: + period_start = report.last_delivered_at + else: + # First run: look back one period (or to start_date for count-triggered) + if report.frequency == "every_n": + period_start = report.start_date + else: + period_start = now - freq_deltas.get(report.frequency, dt.timedelta(days=1)) + + # Previous period for comparison (same duration, shifted back) + period_duration = period_end - period_start + previous_period_start = period_start - period_duration + + # `report_prompt_guidance` is a per-report TextField that lets users steer + # the agent. Added in migration 0024 (Commit 2 of the v2 schema refactor). + # `getattr` with fallback keeps this activity compatible with the unmigrated + # database state during Commit 1 local testing. 
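+        # For example (hypothetical pre-migration state), the lookup simply
+        # falls back to "", so the agent gets no extra steering rather than
+        # an AttributeError.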
+ guidance = getattr(report, "report_prompt_guidance", "") or "" + + return PrepareReportContextOutput( + report_id=str(report.id), + team_id=report.team_id, + evaluation_id=str(evaluation.id), + evaluation_name=evaluation.name, + evaluation_description=evaluation.description or "", + evaluation_prompt=evaluation.evaluation_config.get("prompt", ""), + evaluation_type=evaluation.evaluation_type, + period_start=period_start.isoformat(), + period_end=period_end.isoformat(), + previous_period_start=previous_period_start.isoformat(), + report_prompt_guidance=guidance, + ) + + return await prepare() + + +@temporalio.activity.defn +async def run_eval_report_agent_activity( + inputs: RunEvalReportAgentInput, +) -> RunEvalReportAgentOutput: + """Run the LLM report agent.""" + async with Heartbeater(): + await logger.ainfo( + "Running eval report agent", + report_id=inputs.report_id, + evaluation_id=inputs.evaluation_id, + ) + + @database_sync_to_async(thread_sensitive=False) + def run_agent(): + from posthog.temporal.llm_analytics.eval_reports.report_agent import run_eval_report_agent + + return run_eval_report_agent( + team_id=inputs.team_id, + evaluation_id=inputs.evaluation_id, + evaluation_name=inputs.evaluation_name, + evaluation_description=inputs.evaluation_description, + evaluation_prompt=inputs.evaluation_prompt, + evaluation_type=inputs.evaluation_type, + period_start=inputs.period_start, + period_end=inputs.period_end, + previous_period_start=inputs.previous_period_start, + report_prompt_guidance=inputs.report_prompt_guidance, + ) + + content = await run_agent() + + return RunEvalReportAgentOutput( + report_id=inputs.report_id, + content=content.to_dict(), + period_start=inputs.period_start, + period_end=inputs.period_end, + ) + + +@temporalio.activity.defn +async def store_report_run_activity( + inputs: StoreReportRunInput, +) -> StoreReportRunOutput: + """Save the generated report as an EvaluationReportRun and emit a $ai_evaluation_report event.""" + + @database_sync_to_async(thread_sensitive=False) + def store() -> str: + import uuid + + from posthog.models.event.util import create_event + from posthog.models.team import Team + + from products.llm_analytics.backend.models.evaluation_reports import EvaluationReportRun + + # Mirror content.metrics into the legacy `metadata` JSONField so existing + # consumers that read from it (e.g. the UI's run preview before Commit 2's + # frontend refresh) still work. 
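+        # Illustrative shape (assumed, not validated here):
+        #   content = {"title": ..., "sections": [...], "citations": [...],
+        #              "metrics": {"pass_rate": 0.92, "total_runs": 120, ...}}
+        # so the legacy `metadata` field below carries just the metrics block.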
+ content = inputs.content or {} + metrics = content.get("metrics", {}) or {} + + run = EvaluationReportRun.objects.create( + report_id=inputs.report_id, + content=content, + metadata=metrics, + period_start=inputs.period_start, + period_end=inputs.period_end, + ) + + # Emit $ai_evaluation_report event to ClickHouse + team = Team.objects.get(id=inputs.team_id) + + # Collect citations from structured content (v2), not from per-section lists + citations = content.get("citations", []) or [] + all_referenced_ids = [c.get("generation_id", "") for c in citations if c.get("generation_id")] + + properties: dict = { + "$ai_evaluation_id": inputs.evaluation_id, + "$ai_evaluation_report_id": str(run.report_id), + "$ai_evaluation_report_run_id": str(run.id), + "$ai_report_title": content.get("title", ""), + "$ai_report_period_start": inputs.period_start, + "$ai_report_period_end": inputs.period_end, + # Metrics for querying/alerting (flattened from content.metrics) + "$ai_report_total_runs": metrics.get("total_runs", 0), + "$ai_report_pass_count": metrics.get("pass_count", 0), + "$ai_report_fail_count": metrics.get("fail_count", 0), + "$ai_report_na_count": metrics.get("na_count", 0), + "$ai_report_pass_rate": metrics.get("pass_rate", 0.0), + "$ai_report_previous_pass_rate": metrics.get("previous_pass_rate"), + "$ai_report_previous_total_runs": metrics.get("previous_total_runs"), + # Structured content + citations for downstream consumption + "$ai_report_content": content, + "$ai_report_citations": citations, + "$ai_report_referenced_generation_ids": all_referenced_ids, + "$ai_report_section_count": len(content.get("sections", [])), + } + + create_event( + event_uuid=uuid.uuid4(), + event="$ai_evaluation_report", + team=team, + distinct_id=f"eval_report_{inputs.team_id}", + properties=properties, + ) + + return str(run.id) + + run_id = await store() + return StoreReportRunOutput(report_run_id=run_id) + + +@temporalio.activity.defn +async def deliver_report_activity( + inputs: DeliverReportInput, +) -> None: + """Deliver the report via configured delivery targets (email/Slack).""" + async with Heartbeater(): + await logger.ainfo( + "Delivering evaluation report", + report_id=inputs.report_id, + report_run_id=inputs.report_run_id, + ) + + @database_sync_to_async(thread_sensitive=False) + def deliver(): + from posthog.temporal.llm_analytics.eval_reports.delivery import deliver_report + + deliver_report( + report_id=inputs.report_id, + report_run_id=inputs.report_run_id, + ) + + await deliver() + + +@temporalio.activity.defn +async def update_next_delivery_date_activity( + inputs: UpdateNextDeliveryDateInput, +) -> None: + """Update the report's next_delivery_date and last_delivered_at. + + last_delivered_at is set to the report's period_end (captured at the start of + this run) rather than the current wall-clock time. This guarantees that the + next run's period_start picks up exactly where this run's period_end left off, + so any time spent generating/delivering does not create a coverage gap. 
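+
+    Example (illustrative): a daily report whose window was [Mon 00:00, Tue 00:00)
+    records last_delivered_at = Tue 00:00 even if delivery only finishes at
+    Tue 00:07; the next run's window then opens at exactly Tue 00:00.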
+ """ + + @database_sync_to_async(thread_sensitive=False) + def update(): + import datetime as dt_mod + + from products.llm_analytics.backend.models.evaluation_reports import EvaluationReport + + report = EvaluationReport.objects.get(id=inputs.report_id) + report.last_delivered_at = dt_mod.datetime.fromisoformat(inputs.period_end) + report.set_next_delivery_date() + report.save(update_fields=["last_delivered_at", "next_delivery_date"]) + + await update() diff --git a/posthog/temporal/llm_analytics/eval_reports/delivery.py b/posthog/temporal/llm_analytics/eval_reports/delivery.py new file mode 100644 index 000000000000..6a3655117066 --- /dev/null +++ b/posthog/temporal/llm_analytics/eval_reports/delivery.py @@ -0,0 +1,427 @@ +"""Delivery logic for evaluation reports (email and Slack). + +Content shape: `EvalReportContent` has a `title`, 1-6 titled `sections`, a list +of structured `citations`, and a `metrics` block. The renderers below build the +email HTML body and Slack Block Kit payloads from that shape. +""" + +import re +from datetime import UTC, datetime + +import structlog +from markdown_it import MarkdownIt +from markdown_to_mrkdwn import SlackMarkdownConverter + +from posthog.temporal.llm_analytics.eval_reports.report_agent.schema import EvalReportContent, EvalReportMetrics + +logger = structlog.get_logger(__name__) + +# Matches a leading markdown heading line at the very start of a section's content. +# The renderer (email/Slack/UI) already emits its own section title, so if the agent +# also started the section with its own `## Executive summary` heading we strip it +# to avoid duplicated titles. See EvaluationReportViewer.tsx for the parallel fix. +_LEADING_HEADING_RE = re.compile(r"^\s*#{1,6}\s+(.+?)\s*(?:\r?\n|$)") + +# html=False escapes any raw HTML in the markdown source — defense in depth +# even though the markdown is produced by our own LLM agent via structured tools. +_md = MarkdownIt("commonmark", {"html": False}).enable("table") +_slack_converter = SlackMarkdownConverter() + +# Inline styles for email-safe HTML (many clients strip