antinomyhq · amitksingh1490 · Apr 4, 2026 · Apr 4, 2026 · Apr 7, 2026 · Apr 7, 2026
diff --git a/crates/forge_app/src/app.rs b/crates/forge_app/src/app.rs
@@ -9,7 +9,10 @@ use forge_stream::MpscStream;
 use crate::apply_tunable_parameters::ApplyTunableParameters;
 use crate::changed_files::ChangedFiles;
 use crate::dto::ToolsOverview;
-use crate::hooks::{CompactionHandler, DoomLoopDetector, TitleGenerationHandler, TracingHandler};
+use crate::hooks::{
+    CompactionHandler, DoomLoopDetector, PendingTodosHandler, TitleGenerationHandler,
+    TracingHandler,
+};
 use crate::init_conversation_metrics::InitConversationMetrics;
 use crate::orch::Orchestrator;
 use crate::services::{AgentRegistry, CustomInstructionsService, ProviderAuthService};
@@ -142,17 +145,29 @@ impl<S: Services + EnvironmentInfra<Config = forge_config::ForgeConfig>> ForgeAp
         // Create the orchestrator with all necessary dependencies
         let tracing_handler = TracingHandler::new();
         let title_handler = TitleGenerationHandler::new(services.clone());
+
+        // Build the on_end hook, conditionally adding PendingTodosHandler based on
+        // config
+        let on_end_hook = if forge_config.verify_todos {
+            tracing_handler
+                .clone()
+                .and(title_handler.clone())
+                .and(PendingTodosHandler::new())
+        } else {
+            tracing_handler.clone().and(title_handler.clone())
+        };
+
         let hook = Hook::default()
-            .on_start(tracing_handler.clone().and(title_handler.clone()))
+            .on_start(tracing_handler.clone().and(title_handler))
             .on_request(tracing_handler.clone().and(DoomLoopDetector::default()))
             .on_response(
                 tracing_handler
                     .clone()
                     .and(CompactionHandler::new(agent.clone(), environment.clone())),
             )
             .on_toolcall_start(tracing_handler.clone())
-            .on_toolcall_end(tracing_handler.clone())
-            .on_end(tracing_handler.and(title_handler));
+            .on_toolcall_end(tracing_handler)
+            .on_end(on_end_hook);
 
         let orch = Orchestrator::new(
             services.clone(),

diff --git a/crates/forge_app/src/hooks/mod.rs b/crates/forge_app/src/hooks/mod.rs
@@ -1,9 +1,11 @@
 mod compaction;
 mod doom_loop;
+mod pending_todos;
 mod title_generation;
 mod tracing;
 
 pub use compaction::CompactionHandler;
 pub use doom_loop::DoomLoopDetector;
+pub use pending_todos::PendingTodosHandler;
 pub use title_generation::TitleGenerationHandler;
 pub use tracing::TracingHandler;
diff --git a/crates/forge_app/src/hooks/pending_todos.rs b/crates/forge_app/src/hooks/pending_todos.rs
@@ -0,0 +1,272 @@
+use std::collections::HashSet;
+
+use async_trait::async_trait;
+use forge_domain::{
+    ContextMessage, Conversation, EndPayload, EventData, EventHandle, Template, TodoStatus,
+};
+use forge_template::Element;
+use serde::Serialize;
+
+use crate::TemplateEngine;
+
+/// A single todo item prepared for template rendering.
+#[derive(Serialize)]
+struct TodoReminderItem {
+    status: &'static str,
+    content: String,
+}
+
+/// Template context for the pending-todos reminder.
+#[derive(Serialize)]
+struct PendingTodosContext {
+    todos: Vec<TodoReminderItem>,
+}
+
+/// Detects when the LLM signals task completion while there are still
+/// pending or in-progress todo items.
+///
+/// When triggered, it injects a formatted reminder listing all
+/// outstanding todos into the conversation context, preventing the
+/// orchestrator from yielding prematurely.
+#[derive(Debug, Clone, Default)]
+pub struct PendingTodosHandler;
+
+impl PendingTodosHandler {
+    /// Creates a new pending-todos handler
+    pub fn new() -> Self {
+        Self
+    }
+}
+
+#[async_trait]
+impl EventHandle<EventData<EndPayload>> for PendingTodosHandler {
+    async fn handle(
+        &self,
+        _event: &EventData<EndPayload>,
+        conversation: &mut Conversation,
+    ) -> anyhow::Result<()> {
+        let pending_todos = conversation.metrics.get_active_todos();
+        if pending_todos.is_empty() {
+            return Ok(());
+        }
+
+        // Build a set of current pending todo contents for comparison
+        let current_todo_set: HashSet<String> = pending_todos
+            .iter()
+            .map(|todo| todo.content.clone())
+            .collect();
+
+        // Check if we already have a reminder with the exact same set of todos
+        // This prevents duplicate reminders while still allowing new reminders
+        // when todos change (e.g., some completed but others still pending)
+        let should_add_reminder = if let Some(context) = &conversation.context {
+            // Find the most recent reminder message by looking for the template content
+            // pattern
+            let last_reminder_todos: Option<HashSet<String>> = context
+                .messages
+                .iter()
+                .rev()
+                .filter_map(|entry| {
+                    let content = entry.message.content()?;
+                    // Check if this is a pending todos reminder
+                    if content.contains("You have pending todo items") {
+                        // Extract todo items from the reminder message
+                        // Format: "- [STATUS] Content"
+                        let todos: HashSet<String> = content
+                            .lines()
+                            .filter(|line| line.starts_with("- ["))
+                            .map(|line| {
+                                // Extract content after "- [STATUS] "
+                                line.split_once("] ")
+                                    .map(|x| x.1)
+                                    .map(|s| s.to_string())
+                                    .unwrap_or_default()
+                            })
+                            .collect();
+                        Some(todos)
+                    } else {
+                        None
+                    }
+                })
+                .next();
+
+            match last_reminder_todos {
+                Some(last_todos) => last_todos != current_todo_set,
+                None => true, // No previous reminder found, should add
+            }
+        } else {
+            true // No context, should add reminder
+        };
+
+        if !should_add_reminder {
+            return Ok(());
+        }
+
+        let todo_items: Vec<TodoReminderItem> = pending_todos
+            .iter()
+            .filter_map(|todo| {
+                let status = match todo.status {
+                    TodoStatus::Pending => "PENDING",
+                    TodoStatus::InProgress => "IN_PROGRESS",
+                    _ => return None,
+                };
+                Some(TodoReminderItem { status, content: todo.content.clone() })
+            })
+            .collect();
+
+        let ctx = PendingTodosContext { todos: todo_items };
+        let reminder = TemplateEngine::default().render(
+            Template::<PendingTodosContext>::new("forge-pending-todos-reminder.md"),
+            &ctx,
+        )?;
+
+        if let Some(context) = conversation.context.as_mut() {
+            let content = Element::new("system_reminder").text(reminder);
+            context
+                .messages
+                .push(ContextMessage::user(content, None).into());
+        }
+
+        Ok(())
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use forge_domain::{
+        Agent, Context, Conversation, EndPayload, EventData, EventHandle, Metrics, ModelId, Todo,
+        TodoStatus,
+    };
+    use pretty_assertions::assert_eq;
+
+    use super::*;
+
+    fn fixture_agent() -> Agent {
+        Agent::new(
+            "test-agent",
+            "test-provider".to_string().into(),
+            ModelId::new("test-model"),
+        )
+    }
+
+    fn fixture_conversation(todos: Vec<Todo>) -> Conversation {
+        let mut conversation = Conversation::generate();
+        conversation.context = Some(Context::default());
+        conversation.metrics = Metrics::default().todos(todos);
+        conversation
+    }
+
+    fn fixture_event() -> EventData<EndPayload> {
+        EventData::new(fixture_agent(), ModelId::new("test-model"), EndPayload)
+    }
+
+    #[tokio::test]
+    async fn test_no_pending_todos_does_nothing() {
+        let handler = PendingTodosHandler::new();
+        let event = fixture_event();
+        let mut conversation = fixture_conversation(vec![]);
+
+        let initial_msg_count = conversation.context.as_ref().unwrap().messages.len();
+        handler.handle(&event, &mut conversation).await.unwrap();
+
+        let actual = conversation.context.as_ref().unwrap().messages.len();
+        let expected = initial_msg_count;
+        assert_eq!(actual, expected);
+    }
+
+    #[tokio::test]
+    async fn test_pending_todos_injects_reminder() {
+        let handler = PendingTodosHandler::new();
+        let event = fixture_event();
+        let mut conversation = fixture_conversation(vec![
+            Todo::new("Fix the build").status(TodoStatus::Pending),
+            Todo::new("Write tests").status(TodoStatus::InProgress),
+        ]);
+
+        handler.handle(&event, &mut conversation).await.unwrap();
+
+        let actual = conversation.context.as_ref().unwrap().messages.len();
+        let expected = 1;
+        assert_eq!(actual, expected);
+    }
+
+    #[tokio::test]
+    async fn test_reminder_contains_formatted_list() {
+        let handler = PendingTodosHandler::new();
+        let event = fixture_event();
+        let mut conversation = fixture_conversation(vec![
+            Todo::new("Fix the build").status(TodoStatus::Pending),
+            Todo::new("Write tests").status(TodoStatus::InProgress),
+        ]);
+
+        handler.handle(&event, &mut conversation).await.unwrap();
+
+        let entry = &conversation.context.as_ref().unwrap().messages[0];
+        let actual = entry.message.content().unwrap();
+        assert!(actual.contains("- [PENDING] Fix the build"));
+        assert!(actual.contains("- [IN_PROGRESS] Write tests"));
+    }
+
+    #[tokio::test]
+    async fn test_completed_todos_not_included() {
+        let handler = PendingTodosHandler::new();
+        let event = fixture_event();
+        let mut conversation = fixture_conversation(vec![
+            Todo::new("Completed task").status(TodoStatus::Completed),
+            Todo::new("Cancelled task").status(TodoStatus::Cancelled),
+        ]);
+
+        let initial_msg_count = conversation.context.as_ref().unwrap().messages.len();
+        handler.handle(&event, &mut conversation).await.unwrap();
+
+        let actual = conversation.context.as_ref().unwrap().messages.len();
+        let expected = initial_msg_count;
+        assert_eq!(actual, expected);
+    }
+
+    #[tokio::test]
+    async fn test_reminder_not_duplicated_for_same_todos() {
+        let handler = PendingTodosHandler::new();
+        let event = fixture_event();
+        let mut conversation =
+            fixture_conversation(vec![Todo::new("Fix the build").status(TodoStatus::Pending)]);
+
+        // First call should inject a reminder
+        handler.handle(&event, &mut conversation).await.unwrap();
+        let after_first = conversation.context.as_ref().unwrap().messages.len();
+        assert_eq!(after_first, 1);
+
+        // Second call with the same pending todos should NOT add another reminder
+        handler.handle(&event, &mut conversation).await.unwrap();
+        let after_second = conversation.context.as_ref().unwrap().messages.len();
+        assert_eq!(after_second, 1); // Still 1, no duplicate
+    }
+
+    #[tokio::test]
+    async fn test_reminder_added_when_todos_change() {
+        let handler = PendingTodosHandler::new();
+        let event = fixture_event();
+        let mut conversation = fixture_conversation(vec![
+            Todo::new("Fix the build").status(TodoStatus::Pending),
+            Todo::new("Write tests").status(TodoStatus::InProgress),
+        ]);
+
+        // First call should inject a reminder
+        handler.handle(&event, &mut conversation).await.unwrap();
+        let after_first = conversation.context.as_ref().unwrap().messages.len();
+        assert_eq!(after_first, 1);
+
+        // Simulate LLM completing one todo but leaving another pending
+        // Update the conversation metrics with different todos
+        conversation.metrics = conversation.metrics.clone().todos(vec![
+            Todo::new("Fix the build").status(TodoStatus::Completed),
+            Todo::new("Write tests").status(TodoStatus::InProgress),
+            Todo::new("Add documentation").status(TodoStatus::Pending),
+        ]);
+
+        // Second call with different pending todos should add a new reminder
+        handler.handle(&event, &mut conversation).await.unwrap();
+        let after_second = conversation.context.as_ref().unwrap().messages.len();
+        assert_eq!(after_second, 2); // New reminder added because todos changed
+    }
+}
diff --git a/crates/forge_app/src/orch.rs b/crates/forge_app/src/orch.rs
@@ -258,7 +258,6 @@ impl<S: AgentService + EnvironmentInfra<Config = forge_config::ForgeConfig>> Orc
             self.conversation.context = Some(context.clone());
             self.services.update(self.conversation.clone()).await?;
 
-            // Fire the Request lifecycle event
             let request_event = LifecycleEvent::Request(EventData::new(
                 self.agent.clone(),
                 model_id.clone(),
@@ -325,7 +324,7 @@ impl<S: AgentService + EnvironmentInfra<Config = forge_config::ForgeConfig>> Orc
                 .execute_tool_calls(&message.tool_calls, &tool_context)
                 .await?;
 
-            // Update context from conversation after tool-call hooks run
+            // Update context from conversation after response / tool-call hooks run
             if let Some(updated_context) = &self.conversation.context {
                 context = updated_context.clone();
             }
@@ -403,19 +402,32 @@ impl<S: AgentService + EnvironmentInfra<Config = forge_config::ForgeConfig>> Orc
             tool_context.with_metrics(|metrics| {
                 self.conversation.metrics = metrics.clone();
             })?;
-        }
 
-        // Fire the End lifecycle event (title will be set here by the hook)
-        self.hook
-            .handle(
-                &LifecycleEvent::End(EventData::new(
-                    self.agent.clone(),
-                    model_id.clone(),
-                    EndPayload,
-                )),
-                &mut self.conversation,
-            )
-            .await?;
+            // If completing (should_yield is due), fire End hook and check if
+            // it adds messages
+            if should_yield {
+                let end_count_before = self.conversation.len();
+                self.hook
+                    .handle(
+                        &LifecycleEvent::End(EventData::new(
+                            self.agent.clone(),
+                            model_id.clone(),
+                            EndPayload,
+                        )),
+                        &mut self.conversation,
+                    )
+                    .await?;
+                self.services.update(self.conversation.clone()).await?;
+                // Check if End hook added messages - if so, continue the loop
+                if self.conversation.len() > end_count_before {
+                    // End hook added messages, sync context and continue
+                    if let Some(updated_context) = &self.conversation.context {
+                        context = updated_context.clone();
+                    }
+                    should_yield = false;
+                }
+            }
+        }
 
         self.services.update(self.conversation.clone()).await?;