fix: enhance ReActAgent's reasoning iterations and update planning prompt structure

Alex
2025-05-23 15:10:12 +01:00
parent 5475e6f7c5
commit de47df3bf9
2 changed files with 70 additions and 53 deletions

View File

@@ -20,6 +20,8 @@ with open(
     "r",
 ) as f:
     final_prompt_template = f.read()
+
+MAX_ITERATIONS_REASONING = 10
 
 class ReActAgent(BaseAgent):
     def __init__(self, *args, **kwargs):
@@ -71,7 +73,6 @@ class ReActAgent(BaseAgent):
             content_piece = chunk.delta.text
         elif isinstance(chunk, str):  # Simplest case: stream of strings
             content_piece = chunk
-
         # Add other stream chunk formats as needed
         if content_piece:
             collected_content.append(content_piece)
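The branch above maps several possible stream-chunk shapes onto a plain text piece. A minimal sketch of that normalization, kept as a standalone helper for clarity; the `delta.text` attribute mirrors the Anthropic-style chunks the diff already handles, while the dict branch is an added assumption for SSE-style payloads, not something the repository necessarily supports:

from typing import Any, Optional

def extract_chunk_text(chunk: Any) -> Optional[str]:
    # Best-effort normalization; real chunk shapes depend on the LLM client.
    if isinstance(chunk, str):  # simplest case: a stream of plain strings
        return chunk
    delta = getattr(chunk, "delta", None)
    if delta is not None:  # Anthropic-style event carrying a .delta.text payload
        return getattr(delta, "text", None)
    if isinstance(chunk, dict):  # assumed dict-shaped chunk, e.g. a parsed SSE event
        return chunk.get("text") or chunk.get("content")
    return None  # unknown format; the caller already skips falsy pieces

Returning None instead of raising keeps the streaming loop tolerant of new chunk types introduced by a provider upgrade.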
@@ -98,64 +99,76 @@ class ReActAgent(BaseAgent):
         self._prepare_tools(tools_dict)
         docs_together = "\n".join([doc["text"] for doc in retrieved_data])
 
-        # 1. Create Plan
-        logger.info("ReActAgent: Creating plan...")
-        plan_stream = self._create_plan(query, docs_together, log_context)
-        current_plan_parts = []
-        for line_chunk in plan_stream:
-            current_plan_parts.append(line_chunk)
-            yield {"thought": line_chunk}
-        self.plan = "".join(current_plan_parts)
-        if self.plan:
-            self.observations.append(f"Plan: {self.plan}")
-
-        # 2. Execute Plan (First Reasoning Step)
-        execution_prompt_str = (self.prompt or "") + f"\n\nFollow this plan:\n{self.plan}"
-        messages = self._build_messages(execution_prompt_str, query, retrieved_data)
-        resp_from_llm_gen = self._llm_gen(messages, log_context)
-        initial_llm_thought_content = self._extract_content_from_llm_response(resp_from_llm_gen)
-        if initial_llm_thought_content:
-            self.observations.append(f"Initial thought/response: {initial_llm_thought_content}")
-        else:
-            logger.info("ReActAgent: Initial LLM response (before handler) had no textual content (might be only tool calls).")
-        resp_after_handler = self._llm_handler(resp_from_llm_gen, tools_dict, messages, log_context)
-        for tool_call_info in self.tool_calls:  # Iterate over self.tool_calls populated by _llm_handler
-            observation_string = (
-                f"Executed Action: Tool '{tool_call_info.get('tool_name', 'N/A')}' "
-                f"with arguments '{tool_call_info.get('arguments', '{}')}'. Result: '{str(tool_call_info.get('result', ''))[:200]}...'"
-            )
-            self.observations.append(observation_string)
-        content_after_handler = self._extract_content_from_llm_response(resp_after_handler)
-        if content_after_handler:
-            self.observations.append(f"Response after tool execution: {content_after_handler}")
-            logger.info(f"ReActAgent: LLM response after tool execution: {content_after_handler[:500]}...")
-        else:
-            logger.info("ReActAgent: LLM response after handler had no textual content.")
-        if log_context:
-            log_context.stacks.append(
-                {"component": "agent_tool_calls", "data": {"tool_calls": self.tool_calls.copy()}}
-            )
-        display_tool_calls = []
-        for tc in self.tool_calls:
-            cleaned_tc = tc.copy()
-            if len(str(cleaned_tc.get("result", ""))) > 50:
-                cleaned_tc["result"] = str(cleaned_tc["result"])[:50] + "..."
-            display_tool_calls.append(cleaned_tc)
-        if display_tool_calls:
-            yield {"tool_calls": display_tool_calls}
-        yield {"sources": retrieved_data}
+        iterating_reasoning = 0
+        while iterating_reasoning < MAX_ITERATIONS_REASONING:
+            iterating_reasoning += 1
+            # 1. Create Plan
+            logger.info("ReActAgent: Creating plan...")
+            plan_stream = self._create_plan(query, docs_together, log_context)
+            current_plan_parts = []
+            yield {"thought": f"Reasoning... (iteration {iterating_reasoning})\n\n"}
+            for line_chunk in plan_stream:
+                current_plan_parts.append(line_chunk)
+                yield {"thought": line_chunk}
+            self.plan = "".join(current_plan_parts)
+            if self.plan:
+                self.observations.append(f"Plan: {self.plan} Iteration: {iterating_reasoning}")
+
+            # 2. Execute Plan
+            logger.info("Executing plan")
+            max_obs_len = 20000
+            obs_str = "\n".join(self.observations)
+            if len(obs_str) > max_obs_len:
+                obs_str = obs_str[:max_obs_len] + "\n...[observations truncated]"
+            execution_prompt_str = (
+                (self.prompt or "")
+                + f"\n\nFollow this plan:\n{self.plan}"
+                + f"\n\nObservations:\n{obs_str}"
+                + f"\n\nIf there is enough data to complete the user query '{query}', respond with 'SATISFIED' only. Otherwise, continue. Don't mention 'SATISFIED' in your response if you are not ready."
+            )
+            messages = self._build_messages(execution_prompt_str, query, retrieved_data)
+            resp_from_llm_gen = self._llm_gen(messages, log_context)
+            initial_llm_thought_content = self._extract_content_from_llm_response(resp_from_llm_gen)
+            if initial_llm_thought_content:
+                self.observations.append(f"Initial thought/response: {initial_llm_thought_content}")
+            else:
+                logger.info("ReActAgent: Initial LLM response (before handler) had no textual content (might be only tool calls).")
+            resp_after_handler = self._llm_handler(resp_from_llm_gen, tools_dict, messages, log_context)
+            for tool_call_info in self.tool_calls:  # Iterate over self.tool_calls populated by _llm_handler
+                observation_string = (
+                    f"Executed Action: Tool '{tool_call_info.get('tool_name', 'N/A')}' "
+                    f"with arguments '{tool_call_info.get('arguments', '{}')}'. Result: '{str(tool_call_info.get('result', ''))[:200]}...'"
+                )
+                self.observations.append(observation_string)
+            if log_context:
+                log_context.stacks.append(
+                    {"component": "agent_tool_calls", "data": {"tool_calls": self.tool_calls.copy()}}
+                )
+            content_after_handler = self._extract_content_from_llm_response(resp_after_handler)
+            if content_after_handler:
+                self.observations.append(f"Response after tool execution: {content_after_handler}")
+            else:
+                logger.info("ReActAgent: LLM response after handler had no textual content.")
+            yield {"sources": retrieved_data}
+            display_tool_calls = []
+            for tc in self.tool_calls:
+                cleaned_tc = tc.copy()
+                if len(str(cleaned_tc.get("result", ""))) > 50:
+                    cleaned_tc["result"] = str(cleaned_tc["result"])[:50] + "..."
+                display_tool_calls.append(cleaned_tc)
+            if display_tool_calls:
+                yield {"tool_calls": display_tool_calls}
+            if content_after_handler and "SATISFIED" in content_after_handler:
+                logger.info("ReActAgent: LLM satisfied with the plan and data. Stopping reasoning.")
+                break
 
         # 3. Create Final Answer based on all observations
         final_answer_stream = self._create_final_answer(query, self.observations, log_context)
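Stripped of streaming, logging, and tool plumbing, the control flow this hunk introduces is a bounded plan-act-observe loop that exits on a text sentinel. A self-contained sketch of the pattern, where `plan`, `act`, and `ask` are hypothetical stand-ins for `_create_plan`, `_llm_handler`, and `_llm_gen`, not the repository's actual API:

MAX_ITERATIONS_REASONING = 10
MAX_OBS_LEN = 20000  # cap the transcript fed back into the prompt

def react_loop(query, plan, act, ask):
    """Bounded plan-act-observe loop (illustrative stand-in)."""
    observations = []
    for iteration in range(1, MAX_ITERATIONS_REASONING + 1):
        observations.append(f"Plan: {plan(query, observations)} Iteration: {iteration}")
        observations.extend(act(query, observations))  # tool results become observations

        # Truncate so the transcript cannot outgrow the context window.
        obs_str = "\n".join(observations)
        if len(obs_str) > MAX_OBS_LEN:
            obs_str = obs_str[:MAX_OBS_LEN] + "\n...[observations truncated]"

        # Sentinel check: the model is told to answer 'SATISFIED' only when done.
        verdict = ask(
            f"Observations:\n{obs_str}\n\n"
            f"If there is enough data to answer '{query}', respond with 'SATISFIED' only."
        )
        if verdict and "SATISFIED" in verdict:
            break
    return observations

The sentinel is pragmatic but fragile: a substring match fires even when the model merely quotes the word, which is presumably why the execution prompt warns the model not to mention 'SATISFIED' before it is ready.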
@@ -170,6 +183,8 @@ class ReActAgent(BaseAgent):
         if "{summaries}" in plan_prompt_filled:
             summaries = docs_data if docs_data else "No documents retrieved."
             plan_prompt_filled = plan_prompt_filled.replace("{summaries}", summaries)
+        plan_prompt_filled = plan_prompt_filled.replace("{prompt}", self.prompt or "")
+        plan_prompt_filled = plan_prompt_filled.replace("{observations}", "\n".join(self.observations))
         messages = [{"role": "user", "content": plan_prompt_filled}]
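The new placeholders are filled with chained `str.replace` calls rather than `str.format`. That distinction matters for prompt templates: `str.format` parses every `{...}` pair in the template, so any literal braces (a JSON example, a code snippet) raise `KeyError` before substitution, and it cannot fill placeholders one at a time the way the conditional `{summaries}` branch above does. A small sketch of the failure mode, using a hypothetical template:

template = 'Summaries: {summaries}\nReply as JSON, e.g. {"answer": "..."}'

try:
    template.format(summaries="doc text")
except KeyError as exc:
    print("str.format failed on the literal braces:", exc)

# Sequential .replace touches only the exact placeholder token, so the
# template may contain literal braces and may be filled incrementally:
filled = template.replace("{summaries}", "doc text")
print(filled)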

View File

@@ -5,7 +5,9 @@ Include the following elements in your thought and execution process:
 2. Determine any relevant context or background information needed to understand the query.
 3. List potential approaches or methods to address the query.
 4. Highlight any critical factors or constraints that may influence the outcome.
-5. Use available tools to help you with the analysis and execute them. Execute tools needed now instead of later.
+5. Plan with available tools to help you with the analysis, but don't execute them. Tools will be executed by another AI.
 Query: {query}
-Summaries: {summaries}
+Summaries: {summaries}
+Prompt: {prompt}
+Observations (potentially previous tool calls): {observations}
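Taken together with the first file, the revised template turns planning into a read-only step: the planner sees the query, the retrieved summaries, the system prompt, and any observations from earlier iterations, while tool execution is deferred to the execution pass. A minimal rendering sketch, assuming a hypothetical template string shaped like the file above:

PLAN_TEMPLATE = (
    "Query: {query}\n"
    "Summaries: {summaries}\n"
    "Prompt: {prompt}\n"
    "Observations (potentially previous tool calls): {observations}\n"
)

def render_plan_prompt(query, summaries, prompt, observations):
    # .replace keeps any literal braces in the substituted text safe.
    filled = PLAN_TEMPLATE.replace("{query}", query)
    filled = filled.replace("{summaries}", summaries or "No documents retrieved.")
    filled = filled.replace("{prompt}", prompt or "")
    return filled.replace("{observations}", "\n".join(observations))

# Iteration 1 renders with empty observations; later iterations carry tool
# results, so the planner can refine its plan instead of starting from scratch.
print(render_plan_prompt("compare Q1 vs Q2 revenue", "retrieved snippets", "", []))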