feat: agent templates and seeding premade agents (#1910)

* feat: agent templates and seeding premade agents

* fix: ensure ObjectId is used for source reference in agent configuration

* fix: improve source handling in DatabaseSeeder and update tool config processing

* feat: add prompt handling in DatabaseSeeder for agent configuration

* docs: add premade agents documentation

* docs: link to prescraped docs

* feat: add template agent retrieval and adopt agent functionality

* feat: simplify agent descriptions in premade_agents.yaml; add docs

---------

Co-authored-by: Pavel <pabin@yandex.ru>
Co-authored-by: Alex <a@tushynski.me>
Author: Siddhant Rai
Date: 2025-10-07 15:30:14 +05:30 (committed by GitHub)
parent 8b8e616557
commit da6317a242
21 changed files with 1053 additions and 574 deletions


@@ -20,9 +20,10 @@ with open(
     "r",
 ) as f:
     final_prompt_template = f.read()
+MAX_ITERATIONS_REASONING = 10
 
 
 class ReActAgent(BaseAgent):
     def __init__(self, *args, **kwargs):
         super().__init__(*args, **kwargs)
@@ -38,49 +39,69 @@ class ReActAgent(BaseAgent):
         collected_content = []
         if isinstance(resp, str):
             collected_content.append(resp)
-        elif ( # OpenAI non-streaming or Anthropic non-streaming (older SDK style)
+        elif (  # OpenAI non-streaming or Anthropic non-streaming (older SDK style)
             hasattr(resp, "message")
             and hasattr(resp.message, "content")
             and resp.message.content is not None
         ):
             collected_content.append(resp.message.content)
-        elif ( # OpenAI non-streaming (Pydantic model), Anthropic new SDK non-streaming
-            hasattr(resp, "choices") and resp.choices and
-            hasattr(resp.choices[0], "message") and
-            hasattr(resp.choices[0].message, "content") and
-            resp.choices[0].message.content is not None
+        elif (  # OpenAI non-streaming (Pydantic model), Anthropic new SDK non-streaming
+            hasattr(resp, "choices")
+            and resp.choices
+            and hasattr(resp.choices[0], "message")
+            and hasattr(resp.choices[0].message, "content")
+            and resp.choices[0].message.content is not None
         ):
-            collected_content.append(resp.choices[0].message.content) # OpenAI
-        elif ( # Anthropic new SDK non-streaming content block
-            hasattr(resp, "content") and isinstance(resp.content, list) and resp.content and
-            hasattr(resp.content[0], "text")
+            collected_content.append(resp.choices[0].message.content)  # OpenAI
+        elif (  # Anthropic new SDK non-streaming content block
+            hasattr(resp, "content")
+            and isinstance(resp.content, list)
+            and resp.content
+            and hasattr(resp.content[0], "text")
         ):
-            collected_content.append(resp.content[0].text) # Anthropic
+            collected_content.append(resp.content[0].text)  # Anthropic
         else:
             # Assume resp is a stream if not a recognized object
             chunk = None
             try:
-                for chunk in resp: # This will fail if resp is not iterable (e.g. a non-streaming response object)
+                for (
+                    chunk
+                ) in (
+                    resp
+                ):  # This will fail if resp is not iterable (e.g. a non-streaming response object)
                     content_piece = ""
                     # OpenAI-like stream
-                    if hasattr(chunk, 'choices') and len(chunk.choices) > 0 and \
-                       hasattr(chunk.choices[0], 'delta') and \
-                       hasattr(chunk.choices[0].delta, 'content') and \
-                       chunk.choices[0].delta.content is not None:
+                    if (
+                        hasattr(chunk, "choices")
+                        and len(chunk.choices) > 0
+                        and hasattr(chunk.choices[0], "delta")
+                        and hasattr(chunk.choices[0].delta, "content")
+                        and chunk.choices[0].delta.content is not None
+                    ):
                         content_piece = chunk.choices[0].delta.content
                     # Anthropic-like stream (ContentBlockDelta)
-                    elif hasattr(chunk, 'type') and chunk.type == 'content_block_delta' and \
-                         hasattr(chunk, 'delta') and hasattr(chunk.delta, 'text'):
+                    elif (
+                        hasattr(chunk, "type")
+                        and chunk.type == "content_block_delta"
+                        and hasattr(chunk, "delta")
+                        and hasattr(chunk.delta, "text")
+                    ):
                         content_piece = chunk.delta.text
-                    elif isinstance(chunk, str): # Simplest case: stream of strings
+                    elif isinstance(chunk, str):  # Simplest case: stream of strings
                         content_piece = chunk
                     if content_piece:
                         collected_content.append(content_piece)
-            except TypeError: # If resp is not iterable (e.g. a final response object that wasn't caught above)
-                logger.debug(f"Response type {type(resp)} could not be iterated as a stream. It might be a non-streaming object not handled by specific checks.")
+            except (
+                TypeError
+            ):  # If resp is not iterable (e.g. a final response object that wasn't caught above)
+                logger.debug(
+                    f"Response type {type(resp)} could not be iterated as a stream. It might be a non-streaming object not handled by specific checks."
+                )
             except Exception as e:
-                logger.error(f"Error processing potential stream chunk: {e}, chunk was: {getattr(chunk, '__dict__', chunk)}")
+                logger.error(
+                    f"Error processing potential stream chunk: {e}, chunk was: {getattr(chunk, '__dict__', chunk) if chunk is not None else 'N/A'}"
+                )
         return "".join(collected_content)
@@ -112,8 +133,9 @@ class ReActAgent(BaseAgent):
                 yield {"thought": line_chunk}
             self.plan = "".join(current_plan_parts)
             if self.plan:
-                self.observations.append(f"Plan: {self.plan} Iteration: {iterating_reasoning}")
+                self.observations.append(
+                    f"Plan: {self.plan} Iteration: {iterating_reasoning}"
+                )
             max_obs_len = 20000
             obs_str = "\n".join(self.observations)
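The surrounding code streams plan chunks to the client as "thought" events while also concatenating them into the full plan and recording it as an observation tagged with the iteration number. A rough free-function sketch of that pattern (`stream_plan` is a hypothetical name; the real method works on `self.plan` and `self.observations`):

```python
from typing import Iterator


def stream_plan(plan_chunks: Iterator[str], observations: list[str], iteration: int):
    """Yield plan chunks as 'thought' events while accumulating the full plan."""
    parts = []
    for chunk in plan_chunks:
        parts.append(chunk)
        yield {"thought": chunk}  # surface reasoning to the client as it streams
    plan = "".join(parts)
    if plan:
        # Record what was planned and when, for later prompts to see.
        observations.append(f"Plan: {plan} Iteration: {iteration}")


obs: list[str] = []
events = list(stream_plan(iter(["Step 1. ", "Search docs."]), obs, iteration=1))
assert events[0] == {"thought": "Step 1. "}
assert obs == ["Plan: Step 1. Search docs. Iteration: 1"]
```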
@@ -125,34 +147,55 @@ class ReActAgent(BaseAgent):
                 + f"\n\nObservations:\n{obs_str}"
                 + f"\n\nIf there is enough data to complete the user query '{query}', respond with 'SATISFIED' only. Otherwise, continue. Don't mention 'SATISFIED' in your response if you are not ready."
             )
             messages = self._build_messages(execution_prompt_str, query, retrieved_data)
             resp_from_llm_gen = self._llm_gen(messages, log_context)
-            initial_llm_thought_content = self._extract_content_from_llm_response(resp_from_llm_gen)
+            initial_llm_thought_content = self._extract_content_from_llm_response(
+                resp_from_llm_gen
+            )
             if initial_llm_thought_content:
-                self.observations.append(f"Initial thought/response: {initial_llm_thought_content}")
+                self.observations.append(
+                    f"Initial thought/response: {initial_llm_thought_content}"
+                )
             else:
-                logger.info("ReActAgent: Initial LLM response (before handler) had no textual content (might be only tool calls).")
-            resp_after_handler = self._llm_handler(resp_from_llm_gen, tools_dict, messages, log_context)
-            for tool_call_info in self.tool_calls: # Iterate over self.tool_calls populated by _llm_handler
+                logger.info(
+                    "ReActAgent: Initial LLM response (before handler) had no textual content (might be only tool calls)."
+                )
+            resp_after_handler = self._llm_handler(
+                resp_from_llm_gen, tools_dict, messages, log_context
+            )
+            for (
+                tool_call_info
+            ) in (
+                self.tool_calls
+            ):  # Iterate over self.tool_calls populated by _llm_handler
                 observation_string = (
                     f"Executed Action: Tool '{tool_call_info.get('tool_name', 'N/A')}' "
                     f"with arguments '{tool_call_info.get('arguments', '{}')}'. Result: '{str(tool_call_info.get('result', ''))[:200]}...'"
                 )
                 self.observations.append(observation_string)
-            content_after_handler = self._extract_content_from_llm_response(resp_after_handler)
+            content_after_handler = self._extract_content_from_llm_response(
+                resp_after_handler
+            )
             if content_after_handler:
-                self.observations.append(f"Response after tool execution: {content_after_handler}")
+                self.observations.append(
+                    f"Response after tool execution: {content_after_handler}"
+                )
             else:
-                logger.info("ReActAgent: LLM response after handler had no textual content.")
+                logger.info(
+                    "ReActAgent: LLM response after handler had no textual content."
+                )
             if log_context:
                 log_context.stacks.append(
-                    {"component": "agent_tool_calls", "data": {"tool_calls": self.tool_calls.copy()}}
+                    {
+                        "component": "agent_tool_calls",
+                        "data": {"tool_calls": self.tool_calls.copy()},
+                    }
                 )
             yield {"sources": retrieved_data}
@@ -165,13 +208,17 @@ class ReActAgent(BaseAgent):
                 display_tool_calls.append(cleaned_tc)
             if display_tool_calls:
                 yield {"tool_calls": display_tool_calls}
             if "SATISFIED" in content_after_handler:
-                logger.info("ReActAgent: LLM satisfied with the plan and data. Stopping reasoning.")
+                logger.info(
+                    "ReActAgent: LLM satisfied with the plan and data. Stopping reasoning."
+                )
                 break
         # 3. Create Final Answer based on all observations
-        final_answer_stream = self._create_final_answer(query, self.observations, log_context)
+        final_answer_stream = self._create_final_answer(
+            query, self.observations, log_context
+        )
         for answer_chunk in final_answer_stream:
             yield {"answer": answer_chunk}
         logger.info("ReActAgent: Finished generating final answer.")
@@ -184,12 +231,16 @@ class ReActAgent(BaseAgent):
         summaries = docs_data if docs_data else "No documents retrieved."
         plan_prompt_filled = plan_prompt_filled.replace("{summaries}", summaries)
         plan_prompt_filled = plan_prompt_filled.replace("{prompt}", self.prompt or "")
-        plan_prompt_filled = plan_prompt_filled.replace("{observations}", "\n".join(self.observations))
+        plan_prompt_filled = plan_prompt_filled.replace(
+            "{observations}", "\n".join(self.observations)
+        )
         messages = [{"role": "user", "content": plan_prompt_filled}]
         plan_stream_from_llm = self.llm.gen_stream(
-            model=self.gpt_model, messages=messages, tools=getattr(self, 'tools', None) # Use self.tools
+            model=self.gpt_model,
+            messages=messages,
+            tools=getattr(self, "tools", None),  # Use self.tools
         )
         if log_context:
             data = build_stack_data(self.llm)
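The plan prompt is filled with sequential str.replace calls on named placeholders rather than str.format. One plausible reason for that choice: replace tolerates literal braces elsewhere in the template (e.g. JSON examples), which str.format would reject. A hypothetical helper sketching the pattern:

```python
def fill_placeholders(template: str, **values: str) -> str:
    """Replace {name} markers one by one, leaving any other braces untouched.

    str.format would raise KeyError on stray braces in the template, so
    sequential replace is the more forgiving option for prompt templates.
    """
    for name, value in values.items():
        template = template.replace("{" + name + "}", value)
    return template


prompt = fill_placeholders(
    "Query: {query}\nObservations:\n{observations}\nOutput JSON like {\"a\": 1}",
    query="hello",
    observations="none yet",
)
assert '{"a": 1}' in prompt  # literal braces survive untouched
```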
@@ -206,8 +257,12 @@ class ReActAgent(BaseAgent):
         observation_string = "\n".join(observations)
         max_obs_len = 10000
         if len(observation_string) > max_obs_len:
-            observation_string = observation_string[:max_obs_len] + "\n...[observations truncated]"
-            logger.warning("ReActAgent: Truncated observations for final answer prompt due to length.")
+            observation_string = (
+                observation_string[:max_obs_len] + "\n...[observations truncated]"
+            )
+            logger.warning(
+                "ReActAgent: Truncated observations for final answer prompt due to length."
+            )
         final_answer_prompt_filled = final_prompt_template.format(
             query=query, observations=observation_string
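Before the final-answer prompt is built, the joined observations are hard-capped, a visible truncation marker is appended, and a warning is logged. The same logic as a standalone function (hypothetical name, same 10000-character default as above):

```python
import logging

logger = logging.getLogger(__name__)


def truncate_observations(observations: list[str], max_len: int = 10000) -> str:
    """Join observations and hard-cap the result with a visible marker."""
    joined = "\n".join(observations)
    if len(joined) > max_len:
        joined = joined[:max_len] + "\n...[observations truncated]"
        logger.warning("Truncated observations for final answer prompt.")
    return joined


assert truncate_observations(["x" * 20], max_len=10).startswith("xxxxxxxxxx\n...")
```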
@@ -226,4 +281,4 @@ class ReActAgent(BaseAgent):
         for chunk in final_answer_stream_from_llm:
             content_piece = self._extract_content_from_llm_response(chunk)
             if content_piece:
-                yield content_piece
\ No newline at end of file
+                yield content_piece
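Taken together, the agent's generator yields typed events: {"thought": ...} during planning, {"sources": ...} and {"tool_calls": ...} after tool execution, and {"answer": ...} chunks at the end. A sketch of a consumer that dispatches on those keys (it assumes only the event shapes visible in this diff):

```python
def consume_agent_events(events):
    """Assemble the final answer from the agent's typed event stream."""
    answer_parts, sources, tool_calls = [], [], []
    for event in events:
        if "answer" in event:
            answer_parts.append(event["answer"])
        elif "sources" in event:
            sources = event["sources"]
        elif "tool_calls" in event:
            tool_calls = event["tool_calls"]
        # "thought" events could be surfaced to a UI; ignored here.
    return "".join(answer_parts), sources, tool_calls


answer, sources, calls = consume_agent_events(
    [{"thought": "plan..."}, {"sources": []}, {"answer": "Hi"}, {"answer": "!"}]
)
assert answer == "Hi!"
```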