Merge pull request #1630 from siiddhantt/feat/show-tool-execution

feat: tool calls tracking
2026-03-06 13:53:26 +00:00 · 2025-02-14 10:27:15 +00:00
parent 095cb58df3 7b05afab74
commit 05319e36a7
18 changed files with 502 additions and 99 deletions
--- a/application/utils.py
+++ b/application/utils.py
@@ -1,8 +1,9 @@
-import tiktoken
 import hashlib
-from flask import jsonify, make_response
 import re

+import tiktoken
+from flask import jsonify, make_response
+

 _encoding = None

@@ -22,6 +23,7 @@ def num_tokens_from_string(string: str) -> int:
    else:
        return 0

+
 def num_tokens_from_object_or_list(thing):
    if isinstance(thing, list):
        return sum([num_tokens_from_object_or_list(x) for x in thing])
@@ -32,6 +34,7 @@ def num_tokens_from_object_or_list(thing):
    else:
        return 0

+
 def count_tokens_docs(docs):
    docs_content = ""
    for doc in docs:
@@ -59,6 +62,7 @@ def check_required_fields(data, required_fields):
 def get_hash(data):
    return hashlib.md5(data.encode(), usedforsecurity=False).hexdigest()

+
 def limit_chat_history(history, max_token_limit=None, gpt_model="docsgpt"):
    """
    Limits chat history based on token count.
@@ -67,38 +71,41 @@ def limit_chat_history(history, max_token_limit=None, gpt_model="docsgpt"):
    from application.core.settings import settings

    max_token_limit = (
-            max_token_limit
-            if max_token_limit and 
-            max_token_limit < settings.MODEL_TOKEN_LIMITS.get(
-                gpt_model, settings.DEFAULT_MAX_HISTORY
-            )
-            else settings.MODEL_TOKEN_LIMITS.get(
-                gpt_model, settings.DEFAULT_MAX_HISTORY
-            )
-        )
-    
+        max_token_limit
+        if max_token_limit
+        and max_token_limit
+        < settings.MODEL_TOKEN_LIMITS.get(gpt_model, settings.DEFAULT_MAX_HISTORY)
+        else settings.MODEL_TOKEN_LIMITS.get(gpt_model, settings.DEFAULT_MAX_HISTORY)
+    )

    if not history:
        return []
-        
-    tokens_current_history = 0
+
    trimmed_history = []
-    
+    tokens_current_history = 0
+
    for message in reversed(history):
+        tokens_batch = 0
        if "prompt" in message and "response" in message:
-            tokens_batch = num_tokens_from_string(message["prompt"]) + num_tokens_from_string(
-                message["response"]
-            )
-            if tokens_current_history + tokens_batch < max_token_limit:
-                tokens_current_history += tokens_batch
-                trimmed_history.insert(0, message)
-            else:
-                break
+            tokens_batch += num_tokens_from_string(message["prompt"])
+            tokens_batch += num_tokens_from_string(message["response"])
+
+        if "tool_calls" in message:
+            for tool_call in message["tool_calls"]:
+                tool_call_string = f"Tool: {tool_call.get('tool_name')} | Action: {tool_call.get('action_name')} | Args: {tool_call.get('arguments')} | Response: {tool_call.get('result')}"
+                tokens_batch += num_tokens_from_string(tool_call_string)
+
+        if tokens_current_history + tokens_batch < max_token_limit:
+            tokens_current_history += tokens_batch
+            trimmed_history.insert(0, message)
+        else:
+            break

    return trimmed_history

+
 def validate_function_name(function_name):
    """Validates if a function name matches the allowed pattern."""
    if not re.match(r"^[a-zA-Z0-9_-]+$", function_name):
        return False
-    return True
+    return True