fix: google parser, llm handler and other errors

This commit is contained in:
Siddhant Rai
2025-01-17 09:22:41 +05:30
parent 811dfecf98
commit c97d1e3363
4 changed files with 141 additions and 102 deletions

View File

@@ -1,60 +1,77 @@
from application.llm.base import BaseLLM
import google.generativeai as genai
from application.core.settings import settings
import logging
from application.llm.base import BaseLLM
class GoogleLLM(BaseLLM):
def __init__(self, api_key=None, user_api_key=None, *args, **kwargs):
    """Store credentials and configure the ``google.generativeai`` module.

    Args:
        api_key: Key used to configure ``google.generativeai``. When it is
            ``None`` the value of ``settings.API_KEY`` is used instead.
        user_api_key: Stored on the instance unchanged.
        *args: Forwarded to ``BaseLLM.__init__``.
        **kwargs: Forwarded to ``BaseLLM.__init__``.
    """
    super().__init__(*args, **kwargs)
    # Honour an explicitly supplied key. Previously the argument was accepted
    # but silently discarded in favour of the global setting.
    self.api_key = api_key if api_key is not None else settings.API_KEY
    self.user_api_key = user_api_key
    # NOTE(review): genai.configure is a module-level call, so the key set
    # here presumably applies to every later genai call - confirm this is
    # acceptable if instances are ever built with different keys.
    genai.configure(api_key=self.api_key)
def _clean_messages_google(self, messages):
return [
{
"role": "model" if message["role"] == "system" else message["role"],
"parts": [message["content"]],
}
for message in messages[1:]
]
cleaned_messages = []
for message in messages[1:]:
cleaned_messages.append(
{
"role": "model" if message["role"] == "system" else message["role"],
"parts": [message["content"]],
}
)
return cleaned_messages
def _clean_tools_format(self, tools_data):
"""
Cleans the tools data format, converting string type representations
to the expected dictionary structure for google-generativeai.
"""
if isinstance(tools_data, list):
return [self._clean_tools_format(item) for item in tools_data]
elif isinstance(tools_data, dict):
if 'function' in tools_data and 'type' in tools_data and tools_data['type'] == 'function':
if (
"function" in tools_data
and "type" in tools_data
and tools_data["type"] == "function"
):
# Handle the case where tools are nested under 'function'
cleaned_function = self._clean_tools_format(tools_data['function'])
return {'function_declarations': [cleaned_function]}
elif 'function' in tools_data and 'type_' in tools_data and tools_data['type_'] == 'function':
cleaned_function = self._clean_tools_format(tools_data["function"])
return {"function_declarations": [cleaned_function]}
elif (
"function" in tools_data
and "type_" in tools_data
and tools_data["type_"] == "function"
):
# Handle the case where tools are nested under 'function' and type is already 'type_'
cleaned_function = self._clean_tools_format(tools_data['function'])
return {'function_declarations': [cleaned_function]}
cleaned_function = self._clean_tools_format(tools_data["function"])
return {"function_declarations": [cleaned_function]}
else:
new_tools_data = {}
for key, value in tools_data.items():
if key == 'type':
if value == 'string':
new_tools_data['type_'] = 'STRING' # Keep as string for now
elif value == 'object':
new_tools_data['type_'] = 'OBJECT' # Keep as string for now
elif key == 'additionalProperties':
if key == "type":
if value == "string":
new_tools_data["type_"] = "STRING"
elif value == "object":
new_tools_data["type_"] = "OBJECT"
elif key == "additionalProperties":
continue
elif key == 'properties':
elif key == "properties":
if isinstance(value, dict):
new_properties = {}
for prop_name, prop_value in value.items():
if isinstance(prop_value, dict) and 'type' in prop_value:
if prop_value['type'] == 'string':
new_properties[prop_name] = {'type_': 'STRING', 'description': prop_value.get('description')}
if (
isinstance(prop_value, dict)
and "type" in prop_value
):
if prop_value["type"] == "string":
new_properties[prop_name] = {
"type_": "STRING",
"description": prop_value.get(
"description"
),
}
# Add more type mappings as needed
else:
new_properties[prop_name] = self._clean_tools_format(prop_value)
new_properties[prop_name] = (
self._clean_tools_format(prop_value)
)
new_tools_data[key] = new_properties
else:
new_tools_data[key] = self._clean_tools_format(value)
@@ -74,65 +91,64 @@ class GoogleLLM(BaseLLM):
tools=None,
formatting="openai",
**kwargs
):
from google import genai
from google.genai import types
client = genai.Client(api_key=self.api_key)
):
config = {}
model_name = "gemini-2.0-flash-exp"
config = {
}
model = 'gemini-2.0-flash-exp'
if formatting=="raw":
response = client.models.generate_content(
model=model,
contents=messages
)
else:
model = genai.GenerativeModel(
model_name=model,
generation_config=config,
system_instruction=messages[0]["content"],
tools=self._clean_tools_format(tools)
)
chat_session = model.start_chat(
history=self._clean_messages_google(messages)[:-1]
)
response = chat_session.send_message(
self._clean_messages_google(messages)[-1]
)
logging.info(response)
if formatting == "raw":
client = genai.GenerativeModel(model_name=model_name)
response = client.generate_content(contents=messages)
return response.text
else:
if tools:
client = genai.GenerativeModel(
model_name=model_name,
generation_config=config,
system_instruction=messages[0]["content"],
tools=self._clean_tools_format(tools),
)
chat_session = gen_model.start_chat(
history=self._clean_messages_google(messages)[:-1]
)
response = chat_session.send_message(
self._clean_messages_google(messages)[-1]
)
return response
else:
gen_model = genai.GenerativeModel(
model_name=model_name,
generation_config=config,
system_instruction=messages[0]["content"],
)
chat_session = gen_model.start_chat(
history=self._clean_messages_google(messages)[:-1]
)
response = chat_session.send_message(
self._clean_messages_google(messages)[-1]
)
return response.text
def _raw_gen_stream(
    self, baseself, model, messages, stream=True, tools=None, **kwargs
):
    """Send a chat turn to Gemini and yield the response text chunk by chunk.

    Args:
        baseself: Not used by this method.
        model: Not used by this method; the Gemini model name is fixed
            below.
        messages: OpenAI-style message dicts. ``messages[0]["content"]`` is
            used as the system instruction, the last message is sent as the
            new turn, and the messages in between seed the chat history.
        stream: Forwarded to ``chat_session.send_message``.
        tools: Tool definitions; converted with ``_clean_tools_format``
            before being handed to the model.
        **kwargs: Accepted and ignored.

    Yields:
        The ``text`` of each response chunk whose ``text`` is not ``None``.

    Raises:
        IndexError: If ``messages`` has fewer than two entries, since there
            is then no system instruction or no turn to send.
    """
    config = {}
    model_name = "gemini-2.0-flash-exp"
    gen_model = genai.GenerativeModel(
        model_name=model_name,
        generation_config=config,
        system_instruction=messages[0]["content"],
        tools=self._clean_tools_format(tools),
    )
    # Convert once and reuse: everything but the last entry is history,
    # the last entry is the turn being sent.
    cleaned_messages = self._clean_messages_google(messages)
    chat_session = gen_model.start_chat(history=cleaned_messages[:-1])
    response = chat_session.send_message(cleaned_messages[-1], stream=stream)
    for chunk in response:
        if chunk.text is not None:
            yield chunk.text
def _supports_tools(self):
return True
return True