From abde63fb56ca526e07a1794f3418858b44d60274 Mon Sep 17 00:00:00 2001 From: Mark Sze Date: Thu, 14 Nov 2024 05:20:22 +0000 Subject: [PATCH 01/10] Transfer to AG2 --- autogen/oai/gemini.py | 579 +++++++++++++----- .../graph_rag/test_falkor_graph_rag.py | 4 +- test/oai/test_gemini.py | 216 ++----- 3 files changed, 501 insertions(+), 298 deletions(-) diff --git a/autogen/oai/gemini.py b/autogen/oai/gemini.py index fee3418c78..4f1950ce96 100644 --- a/autogen/oai/gemini.py +++ b/autogen/oai/gemini.py @@ -1,4 +1,4 @@ -# Copyright (c) 2023 - 2024, Owners of https://github.com/ag2ai +# Copyright (c) 2023 - 2024, Owners of https://github.com/autogenhub # # SPDX-License-Identifier: Apache-2.0 # @@ -38,6 +38,8 @@ from __future__ import annotations import base64 +import copy +import json import logging import os import random @@ -45,23 +47,35 @@ import time import warnings from io import BytesIO -from typing import Any, Dict, List, Mapping, Union +from typing import Any, Dict, List, Tuple, Union import google.generativeai as genai +import PIL import requests import vertexai -from google.ai.generativelanguage import Content, Part +from google.ai.generativelanguage import Content, FunctionCall, FunctionDeclaration, FunctionResponse, Part, Tool +from google.ai.generativelanguage_v1beta.types import Schema from google.auth.credentials import Credentials -from openai.types.chat import ChatCompletion +from jsonschema import ValidationError +from openai.types.chat import ChatCompletion, ChatCompletionMessageToolCall from openai.types.chat.chat_completion import ChatCompletionMessage, Choice from openai.types.completion_usage import CompletionUsage from PIL import Image -from vertexai.generative_models import Content as VertexAIContent +from vertexai.generative_models import ( + Content as VertexAIContent, +) +from vertexai.generative_models import ( + FunctionDeclaration as vaiFunctionDeclaration, +) from vertexai.generative_models import GenerativeModel from vertexai.generative_models import HarmBlockThreshold as VertexAIHarmBlockThreshold from vertexai.generative_models import HarmCategory as VertexAIHarmCategory +from vertexai.generative_models import Image as VertexAIImage from vertexai.generative_models import Part as VertexAIPart from vertexai.generative_models import SafetySetting as VertexAISafetySetting +from vertexai.generative_models import ( + Tool as vaiTool, +) logger = logging.getLogger(__name__) @@ -160,6 +174,7 @@ def get_usage(response) -> Dict: } def create(self, params: Dict) -> ChatCompletion: + if self.use_vertexai: self._initialize_vertexai(**params) else: @@ -167,11 +182,16 @@ def create(self, params: Dict) -> ChatCompletion: "location" not in params ), "Google Cloud project and compute location cannot be set when using an API Key!" model_name = params.get("model", "gemini-pro") - if not model_name: + + if model_name == "gemini-pro-vision": + raise ValueError( + "Gemini 1.0 Pro vision ('gemini-pro-vision') has been deprecated, please consider switching to a different model, for example 'gemini-1.5-flash'." + ) + elif not model_name: raise ValueError( "Please provide a model name for the Gemini Client. " "You can configure it in the OAI Config List file. " - "See this [LLM configuration tutorial](https://ag2ai.github.io/autogen/docs/topics/llm_configuration/) for more details." + "See this [LLM configuration tutorial](https://autogenhub.github.io/autogen/docs/topics/llm_configuration/) for more details." ) params.get("api_type", "google") # not used @@ -180,6 +200,10 @@ def create(self, params: Dict) -> ChatCompletion: n_response = params.get("n", 1) system_instruction = params.get("system_instruction", None) response_validation = params.get("response_validation", True) + if "tools" in params: + tools = self._tools_to_gemini_tools(params["tools"]) + else: + tools = None generation_config = { gemini_term: params[autogen_term] @@ -196,77 +220,92 @@ def create(self, params: Dict) -> ChatCompletion: "Streaming is not supported for Gemini yet, and it will have no effect. Please set stream=False.", UserWarning, ) + stream = False if n_response > 1: warnings.warn("Gemini only supports `n=1` for now. We only generate one response.", UserWarning) - if "vision" not in model_name: - # A. create and call the chat model. - gemini_messages = self._oai_messages_to_gemini_messages(messages) - if self.use_vertexai: - model = GenerativeModel( - model_name, - generation_config=generation_config, - safety_settings=safety_settings, - system_instruction=system_instruction, - ) - chat = model.start_chat(history=gemini_messages[:-1], response_validation=response_validation) - else: - # we use chat model by default - model = genai.GenerativeModel( - model_name, - generation_config=generation_config, - safety_settings=safety_settings, - system_instruction=system_instruction, - ) - genai.configure(api_key=self.api_key) - chat = model.start_chat(history=gemini_messages[:-1]) - - response = chat.send_message(gemini_messages[-1].parts, stream=stream, safety_settings=safety_settings) - ans: str = chat.history[-1].parts[0].text - prompt_tokens = model.count_tokens(chat.history[:-1]).total_tokens - completion_tokens = model.count_tokens(ans).total_tokens - elif model_name == "gemini-pro-vision": - # B. handle the vision model - if self.use_vertexai: - model = GenerativeModel( - model_name, - generation_config=generation_config, - safety_settings=safety_settings, - system_instruction=system_instruction, - ) - else: - model = genai.GenerativeModel( - model_name, - generation_config=generation_config, - safety_settings=safety_settings, - system_instruction=system_instruction, - ) - genai.configure(api_key=self.api_key) - # Gemini's vision model does not support chat history yet - # chat = model.start_chat(history=gemini_messages[:-1]) - # response = chat.send_message(gemini_messages[-1].parts) - user_message = self._oai_content_to_gemini_content(messages[-1]["content"]) - if len(messages) > 2: - warnings.warn( - "Warning: Gemini's vision model does not support chat history yet.", - "We only use the last message as the prompt.", - UserWarning, - ) + autogen_tool_calls = [] - response = model.generate_content(user_message, stream=stream) - # ans = response.text - if self.use_vertexai: - ans: str = response.candidates[0].content.parts[0].text - else: - ans: str = response._result.candidates[0].content.parts[0].text + # Maps the function call ids to function names so we can inject it into FunctionResponse messages + self.tool_call_function_map: Dict[str, str] = {} - prompt_tokens = model.count_tokens(user_message).total_tokens - completion_tokens = model.count_tokens(ans).total_tokens + # A. create and call the chat model. + gemini_messages = self._oai_messages_to_gemini_messages(messages) + if self.use_vertexai: + model = GenerativeModel( + model_name, + generation_config=generation_config, + safety_settings=safety_settings, + system_instruction=system_instruction, + tools=tools, + ) + + chat = model.start_chat(history=gemini_messages[:-1], response_validation=response_validation) + else: + model = genai.GenerativeModel( + model_name, + generation_config=generation_config, + safety_settings=safety_settings, + system_instruction=system_instruction, + tools=tools, + ) + + genai.configure(api_key=self.api_key) + chat = model.start_chat(history=gemini_messages[:-1]) + + response = chat.send_message(gemini_messages[-1].parts, stream=stream, safety_settings=safety_settings) + + # Extract text and tools from response + ans = "" + random_id = random.randint(0, 10000) + prev_function_calls = [] + for part in response.parts: + + # Function calls + if fn_call := part.function_call: + + # If we have a repeated function call, ignore it + if fn_call not in prev_function_calls: + autogen_tool_calls.append( + ChatCompletionMessageToolCall( + id=random_id, + function={ + "name": fn_call.name, + "arguments": ( + json.dumps({key: val for key, val in fn_call.args.items()}) + if fn_call.args is not None + else "" + ), + }, + type="function", + ) + ) + + prev_function_calls.append(fn_call) + random_id += 1 + + # Plain text content + elif text := part.text: + ans += text + + # If we have function calls, ignore the text + # as it can be Gemini guessing the function response + if len(autogen_tool_calls) != 0: + ans = "" + else: + autogen_tool_calls = None + + prompt_tokens = response.usage_metadata.prompt_token_count + completion_tokens = response.usage_metadata.candidates_token_count # 3. convert output - message = ChatCompletionMessage(role="assistant", content=ans, function_call=None, tool_calls=None) - choices = [Choice(finish_reason="stop", index=0, message=message)] + message = ChatCompletionMessage( + role="assistant", content=ans, function_call=None, tool_calls=autogen_tool_calls + ) + choices = [ + Choice(finish_reason="tool_calls" if autogen_tool_calls is not None else "stop", index=0, message=message) + ] response_oai = ChatCompletion( id=str(random.randint(0, 1000)), @@ -279,50 +318,105 @@ def create(self, params: Dict) -> ChatCompletion: completion_tokens=completion_tokens, total_tokens=prompt_tokens + completion_tokens, ), - cost=calculate_gemini_cost(prompt_tokens, completion_tokens, model_name), + cost=calculate_gemini_cost(self.use_vertexai, prompt_tokens, completion_tokens, model_name), ) return response_oai - def _oai_content_to_gemini_content(self, content: Union[str, List]) -> List: - """Convert content from OAI format to Gemini format""" + def _oai_content_to_gemini_content(self, message: Dict[str, Any]) -> Tuple[List, str]: + """Convert AutoGen content to Gemini parts, catering for text and tool calls""" rst = [] - if isinstance(content, str): + + if message["role"] == "tool": + # Tool call recommendation + + function_name = self.tool_call_function_map[message["tool_call_id"]] + + if self.use_vertexai: + rst.append( + VertexAIPart.from_function_response( + name=function_name, response={"result": self._to_json_or_str(message["content"])} + ) + ) + else: + rst.append( + Part( + function_response=FunctionResponse( + name=function_name, response={"result": self._to_json_or_str(message["content"])} + ) + ) + ) + + return rst, "tool" + elif "tool_calls" in message and len(message["tool_calls"]) != 0: + for tool_call in message["tool_calls"]: + + function_id = tool_call["id"] + function_name = tool_call["function"]["name"] + self.tool_call_function_map[function_id] = function_name + + if self.use_vertexai: + rst.append( + VertexAIPart.from_dict( + { + "functionCall": { + "name": function_name, + "args": json.loads(tool_call["function"]["arguments"]), + } + } + ) + ) + else: + rst.append( + Part( + function_call=FunctionCall( + name=function_name, + args=json.loads(tool_call["function"]["arguments"]), + ) + ) + ) + + return rst, "tool_call" + + elif isinstance(message["content"], str): + content = message["content"] if content == "": content = "empty" # Empty content is not allowed. if self.use_vertexai: rst.append(VertexAIPart.from_text(content)) else: rst.append(Part(text=content)) - return rst - - assert isinstance(content, list) - for msg in content: - if isinstance(msg, dict): - assert "type" in msg, f"Missing 'type' field in message: {msg}" - if msg["type"] == "text": - if self.use_vertexai: - rst.append(VertexAIPart.from_text(text=msg["text"])) + return rst, "text" + + # For images the message contains a list of text items + if isinstance(message["content"], list): + has_image = False + for msg in message["content"]: + if isinstance(msg, dict): + assert "type" in msg, f"Missing 'type' field in message: {msg}" + if msg["type"] == "text": + if self.use_vertexai: + rst.append(VertexAIPart.from_text(text=msg["text"])) + else: + rst.append(Part(text=msg["text"])) + elif msg["type"] == "image_url": + if self.use_vertexai: + img_url = msg["image_url"]["url"] + img_part = VertexAIPart.from_uri(img_url, mime_type="image/png") + rst.append(img_part) + else: + b64_img = get_image_data(msg["image_url"]["url"]) + rst.append(Part(inline_data={"mime_type": "image/png", "data": b64_img})) + + has_image = True else: - rst.append(Part(text=msg["text"])) - elif msg["type"] == "image_url": - if self.use_vertexai: - img_url = msg["image_url"]["url"] - re.match(r"data:image/(?:png|jpeg);base64,", img_url) - img = get_image_data(img_url, use_b64=False) - # image/png works with jpeg as well - img_part = VertexAIPart.from_data(img, mime_type="image/png") - rst.append(img_part) - else: - b64_img = get_image_data(msg["image_url"]["url"]) - img = _to_pil(b64_img) - rst.append(img) + raise ValueError(f"Unsupported message type: {msg['type']}") else: - raise ValueError(f"Unsupported message type: {msg['type']}") - else: - raise ValueError(f"Unsupported message type: {type(msg)}") - return rst + raise ValueError(f"Unsupported message type: {type(msg)}") + return rst, "image" if has_image else "text" + else: + raise Exception("Unable to convert content to Gemini format.") def _concat_parts(self, parts: List[Part]) -> List: """Concatenate parts with the same type. @@ -358,39 +452,178 @@ def _oai_messages_to_gemini_messages(self, messages: list[Dict[str, Any]]) -> li Make sure the "user" role and "model" role are interleaved. Also, make sure the last item is from the "user" role. """ - prev_role = None rst = [] - curr_parts = [] - for i, message in enumerate(messages): - parts = self._oai_content_to_gemini_content(message["content"]) + for message in messages: + parts, part_type = self._oai_content_to_gemini_content(message) role = "user" if message["role"] in ["user", "system"] else "model" - if (prev_role is None) or (role == prev_role): - curr_parts += parts - elif role != prev_role: - if self.use_vertexai: - rst.append(VertexAIContent(parts=curr_parts, role=prev_role)) - else: - rst.append(Content(parts=curr_parts, role=prev_role)) - curr_parts = parts - prev_role = role - # handle the last message - if self.use_vertexai: - rst.append(VertexAIContent(parts=curr_parts, role=role)) - else: - rst.append(Content(parts=curr_parts, role=role)) + if part_type == "text": + rst.append( + VertexAIContent(parts=parts, role=role) + if self.use_vertexai + else rst.append(Content(parts=parts, role=role)) + ) + elif part_type == "tool": + rst.append( + VertexAIContent(parts=parts, role="function") + if self.use_vertexai + else rst.append(Content(parts=parts, role="function")) + ) + elif part_type == "tool_call": + rst.append( + VertexAIContent(parts=parts, role="function") + if self.use_vertexai + else rst.append(Content(parts=parts, role="function")) + ) + elif part_type == "image": + # Image has multiple parts, some can be text and some can be image based + text_parts = [] + image_parts = [] + for part in parts: + if isinstance(part, Part): + # Text or non-Vertex AI image part + text_parts.append(part) + elif isinstance(part, VertexAIPart): + # Image + image_parts.append(part) + else: + raise Exception("Unable to process image part") + + if len(text_parts) > 0: + rst.append( + VertexAIContent(parts=text_parts, role=role) + if self.use_vertexai + else rst.append(Content(parts=text_parts, role=role)) + ) + + if len(image_parts) > 0: + rst.append( + VertexAIContent(parts=image_parts, role=role) + if self.use_vertexai + else rst.append(Content(parts=image_parts, role=role)) + ) + + if len(rst) != 0 and rst[-1] is None: + rst.pop() # The Gemini is restrict on order of roles, such that # 1. The messages should be interleaved between user and model. # 2. The last message must be from the user role. # We add a dummy message "continue" if the last role is not the user. - if rst[-1].role != "user": + if rst[-1].role not in ["user", "function"]: + text_part, type = self._oai_content_to_gemini_content({"content": "continue"}) + rst.append( + VertexAIContent(parts=text_part, role="user") + if self.use_vertexai + else Content(parts=text_part, role="user") + ) + + return rst + + def _tools_to_gemini_tools(self, tools: List[Dict[str, Any]]) -> List[Tool]: + """Create Gemini tools (as typically requires Callables)""" + + functions = [] + for tool in tools: if self.use_vertexai: - rst.append(VertexAIContent(parts=self._oai_content_to_gemini_content("continue"), role="user")) + function = vaiFunctionDeclaration( + name=tool["function"]["name"], + description=tool["function"]["description"], + parameters=tool["function"]["parameters"], + ) else: - rst.append(Content(parts=self._oai_content_to_gemini_content("continue"), role="user")) + function = GeminiClient._create_gemini_function_declaration(tool) + functions.append(function) - return rst + if self.use_vertexai: + return [vaiTool(function_declarations=functions)] + else: + return [Tool(function_declarations=functions)] + + @staticmethod + def _create_gemini_function_declaration(tool: Dict) -> FunctionDeclaration: + function_declaration = FunctionDeclaration() + function_declaration.name = tool["function"]["name"] + function_declaration.description = tool["function"]["description"] + if len(tool["function"]["parameters"]["properties"]) != 0: + function_declaration.parameters = GeminiClient._create_gemini_function_parameters( + copy.deepcopy(tool["function"]["parameters"]) + ) + + return function_declaration + + @staticmethod + def _create_gemini_function_declaration_schema(json_data) -> Schema: + """Recursively creates Schema objects for FunctionDeclaration.""" + param_schema = Schema() + param_type = json_data["type"] + + """ + TYPE_UNSPECIFIED = 0 + STRING = 1 + INTEGER = 2 + NUMBER = 3 + OBJECT = 4 + ARRAY = 5 + BOOLEAN = 6 + """ + + if param_type == "integer": + param_schema.type_ = 2 + elif param_type == "number": + param_schema.type_ = 3 + elif param_type == "string": + param_schema.type_ = 1 + elif param_type == "boolean": + param_schema.type_ = 6 + elif param_type == "array": + param_schema.type_ = 5 + if "items" in json_data: + param_schema.items = GeminiClient._create_gemini_function_declaration_schema(json_data["items"]) + else: + print("Warning: Array schema missing 'items' definition.") + elif param_type == "object": + param_schema.type_ = 4 + param_schema.properties = {} + if "properties" in json_data: + for prop_name, prop_data in json_data["properties"].items(): + param_schema.properties[prop_name] = GeminiClient._create_gemini_function_declaration_schema( + prop_data + ) + else: + print("Warning: Object schema missing 'properties' definition.") + + elif param_type in ("null", "any"): + param_schema.type_ = 1 # Treating these as strings for simplicity + else: + print(f"Warning: Unsupported parameter type '{param_type}'.") + + if "description" in json_data: + param_schema.description = json_data["description"] + + return param_schema + + def _create_gemini_function_parameters(function_parameter: dict[str, any]) -> dict[str, any]: + """Convert function parameters to Gemini format, recursive""" + + function_parameter["type_"] = function_parameter["type"].upper() + + # Parameter properties and items + if "properties" in function_parameter: + for key in function_parameter["properties"]: + function_parameter["properties"][key] = GeminiClient._create_gemini_function_parameters( + function_parameter["properties"][key] + ) + + if "items" in function_parameter: + function_parameter["items"] = GeminiClient._create_gemini_function_parameters(function_parameter["items"]) + + # Remove any attributes not needed + for attr in ["type", "default"]: + if attr in function_parameter: + del function_parameter[attr] + + return function_parameter @staticmethod def _to_vertexai_safety_settings(safety_settings): @@ -421,21 +654,13 @@ def _to_vertexai_safety_settings(safety_settings): else: return safety_settings - -def _to_pil(data: str) -> Image.Image: - """ - Converts a base64 encoded image data string to a PIL Image object. - - This function first decodes the base64 encoded string to bytes, then creates a BytesIO object from the bytes, - and finally creates and returns a PIL Image object from the BytesIO object. - - Parameters: - data (str): The base64 encoded image data string. - - Returns: - Image.Image: The PIL Image object created from the input data. - """ - return Image.open(BytesIO(base64.b64decode(data))) + @staticmethod + def _to_json_or_str(data: str) -> Union[Dict, str]: + try: + json_data = json.loads(data) + return json_data + except (json.JSONDecodeError, ValidationError): + return data def get_image_data(image_file: str, use_b64=True) -> bytes: @@ -456,14 +681,76 @@ def get_image_data(image_file: str, use_b64=True) -> bytes: return content -def calculate_gemini_cost(input_tokens: int, output_tokens: int, model_name: str) -> float: - if "1.5" in model_name or "gemini-experimental" in model_name: - # "gemini-1.5-pro-preview-0409" - # Cost is $7 per million input tokens and $21 per million output tokens - return 7.0 * input_tokens / 1e6 + 21.0 * output_tokens / 1e6 +def calculate_gemini_cost(use_vertexai: bool, input_tokens: int, output_tokens: int, model_name: str) -> float: + + def total_cost_mil(cost_per_mil_input: float, cost_per_mil_output: float): + # Cost per million + return cost_per_mil_input * input_tokens / 1e6 + cost_per_mil_output * output_tokens / 1e6 + + def total_cost_k(cost_per_k_input: float, cost_per_k_output: float): + # Cost per thousand + return cost_per_k_input * input_tokens / 1e3 + cost_per_k_output * output_tokens / 1e3 + + model_name = model_name.lower() + up_to_128k = input_tokens <= 128000 + + if use_vertexai: + # Vertex AI pricing - based on Text input + # https://cloud.google.com/vertex-ai/generative-ai/pricing#vertex-ai-pricing + + if "gemini-1.5-flash" in model_name: + if up_to_128k: + return total_cost_k(0.00001875, 0.000075) + else: + return total_cost_k(0.0000375, 0.00015) + + elif "gemini-1.5-pro" in model_name: + if up_to_128k: + return total_cost_k(0.0003125, 0.00125) + else: + return total_cost_k(0.000625, 0.0025) + + elif "gemini-1.0-pro" in model_name: + return total_cost_k(0.000125, 0.00001875) + + else: + warnings.warn( + f"Cost calculation is not implemented for model {model_name}. Cost will be calculated zero.", + UserWarning, + ) + return 0 + + else: + # Non-Vertex AI pricing + + if "gemini-1.5-flash-8b" in model_name: + # https://ai.google.dev/pricing#1_5flash-8B + if up_to_128k: + return total_cost_mil(0.0375, 0.15) + else: + return total_cost_mil(0.075, 0.3) - if "gemini-pro" not in model_name and "gemini-1.0-pro" not in model_name: - warnings.warn(f"Cost calculation is not implemented for model {model_name}. Using Gemini-1.0-Pro.", UserWarning) + elif "gemini-1.5-flash" in model_name: + # https://ai.google.dev/pricing#1_5flash + if up_to_128k: + return total_cost_mil(0.075, 0.3) + else: + return total_cost_mil(0.15, 0.6) + + elif "gemini-1.5-pro" in model_name: + # https://ai.google.dev/pricing#1_5pro + if up_to_128k: + return total_cost_mil(1.25, 5.0) + else: + return total_cost_mil(2.50, 10.0) + + elif "gemini-1.0-pro" in model_name: + # https://ai.google.dev/pricing#1_5pro + return total_cost_mil(0.50, 1.5) - # Cost is $0.5 per million input tokens and $1.5 per million output tokens - return 0.5 * input_tokens / 1e6 + 1.5 * output_tokens / 1e6 + else: + warnings.warn( + f"Cost calculation is not implemented for model {model_name}. Cost will be calculated zero.", + UserWarning, + ) + return 0 diff --git a/test/agentchat/contrib/graph_rag/test_falkor_graph_rag.py b/test/agentchat/contrib/graph_rag/test_falkor_graph_rag.py index 8814479da9..5b61454e9e 100644 --- a/test/agentchat/contrib/graph_rag/test_falkor_graph_rag.py +++ b/test/agentchat/contrib/graph_rag/test_falkor_graph_rag.py @@ -3,7 +3,7 @@ import pytest from conftest import reason, skip_openai # noqa: E402 from graphrag_sdk import KnowledgeGraph, Source -from graphrag_sdk.schema import Schema +from graphrag_sdk.ontology import Ontology try: from autogen.agentchat.contrib.graph_rag.document import ( @@ -34,7 +34,7 @@ def test_falkor_db_query_engine(): 3. Query it with a question and verify the result contains the critical information. """ # Arrange - test_schema = Schema() + test_schema = Ontology() actor = test_schema.add_entity("Actor").add_attribute("name", str, unique=True) movie = test_schema.add_entity("Movie").add_attribute("title", str, unique=True) test_schema.add_relation("ACTED", actor, movie) diff --git a/test/oai/test_gemini.py b/test/oai/test_gemini.py index b5b84cd028..7bc834b3bd 100644 --- a/test/oai/test_gemini.py +++ b/test/oai/test_gemini.py @@ -1,4 +1,4 @@ -# Copyright (c) 2023 - 2024, Owners of https://github.com/ag2ai +# Copyright (c) 2023 - 2024, Owners of https://github.com/autogenhub # # SPDX-License-Identifier: Apache-2.0 # @@ -114,28 +114,23 @@ def test_gemini_message_handling(gemini_client): {"role": "model", "content": "How can I help you?"}, {"role": "user", "content": "Which planet is the nearest to the sun?"}, {"role": "user", "content": "Which planet is the farthest from the sun?"}, - {"role": "model", "content": "Mercury is the closest palnet to the sun."}, - {"role": "model", "content": "Neptune is the farthest palnet from the sun."}, + {"role": "model", "content": "Mercury is the closest planet to the sun."}, + {"role": "model", "content": "Neptune is the farthest planet from the sun."}, {"role": "user", "content": "How can we determine the mass of a black hole?"}, ] # The datastructure below defines what the structure of the messages # should resemble after converting to Gemini format. - # Messages of similar roles are expected to be merged to a single message, - # where the contents of the original messages will be included in - # consecutive parts of the converted Gemini message + # Historically it has merged messages and ensured alternating roles, + # this no longer appears to be required by the Gemini API expected_gemini_struct = [ # system role is converted to user role {"role": "user", "parts": ["You are my personal assistant."]}, {"role": "model", "parts": ["How can I help you?"]}, - { - "role": "user", - "parts": ["Which planet is the nearest to the sun?", "Which planet is the farthest from the sun?"], - }, - { - "role": "model", - "parts": ["Mercury is the closest palnet to the sun.", "Neptune is the farthest palnet from the sun."], - }, + {"role": "user", "parts": ["Which planet is the nearest to the sun?"]}, + {"role": "user", "parts": ["Which planet is the farthest from the sun?"]}, + {"role": "model", "parts": ["Mercury is the closest planet to the sun."]}, + {"role": "model", "parts": ["Neptune is the farthest planet from the sun."]}, {"role": "user", "parts": ["How can we determine the mass of a black hole?"]}, ] @@ -286,22 +281,33 @@ def test_cost_calculation(gemini_client, mock_response): @pytest.mark.skipif(skip, reason="Google GenAI dependency is not installed") @patch("autogen.oai.gemini.genai.GenerativeModel") -@patch("autogen.oai.gemini.genai.configure") -def test_create_response(mock_configure, mock_generative_model, gemini_client): +# @patch("autogen.oai.gemini.genai.configure") +@patch("autogen.oai.gemini.calculate_gemini_cost") +def test_create_response_with_text(mock_calculate_cost, mock_generative_model, gemini_client): # Mock the genai model configuration and creation process mock_chat = MagicMock() mock_model = MagicMock() - mock_configure.return_value = None + # mock_configure.return_value = None mock_generative_model.return_value = mock_model mock_model.start_chat.return_value = mock_chat - # Set up a mock for the chat history item access and the text attribute return - mock_history_part = MagicMock() - mock_history_part.text = "Example response" - mock_chat.history.__getitem__.return_value.parts.__getitem__.return_value = mock_history_part + # Set up mock token counts with real integers + mock_usage_metadata = MagicMock() + mock_usage_metadata.prompt_token_count = 100 + mock_usage_metadata.candidates_token_count = 50 + + # Setup the mock to return a response with only text content + mock_text_part = MagicMock() + mock_text_part.text = "Example response" + mock_text_part.function_call = None - # Setup the mock to return a mocked chat response - mock_chat.send_message.return_value = MagicMock(history=[MagicMock(parts=[MagicMock(text="Example response")])]) + mock_response = MagicMock() + mock_response.parts = [mock_text_part] + mock_response.usage_metadata = mock_usage_metadata + mock_chat.send_message.return_value = mock_response + + # Mock the calculate_gemini_cost function + mock_calculate_cost.return_value = 0.002 # Call the create method response = gemini_client.create( @@ -309,13 +315,25 @@ def test_create_response(mock_configure, mock_generative_model, gemini_client): ) # Assertions to check if response is structured as expected + # assert isinstance(response, ChatCompletion), "Response should be an instance of ChatCompletion" assert response.choices[0].message.content == "Example response", "Response content should match expected output" + assert not response.choices[0].message.tool_calls, "There should be no tool calls" + assert response.usage.prompt_tokens == 100, "Prompt tokens should match the mocked value" + assert response.usage.completion_tokens == 50, "Completion tokens should match the mocked value" + assert response.usage.total_tokens == 150, "Total tokens should be the sum of prompt and completion tokens" + assert response.cost == 0.002, "Cost should match the mocked calculate_gemini_cost return value" + + # Verify that calculate_gemini_cost was called with the correct arguments + mock_calculate_cost.assert_called_once_with(False, 100, 50, "gemini-pro") @pytest.mark.skipif(skip, reason="Google GenAI dependency is not installed") @patch("autogen.oai.gemini.GenerativeModel") @patch("autogen.oai.gemini.vertexai.init") -def test_vertexai_create_response(mock_init, mock_generative_model, gemini_client_with_credentials): +@patch("autogen.oai.gemini.calculate_gemini_cost") +def test_vertexai_create_response( + mock_calculate_cost, mock_init, mock_generative_model, gemini_client_with_credentials +): # Mock the genai model configuration and creation process mock_chat = MagicMock() mock_model = MagicMock() @@ -323,139 +341,37 @@ def test_vertexai_create_response(mock_init, mock_generative_model, gemini_clien mock_generative_model.return_value = mock_model mock_model.start_chat.return_value = mock_chat - # Set up a mock for the chat history item access and the text attribute return - mock_history_part = MagicMock() - mock_history_part.text = "Example response" - mock_chat.history.__getitem__.return_value.parts.__getitem__.return_value = mock_history_part - - # Setup the mock to return a mocked chat response - mock_chat.send_message.return_value = MagicMock(history=[MagicMock(parts=[MagicMock(text="Example response")])]) - - # Call the create method - response = gemini_client_with_credentials.create( - {"model": "gemini-pro", "messages": [{"content": "Hello", "role": "user"}], "stream": False} - ) - - # Assertions to check if response is structured as expected - assert response.choices[0].message.content == "Example response", "Response content should match expected output" - + # Set up mock token counts with real integers + mock_usage_metadata = MagicMock() + mock_usage_metadata.prompt_token_count = 100 + mock_usage_metadata.candidates_token_count = 50 -@pytest.mark.skipif(skip, reason="Google GenAI dependency is not installed") -@patch("autogen.oai.gemini.GenerativeModel") -@patch("autogen.oai.gemini.vertexai.init") -def test_vertexai_default_auth_create_response(mock_init, mock_generative_model, gemini_google_auth_default_client): - # Mock the genai model configuration and creation process - mock_chat = MagicMock() - mock_model = MagicMock() - mock_init.return_value = None - mock_generative_model.return_value = mock_model - mock_model.start_chat.return_value = mock_chat + # Setup the mock to return a response with only text content + mock_text_part = MagicMock() + mock_text_part.text = "Example response" + mock_text_part.function_call = None - # Set up a mock for the chat history item access and the text attribute return - mock_history_part = MagicMock() - mock_history_part.text = "Example response" - mock_chat.history.__getitem__.return_value.parts.__getitem__.return_value = mock_history_part + mock_response = MagicMock() + mock_response.parts = [mock_text_part] + mock_response.usage_metadata = mock_usage_metadata + mock_chat.send_message.return_value = mock_response - # Setup the mock to return a mocked chat response - mock_chat.send_message.return_value = MagicMock(history=[MagicMock(parts=[MagicMock(text="Example response")])]) + # Mock the calculate_gemini_cost function + mock_calculate_cost.return_value = 0.002 # Call the create method - response = gemini_google_auth_default_client.create( + response = gemini_client_with_credentials.create( {"model": "gemini-pro", "messages": [{"content": "Hello", "role": "user"}], "stream": False} ) # Assertions to check if response is structured as expected + # assert isinstance(response, ChatCompletion), "Response should be an instance of ChatCompletion" assert response.choices[0].message.content == "Example response", "Response content should match expected output" - - -@pytest.mark.skipif(skip, reason="Google GenAI dependency is not installed") -@patch("autogen.oai.gemini.genai.GenerativeModel") -@patch("autogen.oai.gemini.genai.configure") -def test_create_vision_model_response(mock_configure, mock_generative_model, gemini_client): - # Mock the genai model configuration and creation process - mock_model = MagicMock() - mock_configure.return_value = None - mock_generative_model.return_value = mock_model - - # Set up a mock to simulate the vision model behavior - mock_vision_response = MagicMock() - mock_vision_part = MagicMock(text="Vision model output") - - # Setting up the chain of return values for vision model response - mock_vision_response._result.candidates.__getitem__.return_value.content.parts.__getitem__.return_value = ( - mock_vision_part - ) - mock_model.generate_content.return_value = mock_vision_response - - # Call the create method with vision model parameters - response = gemini_client.create( - { - "model": "gemini-pro-vision", # Vision model name - "messages": [ - { - "content": [ - {"type": "text", "text": "Let's play a game."}, - { - "type": "image_url", - "image_url": { - "url": "" - }, - }, - ], - "role": "user", - } - ], # Assuming a simple content input for vision - "stream": False, - } - ) - - # Assertions to check if response is structured as expected - assert ( - response.choices[0].message.content == "Vision model output" - ), "Response content should match expected output from vision model" - - -@pytest.mark.skipif(skip, reason="Google GenAI dependency is not installed") -@patch("autogen.oai.gemini.GenerativeModel") -@patch("autogen.oai.gemini.vertexai.init") -def test_vertexai_create_vision_model_response(mock_init, mock_generative_model, gemini_google_auth_default_client): - # Mock the genai model configuration and creation process - mock_model = MagicMock() - mock_init.return_value = None - mock_generative_model.return_value = mock_model - - # Set up a mock to simulate the vision model behavior - mock_vision_response = MagicMock() - mock_vision_part = MagicMock(text="Vision model output") - - # Setting up the chain of return values for vision model response - mock_vision_response.candidates.__getitem__.return_value.content.parts.__getitem__.return_value = mock_vision_part - - mock_model.generate_content.return_value = mock_vision_response - - # Call the create method with vision model parameters - response = gemini_google_auth_default_client.create( - { - "model": "gemini-pro-vision", # Vision model name - "messages": [ - { - "content": [ - {"type": "text", "text": "Let's play a game."}, - { - "type": "image_url", - "image_url": { - "url": "" - }, - }, - ], - "role": "user", - } - ], # Assuming a simple content input for vision - "stream": False, - } - ) - - # Assertions to check if response is structured as expected - assert ( - response.choices[0].message.content == "Vision model output" - ), "Response content should match expected output from vision model" + assert not response.choices[0].message.tool_calls, "There should be no tool calls" + assert response.usage.prompt_tokens == 100, "Prompt tokens should match the mocked value" + assert response.usage.completion_tokens == 50, "Completion tokens should match the mocked value" + assert response.usage.total_tokens == 150, "Total tokens should be the sum of prompt and completion tokens" + assert response.cost == 0.002, "Cost should match the mocked calculate_gemini_cost return value" + + # Verify that calculate_gemini_cost was called with the correct arguments + mock_calculate_cost.assert_called_once_with(True, 100, 50, "gemini-pro") From 3a3ffa0c89c22ede68471d70057d7eb9c63d889b Mon Sep 17 00:00:00 2001 From: Mark Sze Date: Sun, 1 Dec 2024 21:20:40 +0000 Subject: [PATCH 02/10] Remove unnecessary test file --- .../graph_rag/test_falkor_graph_rag.py | 61 ------------------- 1 file changed, 61 deletions(-) delete mode 100644 test/agentchat/contrib/graph_rag/test_falkor_graph_rag.py diff --git a/test/agentchat/contrib/graph_rag/test_falkor_graph_rag.py b/test/agentchat/contrib/graph_rag/test_falkor_graph_rag.py deleted file mode 100644 index 5b61454e9e..0000000000 --- a/test/agentchat/contrib/graph_rag/test_falkor_graph_rag.py +++ /dev/null @@ -1,61 +0,0 @@ -import sys - -import pytest -from conftest import reason, skip_openai # noqa: E402 -from graphrag_sdk import KnowledgeGraph, Source -from graphrag_sdk.ontology import Ontology - -try: - from autogen.agentchat.contrib.graph_rag.document import ( - Document, - DocumentType, - ) - from autogen.agentchat.contrib.graph_rag.falkor_graph_query_engine import ( - FalkorGraphQueryEngine, - GraphStoreQueryResult, - ) -except ImportError: - skip = True -else: - skip = False - -reason = "do not run on MacOS or windows OR dependency is not installed OR " + reason - - -@pytest.mark.skipif( - sys.platform in ["darwin", "win32"] or skip or skip_openai, - reason=reason, -) -def test_falkor_db_query_engine(): - """ - Test Falkor DB Query Engine. - 1. create a test Falkor DB Query Engine with a schema. - 2. Initialize it with an input txt file. - 3. Query it with a question and verify the result contains the critical information. - """ - # Arrange - test_schema = Ontology() - actor = test_schema.add_entity("Actor").add_attribute("name", str, unique=True) - movie = test_schema.add_entity("Movie").add_attribute("title", str, unique=True) - test_schema.add_relation("ACTED", actor, movie) - - query_engine = FalkorGraphQueryEngine(schema=test_schema) - - source_file = "test/agentchat/contrib/graph_rag/the_matrix.txt" - input_docs = [Document(doctype=DocumentType.TEXT, path_or_url=source_file)] - - question = "Name a few actors who've played in 'The Matrix'" - - # Act - query_engine.init_db(input_doc=input_docs) - - query_result: GraphStoreQueryResult = query_engine.query(question=question) - - # Assert - assert query_result.answer.find("Keanu Reeves") >= 0 - for message in query_result.messages: - if isinstance(message, dict) and "role" in message and message["role"] == "user": - assert "content" in message - assert message["content"] is question - return - pytest.fail("Question not found in message history.") From 4dbb7a5adcf85d020f7f69b3b262efc8e608b0f6 Mon Sep 17 00:00:00 2001 From: Mark Sze Date: Sun, 1 Dec 2024 21:24:03 +0000 Subject: [PATCH 03/10] Exception note update Signed-off-by: Mark Sze --- autogen/oai/gemini.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/autogen/oai/gemini.py b/autogen/oai/gemini.py index 4f1950ce96..738eeafd0f 100644 --- a/autogen/oai/gemini.py +++ b/autogen/oai/gemini.py @@ -191,7 +191,7 @@ def create(self, params: Dict) -> ChatCompletion: raise ValueError( "Please provide a model name for the Gemini Client. " "You can configure it in the OAI Config List file. " - "See this [LLM configuration tutorial](https://autogenhub.github.io/autogen/docs/topics/llm_configuration/) for more details." + "See this [LLM configuration tutorial](https://ag2ai.github.io/ag2/docs/topics/llm_configuration/) for more details." ) params.get("api_type", "google") # not used From a3d12bee8c2d4976d0c2353c6267a14354e8f972 Mon Sep 17 00:00:00 2001 From: Mark Sze Date: Sun, 1 Dec 2024 21:28:02 +0000 Subject: [PATCH 04/10] Update FalkorDB test file to reconcile Signed-off-by: Mark Sze --- .../graph_rag/test_falkor_graph_rag.py | 66 +++++++++++++++++++ 1 file changed, 66 insertions(+) create mode 100644 test/agentchat/contrib/graph_rag/test_falkor_graph_rag.py diff --git a/test/agentchat/contrib/graph_rag/test_falkor_graph_rag.py b/test/agentchat/contrib/graph_rag/test_falkor_graph_rag.py new file mode 100644 index 0000000000..0e23414b43 --- /dev/null +++ b/test/agentchat/contrib/graph_rag/test_falkor_graph_rag.py @@ -0,0 +1,66 @@ +# Copyright (c) 2023 - 2024, Owners of https://github.com/ag2ai +# +# SPDX-License-Identifier: Apache-2.0 +# +# Portions derived from https://github.com/microsoft/autogen are under the MIT License. +# SPDX-License-Identifier: MIT +import sys + +import pytest +from conftest import reason, skip_openai # noqa: E402 +from graphrag_sdk import Attribute, AttributeType, Entity, Ontology, Relation + +try: + from autogen.agentchat.contrib.graph_rag.document import Document, DocumentType + from autogen.agentchat.contrib.graph_rag.falkor_graph_query_engine import ( + FalkorGraphQueryEngine, + GraphStoreQueryResult, + ) +except ImportError: + skip = True +else: + skip = False + +reason = "do not run on MacOS or windows OR dependency is not installed OR " + reason + + +@pytest.mark.skipif( + sys.platform in ["darwin", "win32"] or skip or skip_openai, + reason=reason, +) +def test_falkor_db_query_engine(): + """ + Test FalkorDB Query Engine. + 1. create a test FalkorDB Query Engine with a schema. + 2. Initialize it with an input txt file. + 3. Query it with a question and verify the result contains the critical information. + """ + # Arrange + movie_ontology = Ontology() + movie_ontology.add_entity( + Entity(label="Actor", attributes=[Attribute(name="name", attr_type=AttributeType.STRING, unique=True)]) + ) + movie_ontology.add_entity( + Entity(label="Movie", attributes=[Attribute(name="title", attr_type=AttributeType.STRING, unique=True)]) + ) + movie_ontology.add_relation(Relation(label="ACTED", source="Actor", target="Movie")) + + query_engine = FalkorGraphQueryEngine( + name="IMDB", + # host="192.168.0.115", # Change + # port=6379, # if needed + ontology=movie_ontology, + ) + + source_file = "test/agentchat/contrib/graph_rag/the_matrix.txt" + input_docs = [Document(doctype=DocumentType.TEXT, path_or_url=source_file)] + + question = "Name a few actors who've played in 'The Matrix'" + + # Act + query_engine.init_db(input_doc=input_docs) + + query_result: GraphStoreQueryResult = query_engine.query(question=question) + + # Assert + assert query_result.answer.find("Keanu Reeves") >= 0 From ace3127c42028fda319b71ef0f5bc306482ad55c Mon Sep 17 00:00:00 2001 From: simplaj Date: Sat, 7 Dec 2024 01:19:45 +0800 Subject: [PATCH 05/10] fix base_url not work in groq --- autogen/oai/groq.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/autogen/oai/groq.py b/autogen/oai/groq.py index ea560e7ea0..e3112619fa 100644 --- a/autogen/oai/groq.py +++ b/autogen/oai/groq.py @@ -68,6 +68,7 @@ def __init__(self, **kwargs): if "response_format" in kwargs and kwargs["response_format"] is not None: warnings.warn("response_format is not supported for Groq API, it will be ignored.", UserWarning) + self.base_url = kwargs.get("base_url", None) def message_retrieval(self, response) -> List: """ @@ -149,7 +150,7 @@ def create(self, params: Dict) -> ChatCompletion: groq_params["messages"] = groq_messages # We use chat model by default, and set max_retries to 5 (in line with typical retries loop) - client = Groq(api_key=self.api_key, max_retries=5) + client = Groq(api_key=self.api_key, max_retries=5, base_url=self.base_url) # Token counts will be returned prompt_tokens = 0 From 7b3736972c65f6bc9ca13e2442ec91457cb7cd21 Mon Sep 17 00:00:00 2001 From: Mark Sze <66362098+marklysze@users.noreply.github.com> Date: Wed, 11 Dec 2024 09:20:47 +1100 Subject: [PATCH 06/10] Setup.py > underscores to hyphens fix --- setup.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/setup.py b/setup.py index a5a71db02a..ee4db82ca8 100644 --- a/setup.py +++ b/setup.py @@ -93,7 +93,7 @@ "retrievechat-pgvector": retrieve_chat_pgvector, "retrievechat-mongodb": [*retrieve_chat, "pymongo>=4.0.0"], "retrievechat-qdrant": [*retrieve_chat, "qdrant_client", "fastembed>=0.3.1"], - "graph_rag_falkor_db": graph_rag_falkor_db, + "graph-rag-falkor-db": graph_rag_falkor_db, "autobuild": autobuild, "captainagent": autobuild + ["pandas"], "teachable": ["chromadb"], From c31b375fc0b3cde9cc9c66a22fa5cd71413f7a27 Mon Sep 17 00:00:00 2001 From: Mark Sze <66362098+marklysze@users.noreply.github.com> Date: Wed, 11 Dec 2024 10:43:20 +1100 Subject: [PATCH 07/10] Update setup.py Added comment for future editors --- setup.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/setup.py b/setup.py index ee4db82ca8..fce7ff0afe 100644 --- a/setup.py +++ b/setup.py @@ -76,6 +76,9 @@ # pysqlite3-binary used so it doesn't need to compile pysqlite3 autobuild = ["chromadb", "sentence-transformers", "huggingface-hub", "pysqlite3-binary"] +# NOTE: underscores in pip install, e.g. pip install ag2[graph_rag_falkor_db], will automatically +# convert to hyphens. So, do not include underscores in the name of extras. + extra_require = { "test": [ "ipykernel", From 96801fca459ed95b694b7ee05d674f407e2eda58 Mon Sep 17 00:00:00 2001 From: Mark Sze <66362098+marklysze@users.noreply.github.com> Date: Wed, 11 Dec 2024 12:26:56 +1100 Subject: [PATCH 08/10] Update agentchat_swarm_graphrag_trip_planner.ipynb --- notebook/agentchat_swarm_graphrag_trip_planner.ipynb | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/notebook/agentchat_swarm_graphrag_trip_planner.ipynb b/notebook/agentchat_swarm_graphrag_trip_planner.ipynb index 13a2763028..26a400e2f6 100644 --- a/notebook/agentchat_swarm_graphrag_trip_planner.ipynb +++ b/notebook/agentchat_swarm_graphrag_trip_planner.ipynb @@ -25,7 +25,7 @@ "FalkorDB's GraphRAG-SDK is a dependency for this notebook, which can be installed with ag2 via pip:\n", "\n", "```bash\n", - "pip install ag2[graph_rag_falkor_db]\n", + "pip install ag2[graph-rag-falkor-db]\n", "```\n", "\n", "For more information, please refer to the [installation guide](/docs/installation/).\n", From 5885889968cc64c75e9e4bbcafe4f67ca7c39f85 Mon Sep 17 00:00:00 2001 From: Mark Sze <66362098+marklysze@users.noreply.github.com> Date: Wed, 11 Dec 2024 12:27:39 +1100 Subject: [PATCH 09/10] Update contrib-graph-rag-tests.yml --- .github/workflows/contrib-graph-rag-tests.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/contrib-graph-rag-tests.yml b/.github/workflows/contrib-graph-rag-tests.yml index d5b2a9ef6b..04bb67c568 100644 --- a/.github/workflows/contrib-graph-rag-tests.yml +++ b/.github/workflows/contrib-graph-rag-tests.yml @@ -45,7 +45,7 @@ jobs: pip install pytest - name: Install FalkorDB SDK when on linux run: | - pip install -e .[graph_rag_falkor_db] + pip install -e .[graph-rag-falkor-db] - name: Set AUTOGEN_USE_DOCKER based on OS shell: bash run: | From 528aa3962acafd6b673c5e5278b85683d527b268 Mon Sep 17 00:00:00 2001 From: Mark Sze <66362098+marklysze@users.noreply.github.com> Date: Wed, 11 Dec 2024 12:28:36 +1100 Subject: [PATCH 10/10] Update agentchat_graph_rag_falkordb.ipynb --- notebook/agentchat_graph_rag_falkordb.ipynb | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/notebook/agentchat_graph_rag_falkordb.ipynb b/notebook/agentchat_graph_rag_falkordb.ipynb index b1802dfe18..4697da6a9a 100644 --- a/notebook/agentchat_graph_rag_falkordb.ipynb +++ b/notebook/agentchat_graph_rag_falkordb.ipynb @@ -13,7 +13,7 @@ "FalkorDB's GraphRAG-SDK is a dependency for this notebook, which can be installed with ag2 via pip:\n", "\n", "```bash\n", - "pip install ag2[graph_rag_falkor_db]\n", + "pip install ag2[graph-rag-falkor-db]\n", "```\n", "\n", "or if you have already installed ag2/autogen/pyautogen\n",