google-adk 0.5.0__py3-none-any.whl → 1.0.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- google/adk/agents/base_agent.py +76 -30
- google/adk/agents/base_agent.py.orig +330 -0
- google/adk/agents/callback_context.py +0 -5
- google/adk/agents/llm_agent.py +122 -30
- google/adk/agents/loop_agent.py +1 -1
- google/adk/agents/parallel_agent.py +7 -0
- google/adk/agents/readonly_context.py +7 -1
- google/adk/agents/run_config.py +1 -1
- google/adk/agents/sequential_agent.py +31 -0
- google/adk/agents/transcription_entry.py +4 -2
- google/adk/artifacts/gcs_artifact_service.py +1 -1
- google/adk/artifacts/in_memory_artifact_service.py +1 -1
- google/adk/auth/auth_credential.py +6 -1
- google/adk/auth/auth_preprocessor.py +7 -1
- google/adk/auth/auth_tool.py +3 -4
- google/adk/cli/agent_graph.py +5 -5
- google/adk/cli/browser/index.html +2 -2
- google/adk/cli/browser/{main-ULN5R5I5.js → main-QOEMUXM4.js} +44 -45
- google/adk/cli/cli.py +7 -7
- google/adk/cli/cli_deploy.py +7 -2
- google/adk/cli/cli_eval.py +172 -99
- google/adk/cli/cli_tools_click.py +147 -64
- google/adk/cli/fast_api.py +330 -148
- google/adk/cli/fast_api.py.orig +174 -80
- google/adk/cli/utils/common.py +23 -0
- google/adk/cli/utils/evals.py +83 -1
- google/adk/cli/utils/logs.py +13 -5
- google/adk/code_executors/__init__.py +3 -1
- google/adk/code_executors/built_in_code_executor.py +52 -0
- google/adk/evaluation/__init__.py +1 -1
- google/adk/evaluation/agent_evaluator.py +168 -128
- google/adk/evaluation/eval_case.py +102 -0
- google/adk/evaluation/eval_set.py +37 -0
- google/adk/evaluation/eval_sets_manager.py +42 -0
- google/adk/evaluation/evaluation_generator.py +88 -113
- google/adk/evaluation/evaluator.py +56 -0
- google/adk/evaluation/local_eval_sets_manager.py +264 -0
- google/adk/evaluation/response_evaluator.py +106 -2
- google/adk/evaluation/trajectory_evaluator.py +83 -2
- google/adk/events/event.py +6 -1
- google/adk/events/event_actions.py +6 -1
- google/adk/examples/example_util.py +3 -2
- google/adk/flows/llm_flows/_code_execution.py +9 -1
- google/adk/flows/llm_flows/audio_transcriber.py +4 -3
- google/adk/flows/llm_flows/base_llm_flow.py +54 -15
- google/adk/flows/llm_flows/functions.py +9 -8
- google/adk/flows/llm_flows/instructions.py +13 -5
- google/adk/flows/llm_flows/single_flow.py +1 -1
- google/adk/memory/__init__.py +1 -1
- google/adk/memory/_utils.py +23 -0
- google/adk/memory/base_memory_service.py +23 -21
- google/adk/memory/base_memory_service.py.orig +76 -0
- google/adk/memory/in_memory_memory_service.py +57 -25
- google/adk/memory/memory_entry.py +37 -0
- google/adk/memory/vertex_ai_rag_memory_service.py +38 -15
- google/adk/models/anthropic_llm.py +16 -9
- google/adk/models/gemini_llm_connection.py +11 -11
- google/adk/models/google_llm.py +9 -2
- google/adk/models/google_llm.py.orig +305 -0
- google/adk/models/lite_llm.py +77 -21
- google/adk/models/llm_response.py +14 -2
- google/adk/models/registry.py +1 -1
- google/adk/runners.py +65 -41
- google/adk/sessions/__init__.py +1 -1
- google/adk/sessions/base_session_service.py +6 -33
- google/adk/sessions/database_session_service.py +58 -65
- google/adk/sessions/in_memory_session_service.py +106 -24
- google/adk/sessions/session.py +3 -0
- google/adk/sessions/vertex_ai_session_service.py +23 -45
- google/adk/telemetry.py +3 -0
- google/adk/tools/__init__.py +4 -7
- google/adk/tools/{built_in_code_execution_tool.py → _built_in_code_execution_tool.py} +11 -0
- google/adk/tools/_memory_entry_utils.py +30 -0
- google/adk/tools/agent_tool.py +9 -9
- google/adk/tools/apihub_tool/apihub_toolset.py +55 -74
- google/adk/tools/application_integration_tool/application_integration_toolset.py +107 -85
- google/adk/tools/application_integration_tool/clients/connections_client.py +20 -0
- google/adk/tools/application_integration_tool/clients/integration_client.py +6 -6
- google/adk/tools/application_integration_tool/integration_connector_tool.py +69 -26
- google/adk/tools/base_toolset.py +58 -0
- google/adk/tools/enterprise_search_tool.py +65 -0
- google/adk/tools/function_parameter_parse_util.py +2 -2
- google/adk/tools/google_api_tool/__init__.py +18 -70
- google/adk/tools/google_api_tool/google_api_tool.py +11 -5
- google/adk/tools/google_api_tool/google_api_toolset.py +126 -0
- google/adk/tools/google_api_tool/google_api_toolsets.py +102 -0
- google/adk/tools/google_api_tool/googleapi_to_openapi_converter.py +40 -42
- google/adk/tools/langchain_tool.py +96 -49
- google/adk/tools/load_memory_tool.py +14 -5
- google/adk/tools/mcp_tool/__init__.py +3 -2
- google/adk/tools/mcp_tool/mcp_session_manager.py +153 -16
- google/adk/tools/mcp_tool/mcp_session_manager.py.orig +322 -0
- google/adk/tools/mcp_tool/mcp_tool.py +12 -12
- google/adk/tools/mcp_tool/mcp_toolset.py +155 -195
- google/adk/tools/openapi_tool/openapi_spec_parser/openapi_toolset.py +32 -7
- google/adk/tools/openapi_tool/openapi_spec_parser/operation_parser.py +31 -31
- google/adk/tools/openapi_tool/openapi_spec_parser/tool_auth_handler.py +1 -1
- google/adk/tools/preload_memory_tool.py +27 -18
- google/adk/tools/retrieval/__init__.py +1 -1
- google/adk/tools/retrieval/vertex_ai_rag_retrieval.py +1 -1
- google/adk/tools/toolbox_toolset.py +79 -0
- google/adk/tools/transfer_to_agent_tool.py +0 -1
- google/adk/version.py +1 -1
- {google_adk-0.5.0.dist-info → google_adk-1.0.0.dist-info}/METADATA +7 -5
- google_adk-1.0.0.dist-info/RECORD +195 -0
- google/adk/agents/remote_agent.py +0 -50
- google/adk/tools/google_api_tool/google_api_tool_set.py +0 -110
- google/adk/tools/google_api_tool/google_api_tool_sets.py +0 -112
- google/adk/tools/toolbox_tool.py +0 -46
- google_adk-0.5.0.dist-info/RECORD +0 -180
- {google_adk-0.5.0.dist-info → google_adk-1.0.0.dist-info}/WHEEL +0 -0
- {google_adk-0.5.0.dist-info → google_adk-1.0.0.dist-info}/entry_points.txt +0 -0
- {google_adk-0.5.0.dist-info → google_adk-1.0.0.dist-info}/licenses/LICENSE +0 -0
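Several modules are renamed or removed between the two wheels (for example, toolbox_tool.py is superseded by toolbox_toolset.py, google_api_tool_set.py and google_api_tool_sets.py by google_api_toolset.py and google_api_toolsets.py, and built_in_code_execution_tool.py becomes the private _built_in_code_execution_tool.py), so imports that target the old module paths stop resolving after an upgrade. The snippet below is a hypothetical helper, not part of either wheel; it only uses module paths taken from the listing above to report which side of each rename is importable in the current environment.

# Hypothetical upgrade check (not shipped with google-adk): reports which of
# the renamed module paths from the listing above resolve in the installed
# environment. Requires google-adk to be installed; the public symbols inside
# the new modules may differ from the old ones, so this only checks presence.
import importlib.util

RENAMED_MODULES = {
    "google.adk.tools.toolbox_tool": "google.adk.tools.toolbox_toolset",
    "google.adk.tools.google_api_tool.google_api_tool_set": (
        "google.adk.tools.google_api_tool.google_api_toolset"
    ),
    "google.adk.tools.built_in_code_execution_tool": (
        "google.adk.tools._built_in_code_execution_tool"
    ),
}

for old, new in RENAMED_MODULES.items():
  old_state = "present" if importlib.util.find_spec(old) else "missing"
  new_state = "present" if importlib.util.find_spec(new) else "missing"
  print(f"{old}: {old_state} -> {new}: {new_state}")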
google/adk/models/google_llm.py.orig
ADDED
@@ -0,0 +1,305 @@
+# Copyright 2025 Google LLC
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from __future__ import annotations
+
+import contextlib
+from functools import cached_property
+import logging
+import sys
+from typing import AsyncGenerator
+from typing import cast
+from typing import TYPE_CHECKING
+
+from google.genai import Client
+from google.genai import types
+from typing_extensions import override
+
+from .. import version
+from .base_llm import BaseLlm
+from .base_llm_connection import BaseLlmConnection
+from .gemini_llm_connection import GeminiLlmConnection
+from .llm_response import LlmResponse
+
+if TYPE_CHECKING:
+  from .llm_request import LlmRequest
+
+logger = None
+
+_NEW_LINE = '\n'
+_EXCLUDED_PART_FIELD = {'inline_data': {'data'}}
+
+
+class Gemini(BaseLlm):
+  """Integration for Gemini models.
+
+  Attributes:
+    model: The name of the Gemini model.
+  """
+
+  model: str = 'gemini-1.5-flash'
+
+  @staticmethod
+  @override
+  def supported_models() -> list[str]:
+    """Provides the list of supported models.
+
+    Returns:
+      A list of supported models.
+    """
+
+    return [
+        r'gemini-.*',
+        # fine-tuned vertex endpoint pattern
+        r'projects\/.+\/locations\/.+\/endpoints\/.+',
+        # vertex gemini long name
+        r'projects\/.+\/locations\/.+\/publishers\/google\/models\/gemini.+',
+    ]
+
+  async def generate_content_async(
+      self, llm_request: LlmRequest, stream: bool = False
+  ) -> AsyncGenerator[LlmResponse, None]:
+    """Sends a request to the Gemini model.
+
+    Args:
+      llm_request: LlmRequest, the request to send to the Gemini model.
+      stream: bool = False, whether to do streaming call.
+
+    Yields:
+      LlmResponse: The model response.
+    """
+
+    self._maybe_append_user_content(llm_request)
+
+    global logger
+    if not logger:
+      logger = logging.getLogger(__name__)
+
+    logger.info(
+        'Sending out request, model: %s, backend: %s, stream: %s',
+        llm_request.model,
+        self._api_backend,
+        stream,
+    )
+    logger.info(_build_request_log(llm_request))
+
+    print('********* Jack --> ')
+    for hh in logging.root.handlers:
+      print(hh, hh.level)
+    for hh in logger.handlers:
+      print(hh, hh.level)
+    print('********* Jack <-- ')
+
+    if stream:
+      responses = await self.api_client.aio.models.generate_content_stream(
+          model=llm_request.model,
+          contents=llm_request.contents,
+          config=llm_request.config,
+      )
+      response = None
+      text = ''
+      # for sse, similar as bidi (see receive method in gemini_llm_connecton.py),
+      # we need to mark those text content as partial and after all partial
+      # contents are sent, we send an accumulated event which contains all the
+      # previous partial content. The only difference is bidi rely on
+      # complete_turn flag to detect end while sse depends on finish_reason.
+      async for response in responses:
+        logger.info(_build_response_log(response))
+        llm_response = LlmResponse.create(response)
+        if (
+            llm_response.content
+            and llm_response.content.parts
+            and llm_response.content.parts[0].text
+        ):
+          text += llm_response.content.parts[0].text
+          llm_response.partial = True
+        elif text and (
+            not llm_response.content
+            or not llm_response.content.parts
+            # don't yield the merged text event when receiving audio data
+            or not llm_response.content.parts[0].inline_data
+        ):
+          yield LlmResponse(
+              content=types.ModelContent(
+                  parts=[types.Part.from_text(text=text)],
+              ),
+              usage_metadata=llm_response.usage_metadata,
+          )
+          text = ''
+        yield llm_response
+      if (
+          text
+          and response
+          and response.candidates
+          and response.candidates[0].finish_reason == types.FinishReason.STOP
+      ):
+        yield LlmResponse(
+            content=types.ModelContent(
+                parts=[types.Part.from_text(text=text)],
+            ),
+        )
+
+    else:
+      response = await self.api_client.aio.models.generate_content(
+          model=llm_request.model,
+          contents=llm_request.contents,
+          config=llm_request.config,
+      )
+      logger.info(_build_response_log(response))
+      yield LlmResponse.create(response)
+
+  @cached_property
+  def api_client(self) -> Client:
+    """Provides the api client.
+
+    Returns:
+      The api client.
+    """
+    return Client(
+        http_options=types.HttpOptions(headers=self._tracking_headers)
+    )
+
+  @cached_property
+  def _api_backend(self) -> str:
+    return 'vertex' if self.api_client.vertexai else 'ml_dev'
+
+  @cached_property
+  def _tracking_headers(self) -> dict[str, str]:
+    framework_label = f'google-adk/{version.__version__}'
+    language_label = 'gl-python/' + sys.version.split()[0]
+    version_header_value = f'{framework_label} {language_label}'
+    tracking_headers = {
+        'x-goog-api-client': version_header_value,
+        'user-agent': version_header_value,
+    }
+    return tracking_headers
+
+  @cached_property
+  def _live_api_client(self) -> Client:
+    if self._api_backend == 'vertex':
+      # use beta version for vertex api
+      api_version = 'v1beta1'
+      # use default api version for vertex
+      return Client(
+          http_options=types.HttpOptions(
+              headers=self._tracking_headers, api_version=api_version
+          )
+      )
+    else:
+      # use v1alpha for ml_dev
+      api_version = 'v1alpha'
+      return Client(
+          http_options=types.HttpOptions(
+              headers=self._tracking_headers, api_version=api_version
+          )
+      )
+
+  @contextlib.asynccontextmanager
+  async def connect(self, llm_request: LlmRequest) -> BaseLlmConnection:
+    """Connects to the Gemini model and returns an llm connection.
+
+    Args:
+      llm_request: LlmRequest, the request to send to the Gemini model.
+
+    Yields:
+      BaseLlmConnection, the connection to the Gemini model.
+    """
+
+    llm_request.live_connect_config.system_instruction = types.Content(
+        role='system',
+        parts=[
+            types.Part.from_text(text=llm_request.config.system_instruction)
+        ],
+    )
+    llm_request.live_connect_config.tools = llm_request.config.tools
+    async with self._live_api_client.aio.live.connect(
+        model=llm_request.model, config=llm_request.live_connect_config
+    ) as live_session:
+      yield GeminiLlmConnection(live_session)
+
+
+def _build_function_declaration_log(
+    func_decl: types.FunctionDeclaration,
+) -> str:
+  param_str = '{}'
+  if func_decl.parameters and func_decl.parameters.properties:
+    param_str = str({
+        k: v.model_dump(exclude_none=True)
+        for k, v in func_decl.parameters.properties.items()
+    })
+  return_str = 'None'
+  if func_decl.response:
+    return_str = str(func_decl.response.model_dump(exclude_none=True))
+  return f'{func_decl.name}: {param_str} -> {return_str}'
+
+
+def _build_request_log(req: LlmRequest) -> str:
+  function_decls: list[types.FunctionDeclaration] = cast(
+      list[types.FunctionDeclaration],
+      req.config.tools[0].function_declarations if req.config.tools else [],
+  )
+  function_logs = (
+      [
+          _build_function_declaration_log(func_decl)
+          for func_decl in function_decls
+      ]
+      if function_decls
+      else []
+  )
+  contents_logs = [
+      content.model_dump_json(
+          exclude_none=True,
+          exclude={
+              'parts': {
+                  i: _EXCLUDED_PART_FIELD for i in range(len(content.parts))
+              }
+          },
+      )
+      for content in req.contents
+  ]
+
+  return f"""
+LLM Request:
+-----------------------------------------------------------
+System Instruction:
+{req.config.system_instruction}
+-----------------------------------------------------------
+Contents:
+{_NEW_LINE.join(contents_logs)}
+-----------------------------------------------------------
+Functions:
+{_NEW_LINE.join(function_logs)}
+-----------------------------------------------------------
+"""
+
+
+def _build_response_log(resp: types.GenerateContentResponse) -> str:
+  function_calls_text = []
+  if function_calls := resp.function_calls:
+    for func_call in function_calls:
+      function_calls_text.append(
+          f'name: {func_call.name}, args: {func_call.args}'
+      )
+  return f"""
+LLM Response:
+-----------------------------------------------------------
+Text:
+{resp.text}
+-----------------------------------------------------------
+Function calls:
+{_NEW_LINE.join(function_calls_text)}
+-----------------------------------------------------------
+Raw response:
+{resp.model_dump_json(exclude_none=True)}
+-----------------------------------------------------------
+"""
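The comment in the streaming branch of generate_content_async above describes the SSE aggregation scheme: each text chunk is surfaced immediately as a partial LlmResponse, and once the stream reports a STOP finish reason a merged response carrying the accumulated text is emitted. A minimal standalone sketch of that accumulate-then-flush pattern (illustrative only, not ADK code) follows.

# Standalone sketch of the accumulate-then-flush pattern described above
# (not ADK code): partial text chunks are surfaced as they arrive, and one
# merged event is emitted once the stream signals completion.
import asyncio
from dataclasses import dataclass


@dataclass
class Chunk:
  text: str
  done: bool = False  # stands in for finish_reason == STOP in the real flow


async def fake_stream():
  for piece in ("Hel", "lo, ", "world"):
    yield Chunk(text=piece)
  yield Chunk(text="", done=True)


async def main():
  accumulated = ""
  async for chunk in fake_stream():
    if chunk.text:
      accumulated += chunk.text
      print("partial:", chunk.text)      # analogous to LlmResponse(partial=True)
    if chunk.done and accumulated:
      print("aggregated:", accumulated)  # analogous to the merged LlmResponse
      accumulated = ""


asyncio.run(main())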
google/adk/models/lite_llm.py
CHANGED
@@ -51,7 +51,7 @@ from .base_llm import BaseLlm
 from .llm_request import LlmRequest
 from .llm_response import LlmResponse

-logger = logging.getLogger(__name__)
+logger = logging.getLogger("google_adk." + __name__)

 _NEW_LINE = "\n"
 _EXCLUDED_PART_FIELD = {"inline_data": {"data"}}
@@ -67,6 +67,12 @@ class TextChunk(BaseModel):
   text: str


+class UsageMetadataChunk(BaseModel):
+  prompt_tokens: int
+  completion_tokens: int
+  total_tokens: int
+
+
 class LiteLLMClient:
   """Provides acompletion method (for better testability)."""

@@ -344,15 +350,20 @@ def _function_declaration_to_tool_param(
 def _model_response_to_chunk(
     response: ModelResponse,
 ) -> Generator[
-    Tuple[
+    Tuple[
+        Optional[Union[TextChunk, FunctionChunk, UsageMetadataChunk]],
+        Optional[str],
+    ],
+    None,
+    None,
 ]:
-  """Converts a litellm message to text or
+  """Converts a litellm message to text, function or usage metadata chunk.

   Args:
     response: The response from the model.

   Yields:
-    A tuple of text or function chunk and finish reason.
+    A tuple of text or function or usage metadata chunk and finish reason.
   """

   message = None
@@ -384,11 +395,21 @@ def _model_response_to_chunk(
   if not message:
     yield None, None

+  # Ideally usage would be expected with the last ModelResponseStream with a
+  # finish_reason set. But this is not the case we are observing from litellm.
+  # So we are sending it as a separate chunk to be set on the llm_response.
+  if response.get("usage", None):
+    yield UsageMetadataChunk(
+        prompt_tokens=response["usage"].get("prompt_tokens", 0),
+        completion_tokens=response["usage"].get("completion_tokens", 0),
+        total_tokens=response["usage"].get("total_tokens", 0),
+    ), None
+

 def _model_response_to_generate_content_response(
     response: ModelResponse,
 ) -> LlmResponse:
-  """Converts a litellm response to LlmResponse.
+  """Converts a litellm response to LlmResponse. Also adds usage metadata.

   Args:
     response: The model response.
@@ -403,7 +424,15 @@ def _model_response_to_generate_content_response(

   if not message:
     raise ValueError("No message in response")
-
+
+  llm_response = _message_to_generate_content_response(message)
+  if response.get("usage", None):
+    llm_response.usage_metadata = types.GenerateContentResponseUsageMetadata(
+        prompt_token_count=response["usage"].get("prompt_tokens", 0),
+        candidates_token_count=response["usage"].get("completion_tokens", 0),
+        total_token_count=response["usage"].get("total_tokens", 0),
+    )
+  return llm_response


 def _message_to_generate_content_response(
@@ -628,6 +657,10 @@ class LiteLlm(BaseLlm):
       function_args = ""
       function_id = None
       completion_args["stream"] = True
+      aggregated_llm_response = None
+      aggregated_llm_response_with_tool_call = None
+      usage_metadata = None
+
      for part in self.llm_client.completion(**completion_args):
        for chunk, finish_reason in _model_response_to_chunk(part):
          if isinstance(chunk, FunctionChunk):
@@ -645,32 +678,55 @@ class LiteLlm(BaseLlm):
                 ),
                 is_partial=True,
             )
+          elif isinstance(chunk, UsageMetadataChunk):
+            usage_metadata = types.GenerateContentResponseUsageMetadata(
+                prompt_token_count=chunk.prompt_tokens,
+                candidates_token_count=chunk.completion_tokens,
+                total_token_count=chunk.total_tokens,
+            )
+
           if finish_reason == "tool_calls" and function_id:
-
-
-
-
-
-
-
-
-
-
-
-
-
-
+            aggregated_llm_response_with_tool_call = (
+                _message_to_generate_content_response(
+                    ChatCompletionAssistantMessage(
+                        role="assistant",
+                        content="",
+                        tool_calls=[
+                            ChatCompletionMessageToolCall(
+                                type="function",
+                                id=function_id,
+                                function=Function(
+                                    name=function_name,
+                                    arguments=function_args,
+                                ),
+                            )
+                        ],
+                    )
                 )
             )
             function_name = ""
             function_args = ""
             function_id = None
           elif finish_reason == "stop" and text:
-
+            aggregated_llm_response = _message_to_generate_content_response(
                 ChatCompletionAssistantMessage(role="assistant", content=text)
             )
             text = ""

+      # waiting until streaming ends to yield the llm_response as litellm tends
+      # to send chunk that contains usage_metadata after the chunk with
+      # finish_reason set to tool_calls or stop.
+      if aggregated_llm_response:
+        if usage_metadata:
+          aggregated_llm_response.usage_metadata = usage_metadata
+          usage_metadata = None
+        yield aggregated_llm_response
+
+      if aggregated_llm_response_with_tool_call:
+        if usage_metadata:
+          aggregated_llm_response_with_tool_call.usage_metadata = usage_metadata
+        yield aggregated_llm_response_with_tool_call
+
     else:
       response = await self.llm_client.acompletion(**completion_args)
       yield _model_response_to_generate_content_response(response)
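The lite_llm.py changes above introduce UsageMetadataChunk to carry litellm's token counts and translate them into google.genai's GenerateContentResponseUsageMetadata, mapping prompt_tokens to prompt_token_count and completion_tokens to candidates_token_count. A small sketch of that mapping, assuming the google-genai package is installed:

# Sketch of the field mapping the diff above introduces (assumes google-genai
# is installed); litellm-style usage counts are carried in UsageMetadataChunk
# and translated to genai's usage metadata type. Values are made up.
from google.genai import types
from pydantic import BaseModel


class UsageMetadataChunk(BaseModel):  # mirrors the class added in lite_llm.py
  prompt_tokens: int
  completion_tokens: int
  total_tokens: int


chunk = UsageMetadataChunk(prompt_tokens=12, completion_tokens=34, total_tokens=46)
usage = types.GenerateContentResponseUsageMetadata(
    prompt_token_count=chunk.prompt_tokens,          # litellm "prompt_tokens"
    candidates_token_count=chunk.completion_tokens,  # litellm "completion_tokens"
    total_token_count=chunk.total_tokens,
)
print(usage.total_token_count)  # 46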
google/adk/models/llm_response.py
CHANGED
@@ -17,6 +17,7 @@ from __future__ import annotations
 from typing import Any, Optional

 from google.genai import types
+from pydantic import alias_generators
 from pydantic import BaseModel
 from pydantic import ConfigDict

@@ -40,7 +41,11 @@ class LlmResponse(BaseModel):
     custom_metadata: The custom metadata of the LlmResponse.
   """

-  model_config = ConfigDict(
+  model_config = ConfigDict(
+      extra='forbid',
+      alias_generator=alias_generators.to_camel,
+      populate_by_name=True,
+  )
   """The pydantic model config."""

   content: Optional[types.Content] = None
@@ -80,6 +85,9 @@ class LlmResponse(BaseModel):
   NOTE: the entire dict must be JSON serializable.
   """

+  usage_metadata: Optional[types.GenerateContentResponseUsageMetadata] = None
+  """The usage metadata of the LlmResponse"""
+
   @staticmethod
   def create(
       generate_content_response: types.GenerateContentResponse,
@@ -93,18 +101,20 @@ class LlmResponse(BaseModel):
     Returns:
       The LlmResponse.
     """
-
+    usage_metadata = generate_content_response.usage_metadata
     if generate_content_response.candidates:
       candidate = generate_content_response.candidates[0]
       if candidate.content and candidate.content.parts:
         return LlmResponse(
             content=candidate.content,
             grounding_metadata=candidate.grounding_metadata,
+            usage_metadata=usage_metadata,
         )
       else:
         return LlmResponse(
             error_code=candidate.finish_reason,
             error_message=candidate.finish_message,
+            usage_metadata=usage_metadata,
         )
     else:
       if generate_content_response.prompt_feedback:
@@ -112,9 +122,11 @@ class LlmResponse(BaseModel):
         return LlmResponse(
             error_code=prompt_feedback.block_reason,
             error_message=prompt_feedback.block_reason_message,
+            usage_metadata=usage_metadata,
         )
       else:
         return LlmResponse(
             error_code='UNKNOWN_ERROR',
             error_message='Unknown error.',
+            usage_metadata=usage_metadata,
         )
google/adk/models/registry.py
CHANGED