google-genai 1.7.0__py3-none-any.whl → 1.53.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- google/genai/__init__.py +4 -2
- google/genai/_adapters.py +55 -0
- google/genai/_api_client.py +1301 -299
- google/genai/_api_module.py +1 -1
- google/genai/_automatic_function_calling_util.py +54 -33
- google/genai/_base_transformers.py +26 -0
- google/genai/_base_url.py +50 -0
- google/genai/_common.py +560 -59
- google/genai/_extra_utils.py +371 -38
- google/genai/_live_converters.py +1467 -0
- google/genai/_local_tokenizer_loader.py +214 -0
- google/genai/_mcp_utils.py +117 -0
- google/genai/_operations_converters.py +394 -0
- google/genai/_replay_api_client.py +204 -92
- google/genai/_test_api_client.py +1 -1
- google/genai/_tokens_converters.py +520 -0
- google/genai/_transformers.py +633 -233
- google/genai/batches.py +1733 -538
- google/genai/caches.py +678 -1012
- google/genai/chats.py +48 -38
- google/genai/client.py +142 -15
- google/genai/documents.py +532 -0
- google/genai/errors.py +141 -35
- google/genai/file_search_stores.py +1296 -0
- google/genai/files.py +312 -744
- google/genai/live.py +617 -367
- google/genai/live_music.py +197 -0
- google/genai/local_tokenizer.py +395 -0
- google/genai/models.py +3598 -3116
- google/genai/operations.py +201 -362
- google/genai/pagers.py +23 -7
- google/genai/py.typed +1 -0
- google/genai/tokens.py +362 -0
- google/genai/tunings.py +1274 -496
- google/genai/types.py +14535 -5454
- google/genai/version.py +2 -2
- {google_genai-1.7.0.dist-info → google_genai-1.53.0.dist-info}/METADATA +736 -234
- google_genai-1.53.0.dist-info/RECORD +41 -0
- {google_genai-1.7.0.dist-info → google_genai-1.53.0.dist-info}/WHEEL +1 -1
- google_genai-1.7.0.dist-info/RECORD +0 -27
- {google_genai-1.7.0.dist-info → google_genai-1.53.0.dist-info/licenses}/LICENSE +0 -0
- {google_genai-1.7.0.dist-info → google_genai-1.53.0.dist-info}/top_level.txt +0 -0
|
@@ -0,0 +1,197 @@
|
|
|
1
|
+
# Copyright 2025 Google LLC
|
|
2
|
+
#
|
|
3
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
4
|
+
# you may not use this file except in compliance with the License.
|
|
5
|
+
# You may obtain a copy of the License at
|
|
6
|
+
#
|
|
7
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
8
|
+
#
|
|
9
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
10
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
11
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
12
|
+
# See the License for the specific language governing permissions and
|
|
13
|
+
# limitations under the License.
|
|
14
|
+
#
|
|
15
|
+
|
|
16
|
+
"""[Experimental] Live Music API client."""
|
|
17
|
+
|
|
18
|
+
import contextlib
|
|
19
|
+
import json
|
|
20
|
+
import logging
|
|
21
|
+
from typing import AsyncIterator
|
|
22
|
+
|
|
23
|
+
from . import _api_module
|
|
24
|
+
from . import _common
|
|
25
|
+
from . import _live_converters as live_converters
|
|
26
|
+
from . import _transformers as t
|
|
27
|
+
from . import types
|
|
28
|
+
from ._api_client import BaseApiClient
|
|
29
|
+
from ._common import set_value_by_path as setv
|
|
30
|
+
|
|
31
|
+
|
|
32
|
+
try:
|
|
33
|
+
from websockets.asyncio.client import ClientConnection
|
|
34
|
+
from websockets.asyncio.client import connect
|
|
35
|
+
except ModuleNotFoundError:
|
|
36
|
+
from websockets.client import ClientConnection # type: ignore
|
|
37
|
+
from websockets.client import connect # type: ignore
|
|
38
|
+
|
|
39
|
+
logger = logging.getLogger('google_genai.live_music')
|
|
40
|
+
|
|
41
|
+
|
|
42
|
+
class AsyncMusicSession:
  """[Experimental] AsyncMusicSession.

  Thin wrapper around an already-established websocket connection to the
  live music service. The API client is only consulted for its ``vertexai``
  flag; all traffic goes over the websocket.
  """

  def __init__(self, api_client: BaseApiClient, websocket: ClientConnection):
    self._api_client = api_client
    self._ws = websocket

  async def set_weighted_prompts(
      self, prompts: list[types.WeightedPrompt]
  ) -> None:
    """Sends the given weighted prompts to the server as client content."""
    if self._api_client.vertexai:
      raise NotImplementedError(
          'Live music generation is not supported in Vertex AI.'
      )
    else:
      # Serialize each prompt to a camelCase dict as expected by the wire API.
      client_content_dict = {
          'weightedPrompts': [
              _common.convert_to_dict(prompt, convert_keys=True)
              for prompt in prompts
          ]
      }

      await self._ws.send(json.dumps({'clientContent': client_content_dict}))

  async def set_music_generation_config(
      self, config: types.LiveMusicGenerationConfig
  ) -> None:
    """Sends a music generation config update to the server."""
    if self._api_client.vertexai:
      raise NotImplementedError(
          'Live music generation is not supported in Vertex AI.'
      )
    else:
      config_dict = _common.convert_to_dict(config, convert_keys=True)
      await self._ws.send(json.dumps({'musicGenerationConfig': config_dict}))

  async def _send_control_signal(
      self, playback_control: types.LiveMusicPlaybackControl
  ) -> None:
    """Sends a playback-control signal (play/pause/stop/reset) as JSON."""
    if self._api_client.vertexai:
      raise NotImplementedError(
          'Live music generation is not supported in Vertex AI.'
      )
    else:
      playback_control_dict = {'playbackControl': playback_control.value}
      await self._ws.send(json.dumps(playback_control_dict))

  async def play(self) -> None:
    """Sends playback signal to start the music stream."""
    return await self._send_control_signal(types.LiveMusicPlaybackControl.PLAY)

  async def pause(self) -> None:
    """Sends a playback signal to pause the music stream."""
    return await self._send_control_signal(types.LiveMusicPlaybackControl.PAUSE)

  async def stop(self) -> None:
    """Sends a playback signal to stop the music stream.

    Resets the music generation context while retaining the current config.
    """
    return await self._send_control_signal(types.LiveMusicPlaybackControl.STOP)

  async def reset_context(self) -> None:
    """Reset the context (prompts retained) without stopping the music generation."""
    return await self._send_control_signal(
        types.LiveMusicPlaybackControl.RESET_CONTEXT
    )

  async def receive(self) -> AsyncIterator[types.LiveMusicServerMessage]:
    """Receive model responses from the server.

    Yields:
      The audio chunks from the server.
    """
    # TODO(b/365983264) Handle intermittent issues for the user.
    # NOTE(review): pydantic models are truthy by default, so this loop is
    # expected to run until the connection closes/raises — confirm intended
    # termination behavior.
    while result := await self._receive():
      yield result

  async def _receive(self) -> types.LiveMusicServerMessage:
    """Reads one raw websocket frame and parses it into a server message."""
    parameter_model = types.LiveMusicServerMessage()
    try:
      # Newer websockets versions support decode=False to receive raw bytes;
      # older versions raise TypeError, so fall back to the legacy signature.
      raw_response = await self._ws.recv(decode=False)
    except TypeError:
      raw_response = await self._ws.recv()  # type: ignore[assignment]
    if raw_response:
      try:
        response = json.loads(raw_response)
      except json.decoder.JSONDecodeError:
        raise ValueError(f'Failed to parse response: {raw_response!r}')
    else:
      response = {}

    if self._api_client.vertexai:
      raise NotImplementedError('Live music generation is not supported in Vertex AI.')
    else:
      response_dict = response

    return types.LiveMusicServerMessage._from_response(
        response=response_dict, kwargs=parameter_model.model_dump()
    )

  async def close(self) -> None:
    """Closes the bi-directional stream and terminates the session."""
    await self._ws.close()
class AsyncLiveMusic(_api_module.BaseModule):
  """[Experimental] Live music module.

  Live music can be accessed via `client.aio.live.music`.
  """

  @_common.experimental_warning(
      'Realtime music generation is experimental and may change in future versions.'
  )
  @contextlib.asynccontextmanager
  async def connect(self, *, model: str) -> AsyncIterator[AsyncMusicSession]:
    """[Experimental] Connect to the live music server.

    Opens a websocket to the BidiGenerateMusic endpoint, sends the initial
    setup request, and yields an `AsyncMusicSession` bound to the open
    connection. Only the Gemini Developer API (API-key auth) is supported;
    Vertex AI raises NotImplementedError.
    """
    base_url = self._api_client._websocket_base_url()
    if isinstance(base_url, bytes):
      # Some client configurations return the base URL as bytes.
      base_url = base_url.decode('utf-8')
    transformed_model = t.t_model(self._api_client, model)

    if self._api_client.api_key:
      api_key = self._api_client.api_key
      version = self._api_client._http_options.api_version
      # NOTE(review): the API key is embedded in the URI query string and may
      # surface in logs of intermediaries — confirm this matches service docs.
      uri = f'{base_url}/ws/google.ai.generativelanguage.{version}.GenerativeService.BidiGenerateMusic?key={api_key}'
      headers = self._api_client._http_options.headers

      # Only mldev supported
      request_dict = _common.convert_to_dict(
          live_converters._LiveMusicConnectParameters_to_mldev(
              from_object=types.LiveMusicConnectParameters(
                  model=transformed_model,
              ).model_dump(exclude_none=True)
          )
      )

      # Force the transformed model name into the setup payload regardless of
      # what the converter produced.
      setv(request_dict, ['setup', 'model'], transformed_model)

      request = json.dumps(request_dict)
    else:
      raise NotImplementedError('Live music generation is not supported in Vertex AI.')

    try:
      # websockets >= 13 uses `additional_headers`; older releases raise
      # TypeError for that keyword, handled below.
      async with connect(uri, additional_headers=headers) as ws:
        await ws.send(request)
        # The first server frame acknowledges setup; log it for diagnostics.
        logger.info(await ws.recv(decode=False))

        yield AsyncMusicSession(api_client=self._api_client, websocket=ws)
    except TypeError:
      # Try with the older websockets API
      async with connect(uri, extra_headers=headers) as ws:
        await ws.send(request)
        logger.info(await ws.recv())

        yield AsyncMusicSession(api_client=self._api_client, websocket=ws)
|
@@ -0,0 +1,395 @@
|
|
|
1
|
+
# Copyright 2025 Google LLC
|
|
2
|
+
#
|
|
3
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
4
|
+
# you may not use this file except in compliance with the License.
|
|
5
|
+
# You may obtain a copy of the License at
|
|
6
|
+
#
|
|
7
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
8
|
+
#
|
|
9
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
10
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
11
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
12
|
+
# See the License for the specific language governing permissions and
|
|
13
|
+
# limitations under the License.
|
|
14
|
+
#
|
|
15
|
+
|
|
16
|
+
"""[Experimental] Text Only Local Tokenizer."""
|
|
17
|
+
|
|
18
|
+
import logging
|
|
19
|
+
from typing import Any, Iterable
|
|
20
|
+
from typing import Optional, Union
|
|
21
|
+
|
|
22
|
+
from sentencepiece import sentencepiece_model_pb2
|
|
23
|
+
|
|
24
|
+
from . import _common
|
|
25
|
+
from . import _local_tokenizer_loader as loader
|
|
26
|
+
from . import _transformers as t
|
|
27
|
+
from . import types
|
|
28
|
+
|
|
29
|
+
logger = logging.getLogger("google_genai.local_tokenizer")
|
|
30
|
+
|
|
31
|
+
__all__ = [
|
|
32
|
+
"_parse_hex_byte",
|
|
33
|
+
"_token_str_to_bytes",
|
|
34
|
+
"LocalTokenizer",
|
|
35
|
+
"_TextsAccumulator",
|
|
36
|
+
]
|
|
37
|
+
|
|
38
|
+
|
|
39
|
+
class _TextsAccumulator:
  """Accumulates countable texts from `Content` and `Tool` objects.

  This class is responsible for traversing complex `Content` and `Tool`
  objects and extracting all the text content that should be included when
  calculating token counts.

  A key feature of this class is its ability to detect unsupported fields in
  `Content` objects. If a user provides a `Content` object with fields that
  this local tokenizer doesn't recognize (e.g., new fields added in a future
  API update), this class will log a warning.

  The detection mechanism for `Content` objects works by recursively building
  a "counted" version of the input object. This "counted" object only
  contains the data that was successfully processed and added to the text
  list for tokenization. After traversing the input, the original `Content`
  object is compared to the "counted" object. If they don't match, it
  signifies the presence of unsupported fields, and a warning is logged.
  """

  def __init__(self) -> None:
    # Flat list of every text fragment that contributes to the token count.
    self._texts: list[str] = []

  def get_texts(self) -> Iterable[str]:
    """Returns all text fragments accumulated so far."""
    return self._texts

  def add_contents(self, contents: Iterable[types.Content]) -> None:
    """Adds every `Content` in the iterable to the accumulator."""
    for content in contents:
      self.add_content(content)

  def add_content(self, content: types.Content) -> None:
    """Extracts countable text from one `Content`; warns on unsupported fields.

    Raises:
      ValueError: If a part carries file or inline (binary) data, which this
        text-only tokenizer cannot count.
    """
    # Mirror of `content` holding only the fields we counted; compared to the
    # input at the end to detect unsupported fields.
    counted_content = types.Content(parts=[], role=content.role)
    if content.parts:
      for part in content.parts:
        assert counted_content.parts is not None
        counted_part = types.Part()
        if part.file_data is not None or part.inline_data is not None:
          raise ValueError(
              "LocalTokenizers do not support non-text content types."
          )
        if part.video_metadata is not None:
          counted_part.video_metadata = part.video_metadata
        if part.function_call is not None:
          self.add_function_call(part.function_call)
          counted_part.function_call = part.function_call
        if part.function_response is not None:
          self.add_function_response(part.function_response)
          counted_part.function_response = part.function_response
        if part.text is not None:
          counted_part.text = part.text
          self._texts.append(part.text)
        counted_content.parts.append(counted_part)

    if content.model_dump(exclude_none=True) != counted_content.model_dump(
        exclude_none=True
    ):
      logger.warning(
          "Content contains unsupported types for token counting. Supported"
          f" fields {counted_content}. Got {content}."
      )

  def add_function_call(self, function_call: types.FunctionCall) -> None:
    """Processes a function call and adds relevant text to the accumulator.

    Args:
      function_call: The function call to process.
    """
    if function_call.name:
      self._texts.append(function_call.name)
    # NOTE(review): the counted copy below is built but never returned or
    # compared — unlike `add_content`, no unsupported-field warning is emitted
    # here; confirm this is intentional.
    counted_function_call = types.FunctionCall(name=function_call.name)
    if function_call.args:
      counted_args = self._dict_traverse(function_call.args)
      counted_function_call.args = counted_args

  def add_tool(self, tool: types.Tool) -> types.Tool:
    """Adds the countable text of a tool's function declarations.

    Returns:
      A new `Tool` containing only the counted declaration fields.
    """
    counted_tool = types.Tool(function_declarations=[])
    if tool.function_declarations:
      for function_declaration in tool.function_declarations:
        counted_function_declaration = self._function_declaration_traverse(
            function_declaration
        )
        if counted_tool.function_declarations is None:
          counted_tool.function_declarations = []
        counted_tool.function_declarations.append(counted_function_declaration)

    return counted_tool

  def add_tools(self, tools: Iterable[types.Tool]) -> None:
    """Adds every tool in the iterable to the accumulator."""
    for tool in tools:
      self.add_tool(tool)

  def add_function_responses(
      self, function_responses: Iterable[types.FunctionResponse]
  ) -> None:
    """Adds every function response in the iterable to the accumulator."""
    for function_response in function_responses:
      self.add_function_response(function_response)

  def add_function_response(
      self, function_response: types.FunctionResponse
  ) -> None:
    """Adds a function response's name and response payload texts."""
    # NOTE(review): as in `add_function_call`, the counted copy is discarded.
    counted_function_response = types.FunctionResponse()
    if function_response.name:
      self._texts.append(function_response.name)
      counted_function_response.name = function_response.name
    if function_response.response:
      counted_response = self._dict_traverse(function_response.response)
      counted_function_response.response = counted_response

  def _function_declaration_traverse(
      self, function_declaration: types.FunctionDeclaration
  ) -> types.FunctionDeclaration:
    """Counts a declaration's name, description, parameters and response."""
    counted_function_declaration = types.FunctionDeclaration()
    if function_declaration.name:
      self._texts.append(function_declaration.name)
      counted_function_declaration.name = function_declaration.name
    if function_declaration.description:
      self._texts.append(function_declaration.description)
      counted_function_declaration.description = (
          function_declaration.description
      )
    if function_declaration.parameters:
      counted_parameters = self.add_schema(function_declaration.parameters)
      counted_function_declaration.parameters = counted_parameters
    if function_declaration.response:
      counted_response = self.add_schema(function_declaration.response)
      counted_function_declaration.response = counted_response
    return counted_function_declaration

  def add_schema(self, schema: types.Schema) -> types.Schema:
    """Processes a schema and adds relevant text to the accumulator.

    Args:
      schema: The schema to process.

    Returns:
      The new schema object with only countable fields.
    """
    counted_schema = types.Schema()
    # type/title/default/property_ordering are copied into the counted schema
    # but do not themselves contribute text to the token count.
    if schema.type:
      counted_schema.type = schema.type
    if schema.title:
      counted_schema.title = schema.title
    if schema.default is not None:
      counted_schema.default = schema.default
    if schema.format:
      self._texts.append(schema.format)
      counted_schema.format = schema.format
    if schema.description:
      self._texts.append(schema.description)
      counted_schema.description = schema.description
    if schema.enum:
      self._texts.extend(schema.enum)
      counted_schema.enum = schema.enum
    if schema.required:
      self._texts.extend(schema.required)
      counted_schema.required = schema.required
    if schema.property_ordering:
      counted_schema.property_ordering = schema.property_ordering
    if schema.items:
      # Recurse into array item schemas.
      counted_schema_items = self.add_schema(schema.items)
      counted_schema.items = counted_schema_items
    if schema.properties:
      d = {}
      for key, value in schema.properties.items():
        # Property names count toward tokens as well as their sub-schemas.
        self._texts.append(key)
        counted_value = self.add_schema(value)
        d[key] = counted_value
      counted_schema.properties = d
    if schema.example:
      counted_schema_example = self._any_traverse(schema.example)
      counted_schema.example = counted_schema_example
    return counted_schema

  def _dict_traverse(self, d: dict[str, Any]) -> dict[str, Any]:
    """Processes a dict and adds relevant text to the accumulator.

    Args:
      d: The dict to process.

    Returns:
      The new dict object with only countable fields.
    """
    counted_dict = {}
    # Keys always count; values are traversed recursively.
    self._texts.extend(list(d.keys()))
    for key, val in d.items():
      counted_dict[key] = self._any_traverse(val)
    return counted_dict

  def _any_traverse(self, value: Any) -> Any:
    """Processes a value and adds relevant text to the accumulator.

    Args:
      value: The value to process.

    Returns:
      The new value with only countable fields.
    """
    if isinstance(value, str):
      self._texts.append(value)
      return value
    elif isinstance(value, dict):
      return self._dict_traverse(value)
    elif isinstance(value, list):
      return [self._any_traverse(item) for item in value]
    else:
      # Non-string scalars (numbers, booleans, None) contribute no text.
      return value
+
def _token_str_to_bytes(
    token: str, type: sentencepiece_model_pb2.ModelProto.SentencePiece.Type
) -> bytes:
  """Converts one sentencepiece token string to its raw byte representation."""
  byte_kind = sentencepiece_model_pb2.ModelProto.SentencePiece.Type.BYTE
  if type != byte_kind:
    # Ordinary pieces mark word boundaries with U+2581 ("▁"); restore the
    # space before encoding.
    return token.replace("▁", " ").encode("utf-8")
  # BYTE pieces are spelled as '<0xXX>' literals; decode to the single byte.
  return _parse_hex_byte(token).to_bytes(length=1, byteorder="big")
def _parse_hex_byte(token: str) -> int:
|
|
257
|
+
"""Parses a hex byte string of the form '<0xXX>' and returns the integer value.
|
|
258
|
+
|
|
259
|
+
Raises ValueError if the input is malformed or the byte value is invalid.
|
|
260
|
+
"""
|
|
261
|
+
|
|
262
|
+
if len(token) != 6:
|
|
263
|
+
raise ValueError(f"Invalid byte length: {token}")
|
|
264
|
+
if not token.startswith("<0x") or not token.endswith(">"):
|
|
265
|
+
raise ValueError(f"Invalid byte format: {token}")
|
|
266
|
+
|
|
267
|
+
try:
|
|
268
|
+
val = int(token[3:5], 16) # Parse the hex part directly
|
|
269
|
+
except ValueError:
|
|
270
|
+
raise ValueError(f"Invalid hex value: {token}")
|
|
271
|
+
|
|
272
|
+
if val >= 256:
|
|
273
|
+
raise ValueError(f"Byte value out of range: {token}")
|
|
274
|
+
|
|
275
|
+
return val
|
|
276
|
+
|
|
277
|
+
|
|
278
|
+
class LocalTokenizer:
  """[Experimental] Text Only Local Tokenizer.

  This class provides a local tokenizer for text only token counting.

  LIMITATIONS:
  - Only supports text based tokenization and no multimodal tokenization.
  - Forward compatibility depends on the open-source tokenizer models for future
  Gemini versions.
  - For token counting of tools and response schemas, the `LocalTokenizer` only
  supports `types.Tool` and `types.Schema` objects. Python functions or Pydantic
  models cannot be passed directly.
  """

  def __init__(self, model_name: str):
    # Resolve the model to its tokenizer and load the sentencepiece assets
    # once up front; both count_tokens and compute_tokens reuse them.
    self._tokenizer_name = loader.get_tokenizer_name(model_name)
    self._model_proto = loader.load_model_proto(self._tokenizer_name)
    self._tokenizer = loader.get_sentencepiece(self._tokenizer_name)

  @_common.experimental_warning(
      "The SDK's local tokenizer implementation is experimental and may change"
      " in the future. It only supports text based tokenization."
  )
  def count_tokens(
      self,
      contents: Union[types.ContentListUnion, types.ContentListUnionDict],
      *,
      config: Optional[types.CountTokensConfigOrDict] = None,
  ) -> types.CountTokensResult:
    """Counts the number of tokens in a given text.

    Args:
      contents: The contents to tokenize.
      config: The configuration for counting tokens.

    Returns:
      A `CountTokensResult` containing the total number of tokens.

    Usage:

    .. code-block:: python

      from google import genai
      tokenizer = genai.LocalTokenizer(model_name='gemini-2.0-flash-001')
      result = tokenizer.count_tokens("What is your name?")
      print(result)
      # total_tokens=5
    """
    processed_contents = t.t_contents(contents)
    text_accumulator = _TextsAccumulator()
    # Accept either a dict or a CountTokensConfig (or None).
    config = types.CountTokensConfig.model_validate(config or {})
    text_accumulator.add_contents(processed_contents)
    if config.tools:
      text_accumulator.add_tools(config.tools)
    if config.generation_config and config.generation_config.response_schema:
      text_accumulator.add_schema(config.generation_config.response_schema)
    if config.system_instruction:
      text_accumulator.add_contents(t.t_contents([config.system_instruction]))
    # Batch-encode all accumulated fragments and sum the per-fragment lengths.
    tokens_list = self._tokenizer.encode(list(text_accumulator.get_texts()))
    return types.CountTokensResult(
        total_tokens=sum(len(tokens) for tokens in tokens_list)
    )

  @_common.experimental_warning(
      "The SDK's local tokenizer implementation is experimental and may change"
      " in the future. It only supports text based tokenization."
  )
  def compute_tokens(
      self,
      contents: Union[types.ContentListUnion, types.ContentListUnionDict],
  ) -> types.ComputeTokensResult:
    """Computes the tokens ids and string pieces in the input.

    Args:
      contents: The contents to tokenize.

    Returns:
      A `ComputeTokensResult` containing the token information.

    Usage:

    .. code-block:: python

      from google import genai
      tokenizer = genai.LocalTokenizer(model_name='gemini-2.0-flash-001')
      result = tokenizer.compute_tokens("What is your name?")
      print(result)
      # tokens_info=[TokensInfo(token_ids=[279, 329, 1313, 2508, 13], tokens=[b' What', b' is', b' your', b' name', b'?'], role='user')]
    """
    processed_contents = t.t_contents(contents)
    text_accumulator = _TextsAccumulator()
    for content in processed_contents:
      text_accumulator.add_content(content)
    tokens_protos = self._tokenizer.EncodeAsImmutableProto(
        text_accumulator.get_texts()
    )

    # Build a role per part, parallel to the encoded texts.
    # NOTE(review): the accumulator may emit more than one text per part
    # (e.g. function-call names/args), while exactly one role is appended per
    # part; zip() below silently truncates on mismatch — confirm alignment
    # for non-plain-text parts.
    roles = []
    for content in processed_contents:
      if content.parts:
        for _ in content.parts:
          roles.append(content.role)

    token_infos = []
    for tokens_proto, role in zip(tokens_protos, roles):
      token_infos.append(
          types.TokensInfo(
              token_ids=[piece.id for piece in tokens_proto.pieces],
              tokens=[
                  _token_str_to_bytes(
                      piece.piece, self._model_proto.pieces[piece.id].type
                  )
                  for piece in tokens_proto.pieces
              ],
              role=role,
          )
      )
    return types.ComputeTokensResult(tokens_info=token_infos)