google-genai 1.7.0__py3-none-any.whl → 1.9.0__py3-none-any.whl

This diff shows the published contents of two package versions as released to a supported public registry. It is provided for informational purposes only and reflects the changes between those versions as they appear in that registry.
google/genai/types.py CHANGED
@@ -137,10 +137,9 @@ class State(_common.CaseInSensitiveEnum):
 
 
 class FinishReason(_common.CaseInSensitiveEnum):
-  """Output only.
+  """Output only. The reason why the model stopped generating tokens.
 
-  The reason why the model stopped generating tokens. If empty, the model has
-  not stopped generating the tokens.
+  If empty, the model has not stopped generating the tokens.
   """
 
   FINISH_REASON_UNSPECIFIED = 'FINISH_REASON_UNSPECIFIED'
@@ -153,6 +152,7 @@ class FinishReason(_common.CaseInSensitiveEnum):
   PROHIBITED_CONTENT = 'PROHIBITED_CONTENT'
   SPII = 'SPII'
   MALFORMED_FUNCTION_CALL = 'MALFORMED_FUNCTION_CALL'
+  IMAGE_SAFETY = 'IMAGE_SAFETY'
 
 
 class HarmProbability(_common.CaseInSensitiveEnum):
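The new `IMAGE_SAFETY` member reports that generation stopped because produced images tripped safety filters. A minimal sketch of checking for it; the model name and prompt are illustrative assumptions, not part of this diff:

```python
from google import genai
from google.genai import types

client = genai.Client()  # assumes GOOGLE_API_KEY is set in the environment
response = client.models.generate_content(
    model='gemini-2.0-flash-exp',  # placeholder image-capable model
    contents='Generate a picture of a lighthouse.',
    config=types.GenerateContentConfig(response_modalities=['TEXT', 'IMAGE']),
)
for candidate in response.candidates or []:
  # IMAGE_SAFETY is new in 1.9.0: image output was blocked by safety filters.
  if candidate.finish_reason == types.FinishReason.IMAGE_SAFETY:
    print('Image output was blocked by safety filters.')
```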
@@ -185,6 +185,15 @@ class BlockedReason(_common.CaseInSensitiveEnum):
   PROHIBITED_CONTENT = 'PROHIBITED_CONTENT'
 
 
+class Modality(_common.CaseInSensitiveEnum):
+  """Server content modalities."""
+
+  MODALITY_UNSPECIFIED = 'MODALITY_UNSPECIFIED'
+  TEXT = 'TEXT'
+  IMAGE = 'IMAGE'
+  AUDIO = 'AUDIO'
+
+
 class DeploymentResourcesType(_common.CaseInSensitiveEnum):
   """"""
 
@@ -334,13 +343,15 @@ class FileSource(_common.CaseInSensitiveEnum):
   GENERATED = 'GENERATED'
 
 
-class Modality(_common.CaseInSensitiveEnum):
+class MediaModality(_common.CaseInSensitiveEnum):
   """Server content modalities."""
 
   MODALITY_UNSPECIFIED = 'MODALITY_UNSPECIFIED'
   TEXT = 'TEXT'
   IMAGE = 'IMAGE'
+  VIDEO = 'VIDEO'
   AUDIO = 'AUDIO'
+  DOCUMENT = 'DOCUMENT'
 
 
 class VideoMetadata(_common.BaseModel):
@@ -623,6 +634,11 @@ class Part(_common.BaseModel):
 
   @classmethod
   def from_video_metadata(cls, *, start_offset: str, end_offset: str) -> 'Part':
+    logger.warning("""Part.from_video_metadata will be deprecated soon.
+        Because a Part instance needs to include at least one of the fields:
+        text, file_data, inline_data, function_call, function_response, executable_code or code_execution_result.
+        A Part instance that contains only video_metadata is not a valid Part.
+        """)
     video_metadata = VideoMetadata(
         end_offset=end_offset, start_offset=start_offset
     )
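The warning above says a `Part` holding only `video_metadata` is invalid. A sketch of the construction it points toward instead, pairing `video_metadata` with `file_data`; the bucket URI is a placeholder:

```python
from google.genai import types

part = types.Part(
    file_data=types.FileData(
        file_uri='gs://my-bucket/clip.mp4',  # placeholder video URI
        mime_type='video/mp4',
    ),
    # Clip the referenced video rather than sending metadata alone.
    video_metadata=types.VideoMetadata(start_offset='0s', end_offset='10s'),
)
```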
@@ -692,7 +708,7 @@ class Content(_common.BaseModel):
       default=None,
       description="""Optional. The producer of the content. Must be either 'user' or
       'model'. Useful to set for multi-turn conversations, otherwise can be
-      left blank or unset. If role is not specified, SDK will determine the role.""",
+      empty. If role is not specified, SDK will determine the role.""",
   )
 
 
@@ -767,7 +783,7 @@ class ContentDict(TypedDict, total=False):
   role: Optional[str]
   """Optional. The producer of the content. Must be either 'user' or
   'model'. Useful to set for multi-turn conversations, otherwise can be
-  left blank or unset. If role is not specified, SDK will determine the role."""
+  empty. If role is not specified, SDK will determine the role."""
 
 
 ContentOrDict = Union[Content, ContentDict]
@@ -832,9 +848,6 @@ class Schema(_common.BaseModel):
       default=None,
       description="""Optional. Maximum length of the Type.STRING""",
   )
-  title: Optional[str] = Field(
-      default=None, description="""Optional. The title of the Schema."""
-  )
   min_length: Optional[int] = Field(
       default=None,
       description="""Optional. SCHEMA FIELDS FOR TYPE STRING Minimum length of the Type.STRING""",
@@ -898,6 +911,9 @@ class Schema(_common.BaseModel):
       default=None,
       description="""Optional. Required properties of Type.OBJECT.""",
   )
+  title: Optional[str] = Field(
+      default=None, description="""Optional. The title of the Schema."""
+  )
   type: Optional[Type] = Field(
       default=None, description="""Optional. The type of the data."""
   )
@@ -921,9 +937,6 @@ class SchemaDict(TypedDict, total=False):
   max_length: Optional[int]
   """Optional. Maximum length of the Type.STRING"""
 
-  title: Optional[str]
-  """Optional. The title of the Schema."""
-
   min_length: Optional[int]
   """Optional. SCHEMA FIELDS FOR TYPE STRING Minimum length of the Type.STRING"""
 
@@ -972,6 +985,9 @@ class SchemaDict(TypedDict, total=False):
   required: Optional[list[str]]
   """Optional. Required properties of Type.OBJECT."""
 
+  title: Optional[str]
+  """Optional. The title of the Schema."""
+
   type: Optional[Type]
   """Optional. The type of the data."""
 
@@ -1210,25 +1226,34 @@ GoogleSearchRetrievalOrDict = Union[
 
 
 class VertexAISearch(_common.BaseModel):
-  """Retrieve from Vertex AI Search datastore for grounding.
+  """Retrieve from Vertex AI Search datastore or engine for grounding.
 
-  See https://cloud.google.com/products/agent-builder
+  datastore and engine are mutually exclusive. See
+  https://cloud.google.com/products/agent-builder
   """
 
   datastore: Optional[str] = Field(
       default=None,
-      description="""Required. Fully-qualified Vertex AI Search data store resource ID. Format: `projects/{project}/locations/{location}/collections/{collection}/dataStores/{dataStore}`""",
+      description="""Optional. Fully-qualified Vertex AI Search data store resource ID. Format: `projects/{project}/locations/{location}/collections/{collection}/dataStores/{dataStore}`""",
+  )
+  engine: Optional[str] = Field(
+      default=None,
+      description="""Optional. Fully-qualified Vertex AI Search engine resource ID. Format: `projects/{project}/locations/{location}/collections/{collection}/engines/{engine}`""",
   )
 
 
 class VertexAISearchDict(TypedDict, total=False):
-  """Retrieve from Vertex AI Search datastore for grounding.
+  """Retrieve from Vertex AI Search datastore or engine for grounding.
 
-  See https://cloud.google.com/products/agent-builder
+  datastore and engine are mutually exclusive. See
+  https://cloud.google.com/products/agent-builder
   """
 
   datastore: Optional[str]
-  """Required. Fully-qualified Vertex AI Search data store resource ID. Format: `projects/{project}/locations/{location}/collections/{collection}/dataStores/{dataStore}`"""
+  """Optional. Fully-qualified Vertex AI Search data store resource ID. Format: `projects/{project}/locations/{location}/collections/{collection}/dataStores/{dataStore}`"""
+
+  engine: Optional[str]
+  """Optional. Fully-qualified Vertex AI Search engine resource ID. Format: `projects/{project}/locations/{location}/collections/{collection}/engines/{engine}`"""
 
 
 VertexAISearchOrDict = Union[VertexAISearch, VertexAISearchDict]
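`datastore` and `engine` are both `Optional` now, but the docstring makes them mutually exclusive: set exactly one. A sketch with a placeholder engine resource name:

```python
from google.genai import types

search_tool = types.Tool(
    retrieval=types.Retrieval(
        vertex_ai_search=types.VertexAISearch(
            # Either datastore= or engine=, never both.
            engine='projects/my-project/locations/global/collections/default_collection/engines/my-engine',
        )
    )
)
```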
@@ -2740,13 +2765,15 @@ class Candidate(_common.BaseModel):
       description="""Number of tokens for this candidate.
       """,
   )
-  avg_logprobs: Optional[float] = Field(
+  finish_reason: Optional[FinishReason] = Field(
       default=None,
-      description="""Output only. Average log probability score of the candidate.""",
+      description="""The reason why the model stopped generating tokens.
+      If empty, the model has not stopped generating the tokens.
+      """,
   )
-  finish_reason: Optional[FinishReason] = Field(
+  avg_logprobs: Optional[float] = Field(
       default=None,
-      description="""Output only. The reason why the model stopped generating tokens. If empty, the model has not stopped generating the tokens.""",
+      description="""Output only. Average log probability score of the candidate.""",
   )
   grounding_metadata: Optional[GroundingMetadata] = Field(
       default=None,
@@ -2784,12 +2811,14 @@ class CandidateDict(TypedDict, total=False):
   """Number of tokens for this candidate.
   """
 
+  finish_reason: Optional[FinishReason]
+  """The reason why the model stopped generating tokens.
+  If empty, the model has not stopped generating the tokens.
+  """
+
   avg_logprobs: Optional[float]
   """Output only. Average log probability score of the candidate."""
 
-  finish_reason: Optional[FinishReason]
-  """Output only. The reason why the model stopped generating tokens. If empty, the model has not stopped generating the tokens."""
-
   grounding_metadata: Optional[GroundingMetadataDict]
   """Output only. Metadata specifies sources used to ground generated content."""
 
@@ -2840,9 +2869,38 @@ GenerateContentResponsePromptFeedbackOrDict = Union[
 ]
 
 
+class ModalityTokenCount(_common.BaseModel):
+  """Represents token counting info for a single modality."""
+
+  modality: Optional[MediaModality] = Field(
+      default=None,
+      description="""The modality associated with this token count.""",
+  )
+  token_count: Optional[int] = Field(
+      default=None, description="""Number of tokens."""
+  )
+
+
+class ModalityTokenCountDict(TypedDict, total=False):
+  """Represents token counting info for a single modality."""
+
+  modality: Optional[MediaModality]
+  """The modality associated with this token count."""
+
+  token_count: Optional[int]
+  """Number of tokens."""
+
+
+ModalityTokenCountOrDict = Union[ModalityTokenCount, ModalityTokenCountDict]
+
+
 class GenerateContentResponseUsageMetadata(_common.BaseModel):
   """Usage metadata about response(s)."""
 
+  cache_tokens_details: Optional[list[ModalityTokenCount]] = Field(
+      default=None,
+      description="""Output only. List of modalities of the cached content in the request input.""",
+  )
   cached_content_token_count: Optional[int] = Field(
       default=None,
       description="""Output only. Number of tokens in the cached part in the input (the cached content).""",
@@ -2850,30 +2908,68 @@ class GenerateContentResponseUsageMetadata(_common.BaseModel):
   candidates_token_count: Optional[int] = Field(
       default=None, description="""Number of tokens in the response(s)."""
   )
+  candidates_tokens_details: Optional[list[ModalityTokenCount]] = Field(
+      default=None,
+      description="""Output only. List of modalities that were returned in the response.""",
+  )
   prompt_token_count: Optional[int] = Field(
       default=None,
       description="""Number of tokens in the request. When `cached_content` is set, this is still the total effective prompt size meaning this includes the number of tokens in the cached content.""",
   )
+  prompt_tokens_details: Optional[list[ModalityTokenCount]] = Field(
+      default=None,
+      description="""Output only. List of modalities that were processed in the request input.""",
+  )
+  thoughts_token_count: Optional[int] = Field(
+      default=None,
+      description="""Output only. Number of tokens present in thoughts output.""",
+  )
+  tool_use_prompt_token_count: Optional[int] = Field(
+      default=None,
+      description="""Output only. Number of tokens present in tool-use prompt(s).""",
+  )
+  tool_use_prompt_tokens_details: Optional[list[ModalityTokenCount]] = Field(
+      default=None,
+      description="""Output only. List of modalities that were processed for tool-use request inputs.""",
+  )
   total_token_count: Optional[int] = Field(
       default=None,
-      description="""Total token count for prompt and response candidates.""",
+      description="""Total token count for prompt, response candidates, and tool-use prompts (if present).""",
   )
 
 
 class GenerateContentResponseUsageMetadataDict(TypedDict, total=False):
   """Usage metadata about response(s)."""
 
+  cache_tokens_details: Optional[list[ModalityTokenCountDict]]
+  """Output only. List of modalities of the cached content in the request input."""
+
   cached_content_token_count: Optional[int]
   """Output only. Number of tokens in the cached part in the input (the cached content)."""
 
   candidates_token_count: Optional[int]
   """Number of tokens in the response(s)."""
 
+  candidates_tokens_details: Optional[list[ModalityTokenCountDict]]
+  """Output only. List of modalities that were returned in the response."""
+
   prompt_token_count: Optional[int]
   """Number of tokens in the request. When `cached_content` is set, this is still the total effective prompt size meaning this includes the number of tokens in the cached content."""
 
+  prompt_tokens_details: Optional[list[ModalityTokenCountDict]]
+  """Output only. List of modalities that were processed in the request input."""
+
+  thoughts_token_count: Optional[int]
+  """Output only. Number of tokens present in thoughts output."""
+
+  tool_use_prompt_token_count: Optional[int]
+  """Output only. Number of tokens present in tool-use prompt(s)."""
+
+  tool_use_prompt_tokens_details: Optional[list[ModalityTokenCountDict]]
+  """Output only. List of modalities that were processed for tool-use request inputs."""
+
   total_token_count: Optional[int]
-  """Total token count for prompt and response candidates."""
+  """Total token count for prompt, response candidates, and tool-use prompts (if present)."""
 
 
 GenerateContentResponseUsageMetadataOrDict = Union[
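The scalar counts gain per-modality breakdowns, each entry a `ModalityTokenCount`. A sketch of reading them off a response; the model name is a placeholder:

```python
from google import genai

client = genai.Client()
response = client.models.generate_content(
    model='gemini-2.0-flash',  # placeholder model name
    contents='Hello there.',
)
usage = response.usage_metadata
print('total:', usage.total_token_count)
# New in 1.9.0: how many tokens each modality (TEXT, IMAGE, ...) contributed.
for detail in usage.prompt_tokens_details or []:
  print(detail.modality, detail.token_count)
```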
@@ -2914,12 +3010,14 @@ class GenerateContentResponse(_common.BaseModel):
   automatic_function_calling_history: Optional[list[Content]] = None
   parsed: Optional[Union[pydantic.BaseModel, dict, Enum]] = Field(
       default=None,
-      description="""Parsed response if response_schema is provided. Not available for streaming.""",
+      description="""First candidate from the parsed response if response_schema is provided. Not available for streaming.""",
   )
 
-  @property
-  def text(self) -> Optional[str]:
-    """Returns the concatenation of all text parts in the response."""
+  def _get_text(self, warn_property: str = 'text') -> Optional[str]:
+    """Returns the concatenation of all text parts in the response.
+
+    This is an internal method that allows customizing the warning message.
+    """
     if (
         not self.candidates
         or not self.candidates[0].content
@@ -2928,9 +3026,10 @@ class GenerateContentResponse(_common.BaseModel):
       return None
     if len(self.candidates) > 1:
       logger.warning(
-          f'there are {len(self.candidates)} candidates, returning text from'
-          ' the first candidate.Access response.candidates directly to get'
-          ' text from other candidates.'
+          f'there are {len(self.candidates)} candidates, returning'
+          f' {warn_property} result from the first candidate. Access'
+          ' response.candidates directly to get the result from other'
+          ' candidates.'
       )
     text = ''
     any_text_part_text = False
@@ -2949,12 +3048,18 @@ class GenerateContentResponse(_common.BaseModel):
     if non_text_parts:
       logger.warning(
           'Warning: there are non-text parts in the response:'
-          f' {non_text_parts},returning concatenated text from text parts,check'
-          ' out the non text parts for full response from model.'
+          f' {non_text_parts},returning concatenated {warn_property} result'
+          ' from text parts,check out the non text parts for full response'
+          ' from model.'
       )
     # part.text == '' is different from part.text is None
     return text if any_text_part_text else None
 
+  @property
+  def text(self) -> Optional[str]:
+    """Returns the concatenation of all text parts in the response."""
+    return self._get_text(warn_property='text')
+
   @property
   def function_calls(self) -> Optional[list[FunctionCall]]:
     """Returns the list of function calls in the response."""
@@ -3037,16 +3142,23 @@ class GenerateContentResponse(_common.BaseModel):
       ):
         # Pydantic schema.
         try:
-          if result.text is not None:
-            result.parsed = response_schema.model_validate_json(result.text)
+          result_text = result._get_text(warn_property='parsed')
+          if result_text is not None:
+            result.parsed = response_schema.model_validate_json(result_text)
         # may not be a valid json per stream response
         except pydantic.ValidationError:
           pass
         except json.decoder.JSONDecodeError:
           pass
-      elif isinstance(response_schema, EnumMeta) and result.text is not None:
+      elif (
+          isinstance(response_schema, EnumMeta)
+          and result._get_text(warn_property='parsed') is not None
+      ):
         # Enum with "application/json" returns response in double quotes.
-        enum_value = result.text.replace('"', '')
+        result_text = result._get_text(warn_property='parsed')
+        if result_text is None:
+          raise ValueError('Response is empty.')
+        enum_value = result_text.replace('"', '')
         try:
           result.parsed = response_schema(enum_value)
           if (
@@ -3064,8 +3176,9 @@ class GenerateContentResponse(_common.BaseModel):
           placeholder: response_schema  # type: ignore[valid-type]
 
         try:
-          if result.text is not None:
-            parsed = {'placeholder': json.loads(result.text)}
+          result_text = result._get_text(warn_property='parsed')
+          if result_text is not None:
+            parsed = {'placeholder': json.loads(result_text)}
             placeholder = Placeholder.model_validate(parsed)
             result.parsed = placeholder.placeholder
         except json.decoder.JSONDecodeError:
@@ -3080,8 +3193,9 @@ class GenerateContentResponse(_common.BaseModel):
         # want the result converted to. So just return json.
         # JSON schema.
         try:
-          if result.text is not None:
-            result.parsed = json.loads(result.text)
+          result_text = result._get_text(warn_property='parsed')
+          if result_text is not None:
+            result.parsed = json.loads(result_text)
         # may not be a valid json per stream response
         except json.decoder.JSONDecodeError:
           pass
@@ -3091,12 +3205,13 @@ class GenerateContentResponse(_common.BaseModel):
         for union_type in union_types:
           if issubclass(union_type, pydantic.BaseModel):
             try:
-              if result.text is not None:
+              result_text = result._get_text(warn_property='parsed')
+              if result_text is not None:
 
                 class Placeholder(pydantic.BaseModel):  # type: ignore[no-redef]
                   placeholder: response_schema  # type: ignore[valid-type]
 
-                parsed = {'placeholder': json.loads(result.text)}
+                parsed = {'placeholder': json.loads(result_text)}
                 placeholder = Placeholder.model_validate(parsed)
                 result.parsed = placeholder.placeholder
             except json.decoder.JSONDecodeError:
@@ -3105,8 +3220,9 @@ class GenerateContentResponse(_common.BaseModel):
               pass
           else:
             try:
-              if result.text is not None:
-                result.parsed = json.loads(result.text)
+              result_text = result._get_text(warn_property='parsed')
+              if result_text is not None:
+                result.parsed = json.loads(result_text)
             # may not be a valid json per stream response
             except json.decoder.JSONDecodeError:
               pass
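Every former `result.text` call site above now goes through `_get_text(warn_property='parsed')`, so the multi-candidate warning names the property actually being read; the observable behavior of `parsed` is unchanged. A sketch of the pydantic path, with a placeholder model name:

```python
import pydantic
from google import genai
from google.genai import types


class Recipe(pydantic.BaseModel):
  name: str
  minutes: int


client = genai.Client()
response = client.models.generate_content(
    model='gemini-2.0-flash',  # placeholder model name
    contents='Give me a quick cookie recipe as JSON.',
    config=types.GenerateContentConfig(
        response_mime_type='application/json',
        response_schema=Recipe,
    ),
)
# Per the reworded description in this diff, parsed holds only the FIRST
# candidate, validated against Recipe.
recipe = response.parsed
```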
@@ -3436,7 +3552,8 @@ class GenerateImagesConfig(_common.BaseModel):
   )
   include_safety_attributes: Optional[bool] = Field(
       default=None,
-      description="""Whether to report the safety scores of each image in the response.
+      description="""Whether to report the safety scores of each generated image and
+      the positive prompt in the response.
       """,
   )
   include_rai_reason: Optional[bool] = Field(
@@ -3515,7 +3632,8 @@ class GenerateImagesConfigDict(TypedDict, total=False):
   """
 
   include_safety_attributes: Optional[bool]
-  """Whether to report the safety scores of each image in the response.
+  """Whether to report the safety scores of each generated image and
+  the positive prompt in the response.
   """
 
   include_rai_reason: Optional[bool]
@@ -3761,6 +3879,11 @@ class SafetyAttributes(_common.BaseModel):
       description="""List of scores of each categories.
       """,
   )
+  content_type: Optional[str] = Field(
+      default=None,
+      description="""Internal use only.
+      """,
+  )
 
 
 class SafetyAttributesDict(TypedDict, total=False):
@@ -3774,6 +3897,10 @@ class SafetyAttributesDict(TypedDict, total=False):
   """List of scores of each categories.
   """
 
+  content_type: Optional[str]
+  """Internal use only.
+  """
+
 
 SafetyAttributesOrDict = Union[SafetyAttributes, SafetyAttributesDict]
 
@@ -3840,6 +3967,12 @@ class GenerateImagesResponse(_common.BaseModel):
       description="""List of generated images.
       """,
   )
+  positive_prompt_safety_attributes: Optional[SafetyAttributes] = Field(
+      default=None,
+      description="""Safety attributes of the positive prompt. Only populated if
+      ``include_safety_attributes`` is set to True.
+      """,
+  )
 
 
 class GenerateImagesResponseDict(TypedDict, total=False):
@@ -3849,6 +3982,11 @@ class GenerateImagesResponseDict(TypedDict, total=False):
   """List of generated images.
   """
 
+  positive_prompt_safety_attributes: Optional[SafetyAttributesDict]
+  """Safety attributes of the positive prompt. Only populated if
+  ``include_safety_attributes`` is set to True.
+  """
+
 
 GenerateImagesResponseOrDict = Union[
     GenerateImagesResponse, GenerateImagesResponseDict
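A sketch of requesting and reading the new prompt-level safety attributes; the Imagen model name is a placeholder:

```python
from google import genai
from google.genai import types

client = genai.Client()
response = client.models.generate_images(
    model='imagen-3.0-generate-002',  # placeholder Imagen model name
    prompt='A sunlit meadow',
    config=types.GenerateImagesConfig(
        number_of_images=1,
        include_safety_attributes=True,  # now also covers the positive prompt
    ),
)
attrs = response.positive_prompt_safety_attributes  # new in 1.9.0
if attrs and attrs.categories and attrs.scores:
  for category, score in zip(attrs.categories, attrs.scores):
    print(category, score)
```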
@@ -4085,7 +4223,8 @@ class EditImageConfig(_common.BaseModel):
   )
   include_safety_attributes: Optional[bool] = Field(
       default=None,
-      description="""Whether to report the safety scores of each image in the response.
+      description="""Whether to report the safety scores of each generated image and
+      the positive prompt in the response.
       """,
   )
   include_rai_reason: Optional[bool] = Field(
@@ -4163,7 +4302,8 @@ class EditImageConfigDict(TypedDict, total=False):
   """
 
   include_safety_attributes: Optional[bool]
-  """Whether to report the safety scores of each image in the response.
+  """Whether to report the safety scores of each generated image and
+  the positive prompt in the response.
   """
 
   include_rai_reason: Optional[bool]
@@ -5313,14 +5453,7 @@ GenerateVideosResponseOrDict = Union[
 ]
 
 
 class GenerateVideosOperation(_common.BaseModel):
-  """A video generation operation.
-
-  Use the following code to refresh the operation:
-
-  ```
-  operation = client.operations.get(operation)
-  ```
-  """
+  """A video generation operation."""
 
   name: Optional[str] = Field(
       default=None,
@@ -5348,14 +5481,7 @@ class GenerateVideosOperation(_common.BaseModel):
 
 
 class GenerateVideosOperationDict(TypedDict, total=False):
-  """A video generation operation.
-
-  Use the following code to refresh the operation:
-
-  ```
-  operation = client.operations.get(operation)
-  ```
-  """
+  """A video generation operation."""
 
   name: Optional[str]
   """The server-assigned name, which is only unique within the same service that originally returns it. If you use the default HTTP mapping, the `name` should be a resource name ending with `operations/{unique_id}`."""
@@ -6603,11 +6729,11 @@ class CreateCachedContentConfig(_common.BaseModel):
   )
   ttl: Optional[str] = Field(
       default=None,
-      description="""The TTL for this resource. The expiration time is computed: now + TTL.""",
+      description="""The TTL for this resource. The expiration time is computed: now + TTL. It is a duration string, with up to nine fractional digits, terminated by 's'. Example: "3.5s".""",
   )
   expire_time: Optional[datetime.datetime] = Field(
       default=None,
-      description="""Timestamp of when this resource is considered expired.""",
+      description="""Timestamp of when this resource is considered expired. Uses RFC 3339 format, Example: 2014-10-02T15:01:23Z.""",
   )
   display_name: Optional[str] = Field(
       default=None,
@@ -6643,10 +6769,10 @@ class CreateCachedContentConfigDict(TypedDict, total=False):
   """Used to override HTTP request options."""
 
   ttl: Optional[str]
-  """The TTL for this resource. The expiration time is computed: now + TTL."""
+  """The TTL for this resource. The expiration time is computed: now + TTL. It is a duration string, with up to nine fractional digits, terminated by 's'. Example: "3.5s"."""
 
   expire_time: Optional[datetime.datetime]
-  """Timestamp of when this resource is considered expired."""
+  """Timestamp of when this resource is considered expired. Uses RFC 3339 format, Example: 2014-10-02T15:01:23Z."""
 
   display_name: Optional[str]
   """The user-generated meaningful display name of the cached content.
@@ -6937,11 +7063,11 @@ class UpdateCachedContentConfig(_common.BaseModel):
   )
   ttl: Optional[str] = Field(
       default=None,
-      description="""The TTL for this resource. The expiration time is computed: now + TTL.""",
+      description="""The TTL for this resource. The expiration time is computed: now + TTL. It is a duration string, with up to nine fractional digits, terminated by 's'. Example: "3.5s".""",
   )
   expire_time: Optional[datetime.datetime] = Field(
       default=None,
-      description="""Timestamp of when this resource is considered expired.""",
+      description="""Timestamp of when this resource is considered expired. Uses RFC 3339 format, Example: 2014-10-02T15:01:23Z.""",
   )
 
 
@@ -6952,10 +7078,10 @@ class UpdateCachedContentConfigDict(TypedDict, total=False):
   """Used to override HTTP request options."""
 
   ttl: Optional[str]
-  """The TTL for this resource. The expiration time is computed: now + TTL."""
+  """The TTL for this resource. The expiration time is computed: now + TTL. It is a duration string, with up to nine fractional digits, terminated by 's'. Example: "3.5s"."""
 
   expire_time: Optional[datetime.datetime]
-  """Timestamp of when this resource is considered expired."""
+  """Timestamp of when this resource is considered expired. Uses RFC 3339 format, Example: 2014-10-02T15:01:23Z."""
 
 
 UpdateCachedContentConfigOrDict = Union[
@@ -7985,6 +8111,10 @@ class TestTableItem(_common.BaseModel):
       default=None,
       description="""When set to a reason string, this test will be skipped in the API mode. Use this flag for tests that can not be reproduced with the real API. E.g. a test that deletes a resource.""",
   )
+  ignore_keys: Optional[list[str]] = Field(
+      default=None,
+      description="""Keys to ignore when comparing the request and response. This is useful for tests that are not deterministic.""",
+  )
 
 
 class TestTableItemDict(TypedDict, total=False):
@@ -8010,6 +8140,9 @@ class TestTableItemDict(TypedDict, total=False):
   skip_in_api_mode: Optional[str]
   """When set to a reason string, this test will be skipped in the API mode. Use this flag for tests that can not be reproduced with the real API. E.g. a test that deletes a resource."""
 
+  ignore_keys: Optional[list[str]]
+  """Keys to ignore when comparing the request and response. This is useful for tests that are not deterministic."""
+
 
 TestTableItemOrDict = Union[TestTableItem, TestTableItemDict]
 
@@ -8641,6 +8774,36 @@ LiveServerSetupCompleteOrDict = Union[
 ]
 
 
+class Transcription(_common.BaseModel):
+  """Audio transcription in Server Content."""
+
+  text: Optional[str] = Field(
+      default=None,
+      description="""Transcription text.
+      """,
+  )
+  finished: Optional[bool] = Field(
+      default=None,
+      description="""The bool indicates the end of the transcription.
+      """,
+  )
+
+
+class TranscriptionDict(TypedDict, total=False):
+  """Audio transcription in Server Content."""
+
+  text: Optional[str]
+  """Transcription text.
+  """
+
+  finished: Optional[bool]
+  """The bool indicates the end of the transcription.
+  """
+
+
+TranscriptionOrDict = Union[Transcription, TranscriptionDict]
+
+
 class LiveServerContent(_common.BaseModel):
   """Incremental server update generated by the model in response to client messages.
 
@@ -8660,6 +8823,30 @@ class LiveServerContent(_common.BaseModel):
       default=None,
       description="""If true, indicates that a client message has interrupted current model generation. If the client is playing out the content in realtime, this is a good signal to stop and empty the current queue.""",
   )
+  generation_complete: Optional[bool] = Field(
+      default=None,
+      description="""If true, indicates that the model is done generating. When model is
+      interrupted while generating there will be no generation_complete message
+      in interrupted turn, it will go through interrupted > turn_complete.
+      When model assumes realtime playback there will be delay between
+      generation_complete and turn_complete that is caused by model
+      waiting for playback to finish. If true, indicates that the model
+      has finished generating all content. This is a signal to the client
+      that it can stop sending messages.""",
+  )
+  input_transcription: Optional[Transcription] = Field(
+      default=None,
+      description="""Input transcription. The transcription is independent to the model
+      turn which means it doesn’t imply any ordering between transcription and
+      model turn.""",
+  )
+  output_transcription: Optional[Transcription] = Field(
+      default=None,
+      description="""Output transcription. The transcription is independent to the model
+      turn which means it doesn’t imply any ordering between transcription and
+      model turn.
+      """,
+  )
 
 
 class LiveServerContentDict(TypedDict, total=False):
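A sketch of a live receive loop that watches the new fields; the connect/send surface shown is this SDK's live API, but the model name is a placeholder, and transcription only arrives when the corresponding configs (added later in this diff) are set:

```python
import asyncio

from google import genai
from google.genai import types


async def main() -> None:
  client = genai.Client()
  config = types.LiveConnectConfig(
      response_modalities=['AUDIO'],
      output_audio_transcription=types.AudioTranscriptionConfig(),
  )
  async with client.aio.live.connect(
      model='gemini-2.0-flash-exp',  # placeholder live-capable model
      config=config,
  ) as session:
    await session.send(input='Hello', end_of_turn=True)
    async for message in session.receive():
      content = message.server_content
      if content is None:
        continue
      if content.output_transcription:  # new in 1.9.0
        print('model said:', content.output_transcription.text)
      if content.generation_complete:   # new in 1.9.0
        print('generation finished; playback may still be draining')
      if content.turn_complete:
        break


asyncio.run(main())
```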
@@ -8678,6 +8865,27 @@ class LiveServerContentDict(TypedDict, total=False):
   interrupted: Optional[bool]
   """If true, indicates that a client message has interrupted current model generation. If the client is playing out the content in realtime, this is a good signal to stop and empty the current queue."""
 
+  generation_complete: Optional[bool]
+  """If true, indicates that the model is done generating. When model is
+  interrupted while generating there will be no generation_complete message
+  in interrupted turn, it will go through interrupted > turn_complete.
+  When model assumes realtime playback there will be delay between
+  generation_complete and turn_complete that is caused by model
+  waiting for playback to finish. If true, indicates that the model
+  has finished generating all content. This is a signal to the client
+  that it can stop sending messages."""
+
+  input_transcription: Optional[TranscriptionDict]
+  """Input transcription. The transcription is independent to the model
+  turn which means it doesn’t imply any ordering between transcription and
+  model turn."""
+
+  output_transcription: Optional[TranscriptionDict]
+  """Output transcription. The transcription is independent to the model
+  turn which means it doesn’t imply any ordering between transcription and
+  model turn.
+  """
+
 
 LiveServerContentOrDict = Union[LiveServerContent, LiveServerContentDict]
 
@@ -8817,15 +9025,7 @@ class LiveClientSetup(_common.BaseModel):
   generation_config: Optional[GenerationConfig] = Field(
       default=None,
       description="""The generation configuration for the session.
-
-      The following fields are supported:
-      - `response_logprobs`
-      - `response_mime_type`
-      - `logprobs`
-      - `response_schema`
-      - `stop_sequence`
-      - `routing_config`
-      - `audio_timestamp`
+      Note: only a subset of fields are supported.
       """,
   )
   system_instruction: Optional[Content] = Field(
@@ -8855,15 +9055,7 @@ class LiveClientSetupDict(TypedDict, total=False):
 
   generation_config: Optional[GenerationConfigDict]
   """The generation configuration for the session.
-
-  The following fields are supported:
-  - `response_logprobs`
-  - `response_mime_type`
-  - `logprobs`
-  - `response_schema`
-  - `stop_sequence`
-  - `routing_config`
-  - `audio_timestamp`
+  Note: only a subset of fields are supported.
   """
 
   system_instruction: Optional[ContentDict]
@@ -8937,11 +9129,11 @@ LiveClientContentOrDict = Union[LiveClientContent, LiveClientContentDict]
 class LiveClientRealtimeInput(_common.BaseModel):
   """User input that is sent in real time.
 
-  This is different from `ClientContentUpdate` in a few ways:
+  This is different from `LiveClientContent` in a few ways:
 
   - Can be sent continuously without interruption to model generation.
   - If there is a need to mix data interleaved across the
-    `ClientContentUpdate` and the `RealtimeUpdate`, server attempts to
+    `LiveClientContent` and the `LiveClientRealtimeInput`, server attempts to
     optimize for best response, but there are no guarantees.
   - End of turn is not explicitly specified, but is rather derived from user
     activity (for example, end of speech).
@@ -8959,11 +9151,11 @@ class LiveClientRealtimeInput(_common.BaseModel):
 class LiveClientRealtimeInputDict(TypedDict, total=False):
   """User input that is sent in real time.
 
-  This is different from `ClientContentUpdate` in a few ways:
+  This is different from `LiveClientContent` in a few ways:
 
   - Can be sent continuously without interruption to model generation.
   - If there is a need to mix data interleaved across the
-    `ClientContentUpdate` and the `RealtimeUpdate`, server attempts to
+    `LiveClientContent` and the `LiveClientRealtimeInput`, server attempts to
     optimize for best response, but there are no guarantees.
   - End of turn is not explicitly specified, but is rather derived from user
     activity (for example, end of speech).
@@ -9059,6 +9251,23 @@ class LiveClientMessageDict(TypedDict, total=False):
 LiveClientMessageOrDict = Union[LiveClientMessage, LiveClientMessageDict]
 
 
+class AudioTranscriptionConfig(_common.BaseModel):
+  """The audio transcription configuration in Setup."""
+
+  pass
+
+
+class AudioTranscriptionConfigDict(TypedDict, total=False):
+  """The audio transcription configuration in Setup."""
+
+  pass
+
+
+AudioTranscriptionConfigOrDict = Union[
+    AudioTranscriptionConfig, AudioTranscriptionConfigDict
+]
+
+
 class LiveConnectConfig(_common.BaseModel):
   """Session config for the API connection."""
 
@@ -9072,6 +9281,42 @@ class LiveConnectConfig(_common.BaseModel):
       modalities that the model can return. Defaults to AUDIO if not specified.
       """,
   )
+  temperature: Optional[float] = Field(
+      default=None,
+      description="""Value that controls the degree of randomness in token selection.
+      Lower temperatures are good for prompts that require a less open-ended or
+      creative response, while higher temperatures can lead to more diverse or
+      creative results.
+      """,
+  )
+  top_p: Optional[float] = Field(
+      default=None,
+      description="""Tokens are selected from the most to least probable until the sum
+      of their probabilities equals this value. Use a lower value for less
+      random responses and a higher value for more random responses.
+      """,
+  )
+  top_k: Optional[float] = Field(
+      default=None,
+      description="""For each token selection step, the ``top_k`` tokens with the
+      highest probabilities are sampled. Then tokens are further filtered based
+      on ``top_p`` with the final token selected using temperature sampling. Use
+      a lower number for less random responses and a higher number for more
+      random responses.
+      """,
+  )
+  max_output_tokens: Optional[int] = Field(
+      default=None,
+      description="""Maximum number of tokens that can be generated in the response.
+      """,
+  )
+  seed: Optional[int] = Field(
+      default=None,
+      description="""When ``seed`` is fixed to a specific number, the model makes a best
+      effort to provide the same response for repeated requests. By default, a
+      random number is used.
+      """,
+  )
   speech_config: Optional[SpeechConfig] = Field(
       default=None,
       description="""The speech generation configuration.
@@ -9091,6 +9336,17 @@ class LiveConnectConfig(_common.BaseModel):
       external systems to perform an action, or set of actions, outside of
       knowledge and scope of the model.""",
   )
+  input_audio_transcription: Optional[AudioTranscriptionConfig] = Field(
+      default=None,
+      description="""The transcription of the input aligns with the input audio language.
+      """,
+  )
+  output_audio_transcription: Optional[AudioTranscriptionConfig] = Field(
+      default=None,
+      description="""The transcription of the output aligns with the language code
+      specified for the output audio.
+      """,
+  )
 
 
 class LiveConnectConfigDict(TypedDict, total=False):
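The sampling knobs that previously had to travel through the now-unlisted `generation_config` fields sit directly on `LiveConnectConfig`, next to the new transcription toggles. A sketch of a fully specified config; the values are illustrative:

```python
from google.genai import types

config = types.LiveConnectConfig(
    response_modalities=['AUDIO'],
    temperature=0.7,
    top_p=0.95,
    top_k=40,
    max_output_tokens=1024,
    seed=42,  # best-effort reproducibility
    # The empty config objects simply switch transcription on.
    input_audio_transcription=types.AudioTranscriptionConfig(),
    output_audio_transcription=types.AudioTranscriptionConfig(),
)
```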
@@ -9104,6 +9360,37 @@ class LiveConnectConfigDict(TypedDict, total=False):
   modalities that the model can return. Defaults to AUDIO if not specified.
   """
 
+  temperature: Optional[float]
+  """Value that controls the degree of randomness in token selection.
+  Lower temperatures are good for prompts that require a less open-ended or
+  creative response, while higher temperatures can lead to more diverse or
+  creative results.
+  """
+
+  top_p: Optional[float]
+  """Tokens are selected from the most to least probable until the sum
+  of their probabilities equals this value. Use a lower value for less
+  random responses and a higher value for more random responses.
+  """
+
+  top_k: Optional[float]
+  """For each token selection step, the ``top_k`` tokens with the
+  highest probabilities are sampled. Then tokens are further filtered based
+  on ``top_p`` with the final token selected using temperature sampling. Use
+  a lower number for less random responses and a higher number for more
+  random responses.
+  """
+
+  max_output_tokens: Optional[int]
+  """Maximum number of tokens that can be generated in the response.
+  """
+
+  seed: Optional[int]
+  """When ``seed`` is fixed to a specific number, the model makes a best
+  effort to provide the same response for repeated requests. By default, a
+  random number is used.
+  """
+
   speech_config: Optional[SpeechConfigDict]
   """The speech generation configuration.
   """
@@ -9120,5 +9407,14 @@ class LiveConnectConfigDict(TypedDict, total=False):
   external systems to perform an action, or set of actions, outside of
   knowledge and scope of the model."""
 
+  input_audio_transcription: Optional[AudioTranscriptionConfigDict]
+  """The transcription of the input aligns with the input audio language.
+  """
+
+  output_audio_transcription: Optional[AudioTranscriptionConfigDict]
+  """The transcription of the output aligns with the language code
+  specified for the output audio.
+  """
+
 
 LiveConnectConfigOrDict = Union[LiveConnectConfig, LiveConnectConfigDict]