apache-airflow-providers-google 10.2.0rc1__py3-none-any.whl → 10.3.0rc1__py3-none-any.whl
This diff compares the contents of two publicly released versions of the package as they appear in their public registry. It is provided for informational purposes only and reflects the changes between the two versions.
- airflow/providers/google/__init__.py +1 -1
- airflow/providers/google/ads/hooks/ads.py +38 -39
- airflow/providers/google/ads/transfers/ads_to_gcs.py +4 -4
- airflow/providers/google/cloud/_internal_client/secret_manager_client.py +6 -9
- airflow/providers/google/cloud/hooks/bigquery.py +328 -318
- airflow/providers/google/cloud/hooks/cloud_sql.py +66 -22
- airflow/providers/google/cloud/hooks/cloud_storage_transfer_service.py +46 -70
- airflow/providers/google/cloud/hooks/dataflow.py +11 -15
- airflow/providers/google/cloud/hooks/dataform.py +3 -3
- airflow/providers/google/cloud/hooks/dataproc.py +577 -573
- airflow/providers/google/cloud/hooks/functions.py +60 -76
- airflow/providers/google/cloud/hooks/gcs.py +108 -18
- airflow/providers/google/cloud/hooks/kubernetes_engine.py +69 -90
- airflow/providers/google/cloud/links/datafusion.py +4 -3
- airflow/providers/google/cloud/operators/bigquery.py +201 -191
- airflow/providers/google/cloud/operators/bigquery_dts.py +2 -1
- airflow/providers/google/cloud/operators/cloud_build.py +2 -1
- airflow/providers/google/cloud/operators/cloud_composer.py +4 -3
- airflow/providers/google/cloud/operators/cloud_sql.py +62 -28
- airflow/providers/google/cloud/operators/dataflow.py +6 -4
- airflow/providers/google/cloud/operators/dataform.py +3 -2
- airflow/providers/google/cloud/operators/dataproc.py +127 -123
- airflow/providers/google/cloud/operators/dataproc_metastore.py +18 -26
- airflow/providers/google/cloud/operators/gcs.py +35 -13
- airflow/providers/google/cloud/operators/kubernetes_engine.py +92 -42
- airflow/providers/google/cloud/operators/mlengine.py +2 -6
- airflow/providers/google/cloud/operators/vision.py +47 -56
- airflow/providers/google/cloud/sensors/bigquery.py +3 -2
- airflow/providers/google/cloud/sensors/gcs.py +5 -7
- airflow/providers/google/cloud/sensors/pubsub.py +2 -2
- airflow/providers/google/cloud/transfers/bigquery_to_bigquery.py +3 -2
- airflow/providers/google/cloud/transfers/bigquery_to_gcs.py +2 -1
- airflow/providers/google/cloud/transfers/facebook_ads_to_gcs.py +4 -4
- airflow/providers/google/cloud/transfers/gcs_to_bigquery.py +6 -5
- airflow/providers/google/cloud/transfers/gcs_to_gcs.py +46 -7
- airflow/providers/google/cloud/transfers/gcs_to_sftp.py +5 -2
- airflow/providers/google/cloud/triggers/cloud_sql.py +102 -0
- airflow/providers/google/cloud/triggers/kubernetes_engine.py +28 -6
- airflow/providers/google/cloud/utils/bigquery.py +17 -0
- airflow/providers/google/get_provider_info.py +7 -2
- airflow/providers/google/suite/transfers/gcs_to_gdrive.py +4 -0
- airflow/providers/google/suite/transfers/local_to_drive.py +28 -26
- apache_airflow_providers_google-10.3.0rc1.dist-info/METADATA +289 -0
- {apache_airflow_providers_google-10.2.0rc1.dist-info → apache_airflow_providers_google-10.3.0rc1.dist-info}/RECORD +49 -48
- apache_airflow_providers_google-10.2.0rc1.dist-info/METADATA +0 -1824
- {apache_airflow_providers_google-10.2.0rc1.dist-info → apache_airflow_providers_google-10.3.0rc1.dist-info}/LICENSE +0 -0
- {apache_airflow_providers_google-10.2.0rc1.dist-info → apache_airflow_providers_google-10.3.0rc1.dist-info}/NOTICE +0 -0
- {apache_airflow_providers_google-10.2.0rc1.dist-info → apache_airflow_providers_google-10.3.0rc1.dist-info}/WHEEL +0 -0
- {apache_airflow_providers_google-10.2.0rc1.dist-info → apache_airflow_providers_google-10.3.0rc1.dist-info}/entry_points.txt +0 -0
- {apache_airflow_providers_google-10.2.0rc1.dist-info → apache_airflow_providers_google-10.3.0rc1.dist-info}/top_level.txt +0 -0
airflow/providers/google/cloud/sensors/gcs.py

@@ -27,6 +27,7 @@ from typing import TYPE_CHECKING, Any, Callable, Sequence
 from google.api_core.retry import Retry
 from google.cloud.storage.retry import DEFAULT_RETRY
 
+from airflow.configuration import conf
 from airflow.exceptions import AirflowException, AirflowProviderDeprecationWarning
 from airflow.providers.google.cloud.hooks.gcs import GCSHook
 from airflow.providers.google.cloud.triggers.gcs import (
@@ -76,10 +77,9 @@ class GCSObjectExistenceSensor(BaseSensorOperator):
         google_cloud_conn_id: str = "google_cloud_default",
         impersonation_chain: str | Sequence[str] | None = None,
         retry: Retry = DEFAULT_RETRY,
-        deferrable: bool = False,
+        deferrable: bool = conf.getboolean("operators", "default_deferrable", fallback=False),
         **kwargs,
     ) -> None:
-
         super().__init__(**kwargs)
         self.bucket = bucket
         self.object = object
@@ -208,10 +208,9 @@ class GCSObjectUpdateSensor(BaseSensorOperator):
         ts_func: Callable = ts_function,
         google_cloud_conn_id: str = "google_cloud_default",
         impersonation_chain: str | Sequence[str] | None = None,
-        deferrable: bool = False,
+        deferrable: bool = conf.getboolean("operators", "default_deferrable", fallback=False),
         **kwargs,
     ) -> None:
-
         super().__init__(**kwargs)
         self.bucket = bucket
         self.object = object
@@ -298,7 +297,7 @@ class GCSObjectsWithPrefixExistenceSensor(BaseSensorOperator):
         prefix: str,
         google_cloud_conn_id: str = "google_cloud_default",
         impersonation_chain: str | Sequence[str] | None = None,
-        deferrable: bool = False,
+        deferrable: bool = conf.getboolean("operators", "default_deferrable", fallback=False),
         **kwargs,
     ) -> None:
         super().__init__(**kwargs)
@@ -412,10 +411,9 @@ class GCSUploadSessionCompleteSensor(BaseSensorOperator):
         allow_delete: bool = True,
         google_cloud_conn_id: str = "google_cloud_default",
         impersonation_chain: str | Sequence[str] | None = None,
-        deferrable: bool = False,
+        deferrable: bool = conf.getboolean("operators", "default_deferrable", fallback=False),
         **kwargs,
     ) -> None:
-
         super().__init__(**kwargs)
 
         self.bucket = bucket
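All four GCS sensors now derive their `deferrable` default from the `[operators] default_deferrable` setting instead of hard-coding `False`, so deferrable mode can be switched on fleet-wide from configuration. A minimal sketch of the effect (bucket and object names are illustrative):

```python
# airflow.cfg -- or export AIRFLOW__OPERATORS__DEFAULT_DEFERRABLE=true
# [operators]
# default_deferrable = true

from airflow.providers.google.cloud.sensors.gcs import GCSObjectExistenceSensor

# With the setting above, this sensor now defers by default; passing
# deferrable=False explicitly still opts a single task out.
wait_for_object = GCSObjectExistenceSensor(
    task_id="wait_for_object",
    bucket="example-bucket",   # illustrative
    object="data/file.csv",    # illustrative
)
```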
airflow/providers/google/cloud/sensors/pubsub.py

@@ -23,6 +23,7 @@ from typing import TYPE_CHECKING, Any, Callable, Sequence
 
 from google.cloud.pubsub_v1.types import ReceivedMessage
 
+from airflow.configuration import conf
 from airflow.exceptions import AirflowException
 from airflow.providers.google.cloud.hooks.pubsub import PubSubHook
 from airflow.providers.google.cloud.triggers.pubsub import PubsubPullTrigger
@@ -103,10 +104,9 @@ class PubSubPullSensor(BaseSensorOperator):
         messages_callback: Callable[[list[ReceivedMessage], Context], Any] | None = None,
         impersonation_chain: str | Sequence[str] | None = None,
         poke_interval: float = 10.0,
-        deferrable: bool = False,
+        deferrable: bool = conf.getboolean("operators", "default_deferrable", fallback=False),
         **kwargs,
     ) -> None:
-
         super().__init__(**kwargs)
         self.gcp_conn_id = gcp_conn_id
         self.project_id = project_id
airflow/providers/google/cloud/transfers/bigquery_to_bigquery.py

@@ -54,10 +54,11 @@ class BigQueryToBigQueryOperator(BaseOperator):
     :param labels: a dictionary containing labels for the job/query,
         passed to BigQuery
     :param encryption_configuration: [Optional] Custom encryption configuration (e.g., Cloud KMS keys).
-
+
+        .. code-block:: python
 
         encryption_configuration = {
-            "kmsKeyName": "projects/testp/locations/us/keyRings/test-kr/cryptoKeys/test-key"
+            "kmsKeyName": "projects/testp/locations/us/keyRings/test-kr/cryptoKeys/test-key",
         }
     :param location: The geographic location of the job. You must specify the location to run the job if
         the location to run a job is not in the US or the EU multi-regional location or
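The docstring fix above turns the `encryption_configuration` snippet into a proper `.. code-block:: python` directive. For context, a sketch of how that parameter is passed (task id and table names are illustrative; the KMS key path is the one from the docstring):

```python
from airflow.providers.google.cloud.transfers.bigquery_to_bigquery import (
    BigQueryToBigQueryOperator,
)

copy_table = BigQueryToBigQueryOperator(
    task_id="copy_table",  # illustrative
    source_project_dataset_tables="my-project.source_ds.my_table",
    destination_project_dataset_table="my-project.dest_ds.my_table",
    encryption_configuration={
        "kmsKeyName": "projects/testp/locations/us/keyRings/test-kr/cryptoKeys/test-key",
    },
)
```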
airflow/providers/google/cloud/transfers/bigquery_to_gcs.py

@@ -25,6 +25,7 @@ from google.api_core.retry import Retry
 from google.cloud.bigquery import DEFAULT_RETRY, UnknownJob
 
 from airflow import AirflowException
+from airflow.configuration import conf
 from airflow.models import BaseOperator
 from airflow.providers.google.cloud.hooks.bigquery import BigQueryHook, BigQueryJob
 from airflow.providers.google.cloud.links.bigquery import BigQueryTableLink
@@ -114,7 +115,7 @@ class BigQueryToGCSOperator(BaseOperator):
         job_id: str | None = None,
         force_rerun: bool = False,
         reattach_states: set[str] | None = None,
-        deferrable: bool = False,
+        deferrable: bool = conf.getboolean("operators", "default_deferrable", fallback=False),
         **kwargs,
     ) -> None:
         super().__init__(**kwargs)
airflow/providers/google/cloud/transfers/facebook_ads_to_gcs.py

@@ -42,10 +42,10 @@ class FlushAction(Enum):
 
 
 class FacebookAdsReportToGcsOperator(BaseOperator):
-    """
-
-
-
+    """Fetch from Facebook Ads API.
+
+    This converts and saves the data as a temporary JSON file, and uploads the
+    JSON to Google Cloud Storage.
 
     .. seealso::
         For more information on the Facebook Ads API, take a look at the API docs:
airflow/providers/google/cloud/transfers/gcs_to_bigquery.py

@@ -36,6 +36,7 @@ from google.cloud.bigquery import (
 from google.cloud.bigquery.table import EncryptionConfiguration, Table, TableReference
 
 from airflow import AirflowException
+from airflow.configuration import conf
 from airflow.models import BaseOperator
 from airflow.providers.google.cloud.hooks.bigquery import BigQueryHook, BigQueryJob
 from airflow.providers.google.cloud.hooks.gcs import GCSHook
@@ -148,10 +149,11 @@ class GCSToBigQueryOperator(BaseOperator):
         If autodetect is None and no schema is provided (neither via schema_fields
         nor a schema_object), assume the table already exists.
     :param encryption_configuration: [Optional] Custom encryption configuration (e.g., Cloud KMS keys).
-
+
+        .. code-block:: python
 
         encryption_configuration = {
-            "kmsKeyName": "projects/testp/locations/us/keyRings/test-kr/cryptoKeys/test-key"
+            "kmsKeyName": "projects/testp/locations/us/keyRings/test-kr/cryptoKeys/test-key",
         }
     :param location: [Optional] The geographic location of the job. Required except for US and EU.
         See details at https://cloud.google.com/bigquery/docs/locations#specifying_your_location
@@ -177,6 +179,7 @@ class GCSToBigQueryOperator(BaseOperator):
         "schema_object_bucket",
         "destination_project_dataset_table",
         "impersonation_chain",
+        "src_fmt_configs",
     )
     template_ext: Sequence[str] = (".sql",)
     ui_color = "#f0eee4"
@@ -216,7 +219,7 @@ class GCSToBigQueryOperator(BaseOperator):
         impersonation_chain: str | Sequence[str] | None = None,
         labels=None,
         description=None,
-        deferrable: bool = False,
+        deferrable: bool = conf.getboolean("operators", "default_deferrable", fallback=False),
         result_retry: Retry = DEFAULT_RETRY,
         result_timeout: float | None = None,
         cancel_on_kill: bool = True,
@@ -226,7 +229,6 @@ class GCSToBigQueryOperator(BaseOperator):
         project_id: str | None = None,
         **kwargs,
     ) -> None:
-
         super().__init__(**kwargs)
         self.hook: BigQueryHook | None = None
         self.configuration: dict[str, Any] = {}
@@ -716,7 +718,6 @@ class GCSToBigQueryOperator(BaseOperator):
     def _cleanse_time_partitioning(
         self, destination_dataset_table: str | None, time_partitioning_in: dict | None
     ) -> dict:  # if it is a partitioned table ($ is in the table name) add partition load option
-
         if time_partitioning_in is None:
             time_partitioning_in = {}
 
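Adding `src_fmt_configs` to `template_fields` means its values are now rendered through Jinja before the load job is built. A hedged sketch (bucket, table, and variable names are illustrative):

```python
from airflow.providers.google.cloud.transfers.gcs_to_bigquery import GCSToBigQueryOperator

load_csv = GCSToBigQueryOperator(
    task_id="load_csv",  # illustrative
    bucket="example-bucket",
    source_objects=["exports/{{ ds }}/data.csv"],
    destination_project_dataset_table="my-project.my_dataset.my_table",
    # Now templated: this Jinja expression is rendered at run time.
    src_fmt_configs={"nullMarker": "{{ var.value.null_marker }}"},
)
```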
airflow/providers/google/cloud/transfers/gcs_to_gcs.py

@@ -18,9 +18,10 @@
 """This module contains a Google Cloud Storage operator."""
 from __future__ import annotations
 
+import warnings
 from typing import TYPE_CHECKING, Sequence
 
-from airflow.exceptions import AirflowException
+from airflow.exceptions import AirflowException, AirflowProviderDeprecationWarning
 from airflow.models import BaseOperator
 from airflow.providers.google.cloud.hooks.gcs import GCSHook
 
@@ -66,8 +67,8 @@ class GCSToGCSOperator(BaseOperator):
         of copied to the new location. This is the equivalent of a mv command
         as opposed to a cp command.
     :param replace: Whether you want to replace existing destination files or not.
-    :param delimiter: This is used to restrict the result to only the 'files' in a given
-        If source_objects = ['foo/bah/'] and delimiter = '.avro', then only the 'files' in the
+    :param delimiter: (Deprecated) This is used to restrict the result to only the 'files' in a given
+        'folder'. If source_objects = ['foo/bah/'] and delimiter = '.avro', then only the 'files' in the
         folder 'foo/bah/' with '.avro' delimiter will be copied to the destination object.
     :param gcp_conn_id: (Optional) The connection ID used to connect to Google Cloud.
     :param last_modified_time: When specified, the objects will be copied or moved,
@@ -90,6 +91,8 @@ class GCSToGCSOperator(BaseOperator):
         doesn't exist. It doesn't have any effect when the source objects are folders or patterns.
     :param exact_match: When specified, only exact match of the source object (filename) will be
         copied.
+    :param match_glob: (Optional) filters objects based on the glob pattern given by the string (
+        e.g, ``'**/*/.json'``)
 
     :Example:
 
@@ -116,7 +119,7 @@ class GCSToGCSOperator(BaseOperator):
             source_objects=['sales/sales-2017'],
             destination_bucket='data_backup',
             destination_object='copied_sales/2017/',
-
+            match_glob='**/*.avro'
             gcp_conn_id=google_cloud_conn_id
         )
 
@@ -190,15 +193,34 @@ class GCSToGCSOperator(BaseOperator):
         impersonation_chain: str | Sequence[str] | None = None,
         source_object_required=False,
         exact_match=False,
+        match_glob: str | None = None,
         **kwargs,
     ):
         super().__init__(**kwargs)
 
         self.source_bucket = source_bucket
+        if source_object and WILDCARD in source_object:
+            warnings.warn(
+                "Usage of wildcard (*) in 'source_object' is deprecated, utilize 'match_glob' instead",
+                AirflowProviderDeprecationWarning,
+                stacklevel=2,
+            )
         self.source_object = source_object
+        if source_objects and any([WILDCARD in obj for obj in source_objects]):
+            warnings.warn(
+                "Usage of wildcard (*) in 'source_objects' is deprecated, utilize 'match_glob' instead",
+                AirflowProviderDeprecationWarning,
+                stacklevel=2,
+            )
         self.source_objects = source_objects
         self.destination_bucket = destination_bucket
         self.destination_object = destination_object
+        if delimiter:
+            warnings.warn(
+                "Usage of 'delimiter' is deprecated, please use 'match_glob' instead",
+                AirflowProviderDeprecationWarning,
+                stacklevel=2,
+            )
         self.delimiter = delimiter
         self.move_object = move_object
         self.replace = replace
@@ -209,6 +231,7 @@ class GCSToGCSOperator(BaseOperator):
         self.impersonation_chain = impersonation_chain
         self.source_object_required = source_object_required
         self.exact_match = exact_match
+        self.match_glob = match_glob
 
     def execute(self, context: Context):
 
@@ -251,6 +274,7 @@ class GCSToGCSOperator(BaseOperator):
         for prefix in self.source_objects:
             # Check if prefix contains wildcard
             if WILDCARD in prefix:
+
                 self._copy_source_with_wildcard(hook=hook, prefix=prefix)
             # Now search with prefix using provided delimiter if any
             else:
@@ -261,15 +285,19 @@ class GCSToGCSOperator(BaseOperator):
         # and only keep those files which are present in
         # Source GCS bucket and not in Destination GCS bucket
         delimiter = kwargs.get("delimiter")
+        match_glob = kwargs.get("match_glob")
         objects = kwargs.get("objects")
         if self.destination_object is None:
-            existing_objects = hook.list(
+            existing_objects = hook.list(
+                self.destination_bucket, prefix=prefix, delimiter=delimiter, match_glob=match_glob
+            )
         else:
             self.log.info("Replaced destination_object with source_object prefix.")
             destination_objects = hook.list(
                 self.destination_bucket,
                 prefix=self.destination_object,
                 delimiter=delimiter,
+                match_glob=match_glob,
             )
             existing_objects = [
                 dest_object.replace(self.destination_object, prefix, 1) for dest_object in destination_objects
@@ -338,11 +366,15 @@ class GCSToGCSOperator(BaseOperator):
                 gcp_conn_id=google_cloud_conn_id
             )
         """
-        objects = hook.list(
+        objects = hook.list(
+            self.source_bucket, prefix=prefix, delimiter=self.delimiter, match_glob=self.match_glob
+        )
 
         if not self.replace:
             # If we are not replacing, ignore files already existing in source buckets
-            objects = self._ignore_existing_files(
+            objects = self._ignore_existing_files(
+                hook, prefix, objects=objects, delimiter=self.delimiter, match_glob=self.match_glob
+            )
 
         # If objects is empty, and we have prefix, let's check if prefix is a blob
         # and copy directly
@@ -397,11 +429,18 @@ class GCSToGCSOperator(BaseOperator):
             self.log.info("Delimiter ignored because wildcard is in prefix")
         prefix_, delimiter = prefix.split(WILDCARD, 1)
         objects = hook.list(self.source_bucket, prefix=prefix_, delimiter=delimiter)
+        # TODO: After deprecating delimiter and wildcards in source objects,
+        #  remove previous line and uncomment the following:
+        #  match_glob = f"**/*{delimiter}" if delimiter else None
+        #  objects = hook.list(self.source_bucket, prefix=prefix_, match_glob=match_glob)
         if not self.replace:
             # If we are not replacing, list all files in the Destination GCS bucket
             # and only keep those files which are present in
             # Source GCS bucket and not in Destination GCS bucket
             objects = self._ignore_existing_files(hook, prefix_, delimiter=delimiter, objects=objects)
+            # TODO: After deprecating delimiter and wildcards in source objects,
+            #  remove previous line and uncomment the following:
+            #  objects = self._ignore_existing_files(hook, prefix_, match_glob=match_glob, objects=objects)
 
         for source_object in objects:
             if self.destination_object is None:
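Taken together, these hunks deprecate `delimiter` and embedded `*` wildcards in favour of `match_glob`, which is now forwarded to `GCSHook.list()`. A sketch of the migration, reusing the bucket names from the docstring example:

```python
from airflow.providers.google.cloud.transfers.gcs_to_gcs import GCSToGCSOperator

# Before (now emits AirflowProviderDeprecationWarning):
#   source_objects=["sales/sales-2017/*.avro"]   or   delimiter=".avro"
copy_avro = GCSToGCSOperator(
    task_id="copy_avro",  # illustrative
    source_bucket="data",
    source_objects=["sales/sales-2017/"],
    destination_bucket="data_backup",
    destination_object="copied_sales/2017/",
    match_glob="**/*.avro",  # replaces both wildcard and delimiter filtering
)
```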
airflow/providers/google/cloud/transfers/gcs_to_sftp.py

@@ -37,7 +37,7 @@ class GCSToSFTPOperator(BaseOperator):
     """
     Transfer files from a Google Cloud Storage bucket to SFTP server.
 
-
+    .. code-block:: python
 
     with models.DAG(
         "example_gcs_to_sftp",
@@ -145,8 +145,11 @@
 
         prefix, delimiter = self.source_object.split(WILDCARD, 1)
         prefix_dirname = os.path.dirname(prefix)
-
         objects = gcs_hook.list(self.source_bucket, prefix=prefix, delimiter=delimiter)
+        # TODO: After deprecating delimiter and wildcards in source objects,
+        #  remove the previous line and uncomment the following:
+        #  match_glob = f"**/*{delimiter}" if delimiter else None
+        #  objects = gcs_hook.list(self.source_bucket, prefix=prefix, match_glob=match_glob)
 
         for source_object in objects:
             destination_path = self._resolve_destination_path(source_object, prefix=prefix_dirname)
airflow/providers/google/cloud/triggers/cloud_sql.py

@@ -0,0 +1,102 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+"""This module contains Google Cloud SQL triggers."""
+from __future__ import annotations
+
+import asyncio
+from typing import Sequence
+
+from airflow.providers.google.cloud.hooks.cloud_sql import CloudSQLAsyncHook, CloudSqlOperationStatus
+from airflow.triggers.base import BaseTrigger, TriggerEvent
+
+
+class CloudSQLExportTrigger(BaseTrigger):
+    """
+    Trigger that periodically polls information from Cloud SQL API to verify job status.
+    Implementation leverages asynchronous transport.
+    """
+
+    def __init__(
+        self,
+        operation_name: str,
+        project_id: str | None = None,
+        gcp_conn_id: str = "google_cloud_default",
+        impersonation_chain: str | Sequence[str] | None = None,
+        poke_interval: int = 20,
+    ):
+        super().__init__()
+        self.gcp_conn_id = gcp_conn_id
+        self.impersonation_chain = impersonation_chain
+        self.operation_name = operation_name
+        self.project_id = project_id
+        self.poke_interval = poke_interval
+        self.hook = CloudSQLAsyncHook(
+            gcp_conn_id=self.gcp_conn_id,
+            impersonation_chain=self.impersonation_chain,
+        )
+
+    def serialize(self):
+        return (
+            "airflow.providers.google.cloud.triggers.cloud_sql.CloudSQLExportTrigger",
+            {
+                "operation_name": self.operation_name,
+                "project_id": self.project_id,
+                "gcp_conn_id": self.gcp_conn_id,
+                "impersonation_chain": self.impersonation_chain,
+                "poke_interval": self.poke_interval,
+            },
+        )
+
+    async def run(self):
+        while True:
+            try:
+                operation = await self.hook.get_operation(
+                    project_id=self.project_id, operation_name=self.operation_name
+                )
+                if operation["status"] == CloudSqlOperationStatus.DONE:
+                    if "error" in operation:
+                        yield TriggerEvent(
+                            {
+                                "operation_name": operation["name"],
+                                "status": "error",
+                                "message": operation["error"]["message"],
+                            }
+                        )
+                        return
+                    yield TriggerEvent(
+                        {
+                            "operation_name": operation["name"],
+                            "status": "success",
+                        }
+                    )
+                    return
+                else:
+                    self.log.info(
+                        "Operation status is %s, sleeping for %s seconds.",
+                        operation["status"],
+                        self.poke_interval,
+                    )
+                    await asyncio.sleep(self.poke_interval)
+            except Exception as e:
+                self.log.exception("Exception occurred while checking operation status.")
+                yield TriggerEvent(
+                    {
+                        "status": "failed",
+                        "message": str(e),
+                    }
+                )
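`CloudSQLExportTrigger` is designed to be handed off from a deferrable operator: the dict returned by `serialize()` becomes the constructor arguments when the triggerer rebuilds it, and `run()` yields a single `TriggerEvent` when the operation finishes. A hedged sketch of the handoff (the operator class and its values are hypothetical, not part of this diff):

```python
from airflow.models import BaseOperator
from airflow.providers.google.cloud.triggers.cloud_sql import CloudSQLExportTrigger


class _ExampleExportOperator(BaseOperator):
    """Hypothetical deferrable operator; only the handoff is sketched."""

    def execute(self, context):
        operation_name = "sample-operation"  # illustrative
        self.defer(
            trigger=CloudSQLExportTrigger(
                operation_name=operation_name,
                project_id="my-project",  # illustrative
                gcp_conn_id="google_cloud_default",
                impersonation_chain=None,
                poke_interval=20,
            ),
            method_name="execute_complete",
        )

    def execute_complete(self, context, event):
        # Resumed on a worker with the TriggerEvent payload from run();
        # "error" and "failed" events carry a "message" key.
        if event["status"] != "success":
            raise RuntimeError(event["message"])
```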
airflow/providers/google/cloud/triggers/kubernetes_engine.py

@@ -18,11 +18,15 @@
 from __future__ import annotations
 
 import asyncio
+import warnings
 from datetime import datetime
 from typing import Any, AsyncIterator, Sequence
 
 from google.cloud.container_v1.types import Operation
 
+from airflow.exceptions import AirflowProviderDeprecationWarning
+from airflow.providers.cncf.kubernetes.utils.pod_manager import OnFinishAction
+
 try:
     from airflow.providers.cncf.kubernetes.triggers.pod import KubernetesPodTrigger
 except ImportError:
@@ -44,15 +48,19 @@ class GKEStartPodTrigger(KubernetesPodTrigger):
     :param poll_interval: Polling period in seconds to check for the status.
     :param trigger_start_time: time in Datetime format when the trigger was started
     :param in_cluster: run kubernetes client with in_cluster configuration.
-    :param should_delete_pod: What to do when the pod reaches its final
-        state, or the execution is interrupted. If True (default), delete the
-        pod; if False, leave the pod.
     :param get_logs: get the stdout of the container as logs of the tasks.
     :param startup_timeout: timeout in seconds to start up the pod.
     :param base_container_name: The name of the base container in the pod. This container's logs
         will appear as part of this task's logs if get_logs is True. Defaults to None. If None,
         will consult the class variable BASE_CONTAINER_NAME (which defaults to "base") for the base
         container name to use.
+    :param on_finish_action: What to do when the pod reaches its final state, or the execution is interrupted.
+        If "delete_pod", the pod will be deleted regardless it's state; if "delete_succeeded_pod",
+        only succeeded pod will be deleted. You can set to "keep_pod" to keep the pod.
+    :param should_delete_pod: What to do when the pod reaches its final
+        state, or the execution is interrupted. If True (default), delete the
+        pod; if False, leave the pod.
+        Deprecated - use `on_finish_action` instead.
     """
 
     def __init__(
@@ -66,9 +74,10 @@ class GKEStartPodTrigger(KubernetesPodTrigger):
         cluster_context: str | None = None,
         poll_interval: float = 2,
         in_cluster: bool | None = None,
-        should_delete_pod: bool = True,
         get_logs: bool = True,
         startup_timeout: int = 120,
+        on_finish_action: str = "delete_pod",
+        should_delete_pod: bool | None = None,
         *args,
         **kwargs,
     ):
@@ -87,10 +96,22 @@ class GKEStartPodTrigger(KubernetesPodTrigger):
         self.poll_interval = poll_interval
         self.cluster_context = cluster_context
         self.in_cluster = in_cluster
-        self.should_delete_pod = should_delete_pod
         self.get_logs = get_logs
         self.startup_timeout = startup_timeout
 
+        if should_delete_pod is not None:
+            warnings.warn(
+                "`should_delete_pod` parameter is deprecated, please use `on_finish_action`",
+                AirflowProviderDeprecationWarning,
+            )
+            self.on_finish_action = (
+                OnFinishAction.DELETE_POD if should_delete_pod else OnFinishAction.KEEP_POD
+            )
+            self.should_delete_pod = should_delete_pod
+        else:
+            self.on_finish_action = OnFinishAction(on_finish_action)
+            self.should_delete_pod = self.on_finish_action == OnFinishAction.DELETE_POD
+
         self._cluster_url = cluster_url
         self._ssl_ca_cert = ssl_ca_cert
 
@@ -105,11 +126,12 @@ class GKEStartPodTrigger(KubernetesPodTrigger):
                 "poll_interval": self.poll_interval,
                 "cluster_context": self.cluster_context,
                 "in_cluster": self.in_cluster,
-                "should_delete_pod": self.should_delete_pod,
                 "get_logs": self.get_logs,
                 "startup_timeout": self.startup_timeout,
                 "trigger_start_time": self.trigger_start_time,
                 "base_container_name": self.base_container_name,
+                "should_delete_pod": self.should_delete_pod,
+                "on_finish_action": self.on_finish_action.value,
             },
         )
 
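The shim above keeps `should_delete_pod` working while mapping it onto the richer `OnFinishAction` enum from the cncf.kubernetes provider. Roughly, the equivalences are:

```python
from airflow.providers.cncf.kubernetes.utils.pod_manager import OnFinishAction

# should_delete_pod=True   ->  OnFinishAction.DELETE_POD ("delete_pod")
# should_delete_pod=False  ->  OnFinishAction.KEEP_POD ("keep_pod")
# New, with no boolean equivalent: OnFinishAction.DELETE_SUCCEEDED_POD
# ("delete_succeeded_pod"), which deletes only pods that finished successfully.
assert OnFinishAction("delete_pod") is OnFinishAction.DELETE_POD
```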
airflow/providers/google/cloud/utils/bigquery.py

@@ -16,6 +16,8 @@
 # under the License.
 from __future__ import annotations
 
+from typing import Any
+
 
 def bq_cast(string_field: str, bq_type: str) -> None | int | float | bool | str:
     """
@@ -34,3 +36,18 @@ def bq_cast(string_field: str, bq_type: str) -> None | int | float | bool | str:
         return string_field == "true"
     else:
         return string_field
+
+
+def convert_job_id(job_id: str | list[str], project_id: str, location: str | None) -> Any:
+    """
+    Helper method that converts to path: project_id:location:job_id
+    :param project_id: Required. The ID of the Google Cloud project where workspace located.
+    :param location: Optional. The ID of the Google Cloud region where workspace located.
+    :param job_id: Required. The ID of the job.
+    :return: str or list[str] of project_id:location:job_id.
+    """
+    location = location if location else "US"
+    if isinstance(job_id, list):
+        return [f"{project_id}:{location}:{i}" for i in job_id]
+    else:
+        return f"{project_id}:{location}:{job_id}"
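A quick look at the new helper's behaviour (project and job ids are illustrative):

```python
from airflow.providers.google.cloud.utils.bigquery import convert_job_id

convert_job_id("job_1", "my-project", None)
# -> "my-project:US:job_1"   (location falls back to "US")

convert_job_id(["job_1", "job_2"], "my-project", "europe-west1")
# -> ["my-project:europe-west1:job_1", "my-project:europe-west1:job_2"]
```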
airflow/providers/google/get_provider_info.py

@@ -29,6 +29,7 @@ def get_provider_info():
         "description": "Google services including:\n\n - `Google Ads <https://ads.google.com/>`__\n - `Google Cloud (GCP) <https://cloud.google.com/>`__\n - `Google Firebase <https://firebase.google.com/>`__\n - `Google LevelDB <https://github.com/google/leveldb/>`__\n - `Google Marketing Platform <https://marketingplatform.google.com/>`__\n - `Google Workspace <https://workspace.google.com/>`__ (formerly Google Suite)\n",
         "suspended": False,
         "versions": [
+            "10.3.0",
             "10.2.0",
             "10.1.1",
             "10.1.0",
@@ -73,7 +74,7 @@
             "gcloud-aio-auth>=4.0.0,<5.0.0",
             "gcloud-aio-bigquery>=6.1.2",
             "gcloud-aio-storage",
-            "google-ads>=
+            "google-ads>=21.2.0",
             "google-api-core>=2.11.0",
             "google-api-python-client>=1.6.0",
             "google-auth>=1.0.0",
@@ -1075,6 +1076,10 @@
                 "integration-name": "Google Cloud Composer",
                 "python-modules": ["airflow.providers.google.cloud.triggers.cloud_composer"],
             },
+            {
+                "integration-name": "Google Cloud SQL",
+                "python-modules": ["airflow.providers.google.cloud.triggers.cloud_sql"],
+            },
             {
                 "integration-name": "Google Dataflow",
                 "python-modules": ["airflow.providers.google.cloud.triggers.dataflow"],
@@ -1441,7 +1446,7 @@
         ],
         "additional-extras": [
             {"name": "apache.beam", "dependencies": ["apache-beam[gcp]"]},
-            {"name": "cncf.kubernetes", "dependencies": ["apache-airflow-providers-cncf-kubernetes>=
+            {"name": "cncf.kubernetes", "dependencies": ["apache-airflow-providers-cncf-kubernetes>=7.2.0"]},
             {"name": "leveldb", "dependencies": ["plyvel"]},
             {"name": "oracle", "dependencies": ["apache-airflow-providers-oracle>=3.1.0"]},
             {"name": "facebook", "dependencies": ["apache-airflow-providers-facebook>=2.2.0"]},
airflow/providers/google/suite/transfers/gcs_to_gdrive.py

@@ -132,6 +132,10 @@ class GCSToGoogleDriveOperator(BaseOperator):
 
         prefix, delimiter = self.source_object.split(WILDCARD, 1)
         objects = self.gcs_hook.list(self.source_bucket, prefix=prefix, delimiter=delimiter)
+        # TODO: After deprecating delimiter and wildcards in source objects,
+        #  remove the previous line and uncomment the following:
+        #  match_glob = f"**/*{delimiter}" if delimiter else None
+        #  objects = self.gcs_hook.list(self.source_bucket, prefix=prefix, match_glob=match_glob)
 
         for source_object in objects:
             if self.destination_object is None: