ingestr 0.13.75__py3-none-any.whl → 0.14.98__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of ingestr has been flagged as possibly problematic.
- ingestr/main.py +22 -3
- ingestr/src/adjust/__init__.py +4 -4
- ingestr/src/allium/__init__.py +128 -0
- ingestr/src/anthropic/__init__.py +277 -0
- ingestr/src/anthropic/helpers.py +525 -0
- ingestr/src/appstore/__init__.py +1 -0
- ingestr/src/asana_source/__init__.py +1 -1
- ingestr/src/buildinfo.py +1 -1
- ingestr/src/chess/__init__.py +1 -1
- ingestr/src/couchbase_source/__init__.py +118 -0
- ingestr/src/couchbase_source/helpers.py +135 -0
- ingestr/src/cursor/__init__.py +83 -0
- ingestr/src/cursor/helpers.py +188 -0
- ingestr/src/destinations.py +169 -1
- ingestr/src/docebo/__init__.py +589 -0
- ingestr/src/docebo/client.py +435 -0
- ingestr/src/docebo/helpers.py +97 -0
- ingestr/src/elasticsearch/helpers.py +138 -0
- ingestr/src/errors.py +8 -0
- ingestr/src/facebook_ads/__init__.py +26 -23
- ingestr/src/facebook_ads/helpers.py +47 -1
- ingestr/src/factory.py +48 -0
- ingestr/src/filesystem/__init__.py +8 -3
- ingestr/src/filters.py +9 -0
- ingestr/src/fluxx/__init__.py +9906 -0
- ingestr/src/fluxx/helpers.py +209 -0
- ingestr/src/frankfurter/__init__.py +157 -163
- ingestr/src/frankfurter/helpers.py +3 -3
- ingestr/src/freshdesk/__init__.py +25 -8
- ingestr/src/freshdesk/freshdesk_client.py +40 -5
- ingestr/src/fundraiseup/__init__.py +49 -0
- ingestr/src/fundraiseup/client.py +81 -0
- ingestr/src/github/__init__.py +6 -4
- ingestr/src/google_analytics/__init__.py +1 -1
- ingestr/src/hostaway/__init__.py +302 -0
- ingestr/src/hostaway/client.py +288 -0
- ingestr/src/http/__init__.py +35 -0
- ingestr/src/http/readers.py +114 -0
- ingestr/src/hubspot/__init__.py +6 -12
- ingestr/src/influxdb/__init__.py +1 -0
- ingestr/src/intercom/__init__.py +142 -0
- ingestr/src/intercom/helpers.py +674 -0
- ingestr/src/intercom/settings.py +279 -0
- ingestr/src/jira_source/__init__.py +340 -0
- ingestr/src/jira_source/helpers.py +439 -0
- ingestr/src/jira_source/settings.py +170 -0
- ingestr/src/klaviyo/__init__.py +5 -5
- ingestr/src/linear/__init__.py +553 -116
- ingestr/src/linear/helpers.py +77 -38
- ingestr/src/mailchimp/__init__.py +126 -0
- ingestr/src/mailchimp/helpers.py +226 -0
- ingestr/src/mailchimp/settings.py +164 -0
- ingestr/src/masking.py +344 -0
- ingestr/src/monday/__init__.py +246 -0
- ingestr/src/monday/helpers.py +392 -0
- ingestr/src/monday/settings.py +328 -0
- ingestr/src/mongodb/__init__.py +5 -2
- ingestr/src/mongodb/helpers.py +384 -10
- ingestr/src/plusvibeai/__init__.py +335 -0
- ingestr/src/plusvibeai/helpers.py +544 -0
- ingestr/src/plusvibeai/settings.py +252 -0
- ingestr/src/revenuecat/__init__.py +83 -0
- ingestr/src/revenuecat/helpers.py +237 -0
- ingestr/src/salesforce/__init__.py +15 -8
- ingestr/src/shopify/__init__.py +1 -1
- ingestr/src/smartsheets/__init__.py +33 -5
- ingestr/src/socrata_source/__init__.py +83 -0
- ingestr/src/socrata_source/helpers.py +85 -0
- ingestr/src/socrata_source/settings.py +8 -0
- ingestr/src/sources.py +1418 -54
- ingestr/src/stripe_analytics/__init__.py +2 -19
- ingestr/src/wise/__init__.py +68 -0
- ingestr/src/wise/client.py +63 -0
- ingestr/tests/unit/test_smartsheets.py +6 -9
- {ingestr-0.13.75.dist-info → ingestr-0.14.98.dist-info}/METADATA +24 -12
- {ingestr-0.13.75.dist-info → ingestr-0.14.98.dist-info}/RECORD +79 -37
- {ingestr-0.13.75.dist-info → ingestr-0.14.98.dist-info}/WHEEL +0 -0
- {ingestr-0.13.75.dist-info → ingestr-0.14.98.dist-info}/entry_points.txt +0 -0
- {ingestr-0.13.75.dist-info → ingestr-0.14.98.dist-info}/licenses/LICENSE.md +0 -0
ingestr/src/smartsheets/__init__.py

@@ -3,6 +3,22 @@ from typing import Iterable
 import dlt
 import smartsheet  # type: ignore
 from dlt.extract import DltResource
+from smartsheet.models.enums import ColumnType  # type: ignore
+from smartsheet.models.sheet import Sheet  # type: ignore
+
+TYPE_MAPPING = {
+    ColumnType.TEXT_NUMBER: "text",
+    ColumnType.DATE: "date",
+    ColumnType.DATETIME: "timestamp",
+    ColumnType.CONTACT_LIST: "text",
+    ColumnType.CHECKBOX: "bool",
+    ColumnType.PICKLIST: "text",
+    ColumnType.DURATION: "text",
+    ColumnType.PREDECESSOR: "text",
+    ColumnType.ABSTRACT_DATETIME: "timestamp",
+    ColumnType.MULTI_CONTACT_LIST: "text",
+    ColumnType.MULTI_PICKLIST: "text",
+}


 @dlt.source
@@ -34,21 +50,33 @@ def smartsheet_source(
         )
         sheet_name = sheet_details.name
         resource_name = f"sheet_{sheet_name.replace(' ', '_').lower()}"
+        sheet = smartsheet_client.Sheets.get_sheet(sheet_id_int)

         yield dlt.resource(
-            _get_sheet_data(
+            _get_sheet_data(sheet),
             name=resource_name,
+            columns=_generate_type_hints(sheet),
             write_disposition="replace",
         )


-def _get_sheet_data(
+def _get_sheet_data(sheet: Sheet):
     """Helper function to get all rows from a sheet."""
-
-    # Transform rows to a list of dictionaries
+
     column_titles = [col.title for col in sheet.columns]
     for row in sheet.rows:
-        row_data = {}
+        row_data = {"_row_id": row.id}
         for i, cell in enumerate(row.cells):
             row_data[column_titles[i]] = cell.value
         yield row_data
+
+
+def _generate_type_hints(sheet: Sheet):
+    return {
+        col.title: {
+            "data_type": TYPE_MAPPING.get(col.type.value),
+            "nullable": True,
+        }
+        for col in sheet.columns
+        if col.type.value in TYPE_MAPPING
+    }
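For context, the columns=_generate_type_hints(sheet) hint above maps Smartsheet column types to dlt data types via TYPE_MAPPING and marks every column nullable. A minimal sketch of the resulting column schema for a hypothetical sheet (the column titles below are invented for illustration and are not part of the diff):

# Hypothetical output of _generate_type_hints for a sheet with four columns;
# the data_type values follow TYPE_MAPPING above.
columns_hint = {
    "Task Name": {"data_type": "text", "nullable": True},          # TEXT_NUMBER
    "Due Date": {"data_type": "date", "nullable": True},           # DATE
    "Done": {"data_type": "bool", "nullable": True},               # CHECKBOX
    "Last Modified": {"data_type": "timestamp", "nullable": True}, # ABSTRACT_DATETIME
}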
ingestr/src/socrata_source/__init__.py (new file)

@@ -0,0 +1,83 @@
+"""A source loading data from Socrata open data platform"""
+
+from typing import Any, Dict, Iterator, Optional
+
+import dlt
+
+from .helpers import fetch_data
+
+
+@dlt.source(name="socrata", max_table_nesting=0)
+def source(
+    domain: str,
+    dataset_id: str,
+    app_token: Optional[str] = None,
+    username: Optional[str] = None,
+    password: Optional[str] = None,
+    incremental: Optional[Any] = None,
+    primary_key: Optional[str] = None,
+    write_disposition: Optional[str] = dlt.config.value,
+):
+    """
+    A dlt source for the Socrata open data platform.
+
+    Supports both full refresh (replace) and incremental loading (merge).
+
+    Args:
+        domain: The Socrata domain (e.g., "evergreen.data.socrata.com")
+        dataset_id: The dataset identifier (e.g., "6udu-fhnu")
+        app_token: Socrata app token for higher rate limits (recommended)
+        username: Username for authentication (if dataset is private)
+        password: Password for authentication (if dataset is private)
+        incremental: DLT incremental object for incremental loading
+        primary_key: Primary key field for merge operations (default: ":id")
+        write_disposition: Write disposition ("replace", "append", "merge").
+            If not provided, automatically determined based on incremental setting.
+
+    Returns:
+        A dlt source with a single "dataset" resource
+    """
+
+    @dlt.resource(
+        write_disposition=write_disposition or "replace",
+        primary_key=primary_key,  # type: ignore[call-overload]
+    )
+    def dataset(
+        incremental: Optional[dlt.sources.incremental] = incremental,  # type: ignore[type-arg]
+    ) -> Iterator[Dict[str, Any]]:
+        """
+        Yields records from a Socrata dataset.
+
+        Supports both full refresh (replace) and incremental loading (merge).
+        When incremental is provided, filters data using SoQL WHERE clause on the server side.
+
+        Yields:
+            Dict[str, Any]: Individual records from the dataset
+        """
+        fetch_kwargs: Dict[str, Any] = {
+            "domain": domain,
+            "dataset_id": dataset_id,
+            "app_token": app_token,
+            "username": username,
+            "password": password,
+        }
+
+        if incremental and incremental.cursor_path:
+            fetch_kwargs["incremental_key"] = incremental.cursor_path
+            fetch_kwargs["start_value"] = (
+                str(incremental.last_value)
+                if incremental.last_value is not None
+                else None
+            )
+            if getattr(incremental, "end_value", None) is not None:
+                ev = incremental.end_value  # type: ignore[attr-defined]
+                fetch_kwargs["end_value"] = (
+                    ev.isoformat()  # type: ignore[union-attr]
+                    if hasattr(ev, "isoformat")
+                    else str(ev)
+                )
+
+        # Fetch and yield records
+        yield from fetch_data(**fetch_kwargs)
+
+    return (dataset,)
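A minimal usage sketch of the new Socrata source with a dlt pipeline. The pipeline name, destination, dataset name, and cursor field below are assumptions for illustration, not values taken from the release:

import dlt
from ingestr.src.socrata_source import source as socrata_source

# Incrementally load a public dataset into DuckDB, merging on Socrata's :id
# system field and cursoring on :updated_at (assumed cursor for this sketch).
pipeline = dlt.pipeline(
    pipeline_name="socrata_demo",
    destination="duckdb",
    dataset_name="socrata_data",
)

src = socrata_source(
    domain="evergreen.data.socrata.com",
    dataset_id="6udu-fhnu",
    app_token=None,  # recommended for higher rate limits
    incremental=dlt.sources.incremental(":updated_at", initial_value="2024-01-01T00:00:00"),
    primary_key=":id",
    write_disposition="merge",
)

print(pipeline.run(src))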
ingestr/src/socrata_source/helpers.py (new file)

@@ -0,0 +1,85 @@
+"""Socrata API helpers"""
+
+from typing import Any, Dict, Iterator, Optional
+
+from dlt.sources.helpers import requests
+
+from .settings import DEFAULT_PAGE_SIZE, REQUEST_TIMEOUT
+
+
+def fetch_data(
+    domain: str,
+    dataset_id: str,
+    app_token: Optional[str] = None,
+    username: Optional[str] = None,
+    password: Optional[str] = None,
+    incremental_key: Optional[str] = None,
+    start_value: Optional[str] = None,
+    end_value: Optional[str] = None,
+) -> Iterator[Dict[str, Any]]:
+    """
+    Fetch records from Socrata dataset with pagination and optional filtering.
+
+    Uses offset-based pagination to get all records, not just first 50000.
+    Supports incremental loading via SoQL WHERE clause for server-side filtering.
+
+    Args:
+        domain: Socrata domain (e.g., "data.seattle.gov")
+        dataset_id: Dataset identifier (e.g., "6udu-fhnu")
+        app_token: Socrata app token for higher rate limits
+        username: Username for authentication
+        password: Password for authentication
+        start_value: Minimum value for incremental_key (inclusive)
+        end_value: Maximum value for incremental_key (exclusive)
+
+    Yields:
+        Lists of records (one list per page)
+
+    Raises:
+        requests.HTTPError: If API request fails
+    """
+    url = f"https://{domain}/resource/{dataset_id}.json"
+
+    headers = {"Accept": "application/json"}
+    if app_token:
+        headers["X-App-Token"] = app_token
+
+    auth = (username, password) if username and password else None
+
+    limit = DEFAULT_PAGE_SIZE
+    offset = 0
+
+    while True:
+        params: Dict[str, Any] = {"$limit": limit, "$offset": offset}
+
+        if incremental_key and start_value:
+            start_value_iso = str(start_value).replace(" ", "T")
+            where_conditions = [f"{incremental_key} >= '{start_value_iso}'"]
+
+            if end_value:
+                end_value_iso = str(end_value).replace(" ", "T")
+                where_conditions.append(f"{incremental_key} < '{end_value_iso}'")
+
+            params["$where"] = " AND ".join(where_conditions)
+            params["$order"] = f"{incremental_key} ASC"
+
+        response = requests.get(
+            url,
+            headers=headers,
+            auth=auth,
+            params=params,
+            timeout=REQUEST_TIMEOUT,
+        )
+        response.raise_for_status()
+
+        data = response.json()
+
+        if not data:
+            break
+
+        yield data
+
+        if len(data) < limit:
+            break
+
+        offset += limit