ingestr 0.13.54__py3-none-any.whl → 0.13.55__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of ingestr might be problematic. Click here for more details.

ingestr/src/buildinfo.py CHANGED
@@ -1 +1 @@
1
- version = "v0.13.54"
1
+ version = "v0.13.55"
@@ -116,6 +116,8 @@ def facebook_insights_source(
116
116
  batch_size: int = 50,
117
117
  request_timeout: int = 300,
118
118
  app_api_version: str = None,
119
+ start_date: pendulum.DateTime | None = None,
120
+ end_date: pendulum.DateTime | None = None,
119
121
  ) -> DltResource:
120
122
  """Incrementally loads insight reports with defined granularity level, fields, breakdowns etc.
121
123
 
@@ -148,27 +150,32 @@ def facebook_insights_source(
148
150
  account_id, access_token, request_timeout, app_api_version
149
151
  )
150
152
 
151
- # we load with a defined lag
152
- initial_load_start_date = pendulum.today().subtract(days=initial_load_past_days)
153
- initial_load_start_date_str = initial_load_start_date.isoformat()
153
+ if start_date is None:
154
+ start_date = pendulum.today().subtract(days=initial_load_past_days)
155
+
156
+ columns = {}
157
+ for field in fields:
158
+ if field in INSIGHT_FIELDS_TYPES:
159
+ columns[field] = INSIGHT_FIELDS_TYPES[field]
154
160
 
155
161
  @dlt.resource(
156
162
  primary_key=INSIGHTS_PRIMARY_KEY,
157
163
  write_disposition="merge",
158
- columns=INSIGHT_FIELDS_TYPES,
164
+ columns=columns,
159
165
  )
160
166
  def facebook_insights(
161
167
  date_start: dlt.sources.incremental[str] = dlt.sources.incremental(
162
168
  "date_start",
163
- initial_value=initial_load_start_date_str,
169
+ initial_value=start_date.isoformat(),
170
+ end_value=end_date.isoformat() if end_date else None,
164
171
  range_end="closed",
165
172
  range_start="closed",
173
+ lag=attribution_window_days_lag * 24 * 60 * 60, # Convert days to seconds
166
174
  ),
167
175
  ) -> Iterator[TDataItems]:
168
- start_date = get_start_date(date_start, attribution_window_days_lag)
176
+ start_date = get_start_date(date_start)
169
177
  end_date = pendulum.now()
170
178
 
171
- # fetch insights in incremental day steps
172
179
  while start_date <= end_date:
173
180
  query = {
174
181
  "level": level,
@@ -193,7 +200,10 @@ def facebook_insights_source(
193
200
  }
194
201
  ],
195
202
  }
196
- job = execute_job(account.get_insights(params=query, is_async=True))
203
+ job = execute_job(
204
+ account.get_insights(params=query, is_async=True),
205
+ insights_max_async_sleep_seconds=10,
206
+ )
197
207
  yield list(map(process_report_item, job.get_result()))
198
208
  start_date = start_date.add(days=time_increment_days)
199
209
 
@@ -31,14 +31,13 @@ from .settings import (
31
31
 
32
32
  def get_start_date(
33
33
  incremental_start_date: dlt.sources.incremental[str],
34
- attribution_window_days_lag: int = 7,
35
34
  ) -> pendulum.DateTime:
36
35
  """
37
36
  Get the start date for incremental loading of Facebook Insights data.
38
37
  """
39
38
  start_date: pendulum.DateTime = ensure_pendulum_datetime(
40
39
  incremental_start_date.start_value
41
- ).subtract(days=attribution_window_days_lag)
40
+ )
42
41
 
43
42
  # facebook forgets insights so trim the lag and warn
44
43
  min_start_date = pendulum.today().subtract(
@@ -65,7 +64,6 @@ def process_report_item(item: AbstractObject) -> DictStrAny:
65
64
  for pki in INSIGHTS_PRIMARY_KEY:
66
65
  if pki not in d:
67
66
  d[pki] = "no_" + pki
68
-
69
67
  return d
70
68
 
71
69
 
@@ -138,7 +136,7 @@ def execute_job(
138
136
  ) -> AbstractCrudObject:
139
137
  status: str = None
140
138
  time_start = time.time()
141
- sleep_time = 10
139
+ sleep_time = 3
142
140
  while status != "Job Completed":
143
141
  duration = time.time() - time_start
144
142
  job = job.api_get()
@@ -112,6 +112,8 @@ DEFAULT_INSIGHT_FIELDS = (
112
112
  "social_spend",
113
113
  "spend",
114
114
  "website_ctr",
115
+ "conversions",
116
+ "video_thruplay_watched_actions",
115
117
  )
116
118
 
117
119
  TInsightsLevels = Literal["account", "campaign", "adset", "ad"]
@@ -0,0 +1,39 @@
1
+ from typing import Dict
2
+
3
+ import dlt
4
+ from dlt.common.configuration.inject import with_config
5
+ from dlt.sources.helpers import requests
6
+
7
+
8
+ @with_config(sections=("sources", "facebook_ads"))
9
+ def debug_access_token(
10
+ access_token: str = dlt.secrets.value,
11
+ client_id: str = dlt.secrets.value,
12
+ client_secret: str = dlt.secrets.value,
13
+ ) -> str:
14
+ """Debugs the `access_token` providing info on expiration time, scopes etc. If arguments are not provides, `dlt` will inject them from configuration"""
15
+ debug_url = f"https://graph.facebook.com/debug_token?input_token={access_token}&access_token={client_id}|{client_secret}"
16
+ response = requests.get(debug_url)
17
+ data: Dict[str, str] = response.json()
18
+
19
+ if "error" in data:
20
+ raise Exception(f"Error debugging token: {data['error']}")
21
+
22
+ return data["data"]
23
+
24
+
25
+ @with_config(sections=("sources", "facebook_ads"))
26
+ def get_long_lived_token(
27
+ access_token: str = dlt.secrets.value,
28
+ client_id: str = dlt.secrets.value,
29
+ client_secret: str = dlt.secrets.value,
30
+ ) -> str:
31
+ """Gets the long lived access token (60 days) from `access_token`. If arguments are not provides, `dlt` will inject them from configuration"""
32
+ exchange_url = f"https://graph.facebook.com/v13.0/oauth/access_token?grant_type=fb_exchange_token&client_id={client_id}&client_secret={client_secret}&fb_exchange_token={access_token}"
33
+ response = requests.get(exchange_url)
34
+ data: Dict[str, str] = response.json()
35
+
36
+ if "error" in data:
37
+ raise Exception(f"Error refreshing token: {data['error']}")
38
+
39
+ return data["access_token"]
ingestr/src/sources.py CHANGED
@@ -747,11 +747,64 @@ class FacebookAdsSource:
747
747
  endpoint = None
748
748
  if table in ["campaigns", "ad_sets", "ad_creatives", "ads", "leads"]:
749
749
  endpoint = table
750
- elif table in "facebook_insights":
750
+ elif table == "facebook_insights":
751
751
  return facebook_insights_source(
752
752
  access_token=access_token[0],
753
753
  account_id=account_id[0],
754
+ start_date=kwargs.get("interval_start"),
755
+ end_date=kwargs.get("interval_end"),
754
756
  ).with_resources("facebook_insights")
757
+ elif table.startswith("facebook_insights:"):
758
+ # Parse custom breakdowns and metrics from table name
759
+ # Supported formats:
760
+ # facebook_insights:breakdown_type
761
+ # facebook_insights:breakdown_type:metric1,metric2...
762
+ parts = table.split(":")
763
+
764
+ if len(parts) < 2 or len(parts) > 3:
765
+ raise ValueError(
766
+ "Invalid facebook_insights format. Expected: facebook_insights:breakdown_type or facebook_insights:breakdown_type:metric1,metric2..."
767
+ )
768
+
769
+ breakdown_type = parts[1].strip()
770
+ if not breakdown_type:
771
+ raise ValueError(
772
+ "Breakdown type must be provided in format: facebook_insights:breakdown_type"
773
+ )
774
+
775
+ # Validate breakdown type against available options from settings
776
+ import typing
777
+
778
+ from ingestr.src.facebook_ads.settings import TInsightsBreakdownOptions
779
+
780
+ # Get valid breakdown options from the type definition
781
+ valid_breakdowns = list(typing.get_args(TInsightsBreakdownOptions))
782
+
783
+ if breakdown_type not in valid_breakdowns:
784
+ raise ValueError(
785
+ f"Invalid breakdown type '{breakdown_type}'. Valid options: {', '.join(valid_breakdowns)}"
786
+ )
787
+
788
+ source_kwargs = {
789
+ "access_token": access_token[0],
790
+ "account_id": account_id[0],
791
+ "start_date": kwargs.get("interval_start"),
792
+ "end_date": kwargs.get("interval_end"),
793
+ "breakdowns": breakdown_type,
794
+ }
795
+
796
+ # If custom metrics are provided, parse them
797
+ if len(parts) == 3:
798
+ fields = [f.strip() for f in parts[2].split(",") if f.strip()]
799
+ if not fields:
800
+ raise ValueError(
801
+ "Custom metrics must be provided after the second colon in format: facebook_insights:breakdown_type:metric1,metric2..."
802
+ )
803
+ source_kwargs["fields"] = fields
804
+
805
+ return facebook_insights_source(**source_kwargs).with_resources(
806
+ "facebook_insights"
807
+ )
755
808
  else:
756
809
  raise ValueError(
757
810
  f"Resource '{table}' is not supported for Facebook Ads source yet, if you are interested in it please create a GitHub issue at https://github.com/bruin-data/ingestr"
@@ -85,12 +85,14 @@ def incremental_stripe_source(
85
85
  created: Optional[Any] = dlt.sources.incremental(
86
86
  "created",
87
87
  initial_value=start_date_unix,
88
+ end_value=transform_date(end_date) if end_date is not None else None,
88
89
  range_end="closed",
89
90
  range_start="closed",
90
91
  ),
91
92
  ) -> Generator[Dict[Any, Any], Any, None]:
92
- start_value = created.last_value
93
- yield from pagination(endpoint, start_date=start_value, end_date=end_date)
93
+ yield from pagination(
94
+ endpoint, start_date=created.last_value, end_date=created.end_value
95
+ )
94
96
 
95
97
  for endpoint in endpoints:
96
98
  yield dlt.resource(
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: ingestr
3
- Version: 0.13.54
3
+ Version: 0.13.55
4
4
  Summary: ingestr is a command-line application that ingests data from various sources and stores them in any database.
5
5
  Project-URL: Homepage, https://github.com/bruin-data/ingestr
6
6
  Project-URL: Issues, https://github.com/bruin-data/ingestr/issues
@@ -2,7 +2,7 @@ ingestr/conftest.py,sha256=Q03FIJIZpLBbpj55cfCHIKEjc1FCvWJhMF2cidUJKQU,1748
2
2
  ingestr/main.py,sha256=GkC1hdq8AVGrvolc95zMfjmibI95p2pmFkbgCOVf-Og,26311
3
3
  ingestr/src/.gitignore,sha256=8cX1AZTSI0TcdZFGTmS_oyBjpfCzhOEt0DdAo2dFIY8,203
4
4
  ingestr/src/blob.py,sha256=onMe5ZHxPXTdcB_s2oGNdMo-XQJ3ajwOsWE9eSTGFmc,1495
5
- ingestr/src/buildinfo.py,sha256=5aqjzKmdujvelIHbUBjqDKLXcEB2hEdLvQ6BJyTyZ1Q,21
5
+ ingestr/src/buildinfo.py,sha256=bdi0-mZhnHheYgs6WuEb8p-RIk_RFAXRCF9HalRfV0k,21
6
6
  ingestr/src/destinations.py,sha256=TcxM2rcwHfgMMP6U0yRNcfWKlEzkBbZbqCIDww7lkTY,16882
7
7
  ingestr/src/errors.py,sha256=Ufs4_DfE77_E3vnA1fOQdi6cmuLVNm7_SbFLkL1XPGk,686
8
8
  ingestr/src/factory.py,sha256=mcjgbmrZr6TvP9fCMQxo-aMGcrb2PqToRcSLp5nldww,6138
@@ -11,7 +11,7 @@ ingestr/src/http_client.py,sha256=bxqsk6nJNXCo-79gW04B53DQO-yr25vaSsqP0AKtjx4,73
11
11
  ingestr/src/loader.py,sha256=9NaWAyfkXdqAZSS-N72Iwo36Lbx4PyqIfaaH1dNdkFs,1712
12
12
  ingestr/src/partition.py,sha256=BrIP6wFJvyR7Nus_3ElnfxknUXeCipK_E_bB8kZowfc,969
13
13
  ingestr/src/resource.py,sha256=ZqmZxFQVGlF8rFPhBiUB08HES0yoTj8sZ--jKfaaVps,1164
14
- ingestr/src/sources.py,sha256=Nwx66jQwqjovLomZIVwIVNLSBy8KgqGhu4-spPHp7ZM,91785
14
+ ingestr/src/sources.py,sha256=3ozLt9lhhNANspfjA2vb8u6qjgBJezH8QBV1XKqT1fg,94124
15
15
  ingestr/src/table_definition.py,sha256=REbAbqdlmUMUuRh8nEQRreWjPVOQ5ZcfqGkScKdCrmk,390
16
16
  ingestr/src/time.py,sha256=H_Fk2J4ShXyUM-EMY7MqCLZQhlnZMZvO952bmZPc4yE,254
17
17
  ingestr/src/version.py,sha256=J_2xgZ0mKlvuHcjdKCx2nlioneLH0I47JiU_Slr_Nwc,189
@@ -39,10 +39,11 @@ ingestr/src/chess/settings.py,sha256=p0RlCGgtXUacPDEvZmwzSWmzX0Apj1riwfz-nrMK89k
39
39
  ingestr/src/collector/spinner.py,sha256=_ZUqF5MI43hVIULdjF5s5mrAZbhEFXaiWirQmrv3Yk4,1201
40
40
  ingestr/src/dynamodb/__init__.py,sha256=swhxkeYBbJ35jn1IghCtvYWT2BM33KynVCh_oR4z28A,2264
41
41
  ingestr/src/elasticsearch/__init__.py,sha256=m-q93HgUmTwGDUwHOjHawstWL06TC3WIX3H05szybrY,2556
42
- ingestr/src/facebook_ads/__init__.py,sha256=reEpSr4BaKA1wO3qVgCH51gW-TgWkbJ_g24UIhJWbac,9286
42
+ ingestr/src/facebook_ads/__init__.py,sha256=a1A5fO1r_FotoH9UET42tamqo_-ftCm9vBrkm5lpjG0,9579
43
43
  ingestr/src/facebook_ads/exceptions.py,sha256=4Nlbc0Mv3i5g-9AoyT-n1PIa8IDi3VCTfEAzholx4Wc,115
44
- ingestr/src/facebook_ads/helpers.py,sha256=ZLbNHiKer5lPb4g3_435XeBJr57Wv0o1KTyBA1mQ100,9068
45
- ingestr/src/facebook_ads/settings.py,sha256=1IxZeP_4rN3IBvAncNHOoqpzAirx0Hz-MUK_tl6UTFk,4881
44
+ ingestr/src/facebook_ads/helpers.py,sha256=EYqOAPUlhVNxwzjP_CUGjJvAXTq65nJC-v75BfyJKmg,8981
45
+ ingestr/src/facebook_ads/settings.py,sha256=Bsic8RcmH-NfEZ7r_NGospTCmwISK9XaMT5y2NZirtg,4938
46
+ ingestr/src/facebook_ads/utils.py,sha256=ES2ylPoW3j3fjp6OMUgp21n1cG1OktXsmWWMk5vBW_I,1590
46
47
  ingestr/src/filesystem/__init__.py,sha256=zkIwbRr0ir0EUdniI25p2zGiVc-7M9EmR351AjNb0eA,4163
47
48
  ingestr/src/filesystem/helpers.py,sha256=bg0muSHZr3hMa8H4jN2-LGWzI-SUoKlQNiWJ74-YYms,3211
48
49
  ingestr/src/filesystem/readers.py,sha256=a0fKkaRpnAOGsXI3EBNYZa7x6tlmAOsgRzb883StY30,3987
@@ -116,7 +117,7 @@ ingestr/src/solidgate/__init__.py,sha256=JdaXvAu5QGuf9-FY294vwCQCEmfrqIld9oqbzqC
116
117
  ingestr/src/solidgate/helpers.py,sha256=oePEc9nnvmN3IaKrfJCvyKL79xdGM0-gRTN3-8tY4Fc,4952
117
118
  ingestr/src/sql_database/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
118
119
  ingestr/src/sql_database/callbacks.py,sha256=sEFFmXxAURY3yeBjnawigDtq9LBCvi8HFqG4kLd7tMU,2002
119
- ingestr/src/stripe_analytics/__init__.py,sha256=FBkZu5op5Z-FceEi4zG7qcAgZfUYJRPMVPPrPMjvmXw,4502
120
+ ingestr/src/stripe_analytics/__init__.py,sha256=j3Vmvo8G75fJJIF4rUnpGliGTpYQZt372wo-AjGImYs,4581
120
121
  ingestr/src/stripe_analytics/helpers.py,sha256=iqZOyiGIOhOAhVXXU16DP0hkkTKcTrDu69vAJoTxgEo,1976
121
122
  ingestr/src/stripe_analytics/settings.py,sha256=ZahhZg3Sq2KnvnDcfSaXO494Csy3tElBDEHnvA1AVmA,2461
122
123
  ingestr/src/telemetry/event.py,sha256=W7bs4uVfPakQ5otmiqgqu1l5SqjYx1p87wudnWXckBc,949
@@ -138,8 +139,8 @@ ingestr/testdata/merge_expected.csv,sha256=DReHqWGnQMsf2PBv_Q2pfjsgvikYFnf1zYcQZ
138
139
  ingestr/testdata/merge_part1.csv,sha256=Pw8Z9IDKcNU0qQHx1z6BUf4rF_-SxKGFOvymCt4OY9I,185
139
140
  ingestr/testdata/merge_part2.csv,sha256=T_GiWxA81SN63_tMOIuemcvboEFeAmbKc7xRXvL9esw,287
140
141
  ingestr/tests/unit/test_smartsheets.py,sha256=eiC2CCO4iNJcuN36ONvqmEDryCA1bA1REpayHpu42lk,5058
141
- ingestr-0.13.54.dist-info/METADATA,sha256=5RaRSmJX-SiZV9iFYz3cSkiuZp0GXQ2ij9whkbQHFs8,15131
142
- ingestr-0.13.54.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
143
- ingestr-0.13.54.dist-info/entry_points.txt,sha256=oPJy0KBnPWYjDtP1k8qwAihcTLHSZokSQvRAw_wtfJM,46
144
- ingestr-0.13.54.dist-info/licenses/LICENSE.md,sha256=cW8wIhn8HFE-KLStDF9jHQ1O_ARWP3kTpk_-eOccL24,1075
145
- ingestr-0.13.54.dist-info/RECORD,,
142
+ ingestr-0.13.55.dist-info/METADATA,sha256=WNMM4qLCTDJg4xUnYNefHffB6vidRl4xopoBaaux-FM,15131
143
+ ingestr-0.13.55.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
144
+ ingestr-0.13.55.dist-info/entry_points.txt,sha256=oPJy0KBnPWYjDtP1k8qwAihcTLHSZokSQvRAw_wtfJM,46
145
+ ingestr-0.13.55.dist-info/licenses/LICENSE.md,sha256=cW8wIhn8HFE-KLStDF9jHQ1O_ARWP3kTpk_-eOccL24,1075
146
+ ingestr-0.13.55.dist-info/RECORD,,