ingestr 0.10.3__tar.gz → 0.12.1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of ingestr might be problematic. Click here for more details.

Files changed (180) hide show
  1. {ingestr-0.10.3 → ingestr-0.12.1}/Makefile +6 -2
  2. {ingestr-0.10.3 → ingestr-0.12.1}/PKG-INFO +17 -5
  3. {ingestr-0.10.3 → ingestr-0.12.1}/README.md +13 -3
  4. {ingestr-0.10.3 → ingestr-0.12.1}/docs/.vitepress/config.mjs +3 -1
  5. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/adjust.md +2 -2
  6. ingestr-0.12.1/docs/supported-sources/asana.md +58 -0
  7. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/athena.md +1 -1
  8. ingestr-0.12.1/docs/supported-sources/dynamodb.md +90 -0
  9. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/gorgias.md +1 -1
  10. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/gsheets.md +1 -1
  11. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/kafka.md +1 -1
  12. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/klaviyo.md +2 -2
  13. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/notion.md +1 -1
  14. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/shopify.md +1 -1
  15. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/stripe.md +1 -1
  16. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/zendesk.md +2 -2
  17. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/main.py +1 -2
  18. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/adjust/__init__.py +4 -1
  19. ingestr-0.12.1/ingestr/src/asana_source/__init__.py +264 -0
  20. ingestr-0.12.1/ingestr/src/asana_source/helpers.py +16 -0
  21. ingestr-0.12.1/ingestr/src/asana_source/settings.py +144 -0
  22. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/chess/__init__.py +1 -1
  23. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/destinations.py +8 -1
  24. ingestr-0.12.1/ingestr/src/dynamodb/__init__.py +86 -0
  25. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/factory.py +46 -58
  26. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/hubspot/__init__.py +1 -1
  27. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/sources.py +182 -5
  28. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/stripe_analytics/__init__.py +1 -1
  29. ingestr-0.12.1/ingestr/src/tiktok_ads/__init__.py +106 -0
  30. ingestr-0.12.1/ingestr/src/tiktok_ads/tiktok_helpers.py +112 -0
  31. ingestr-0.12.1/ingestr/src/time.py +11 -0
  32. ingestr-0.12.1/ingestr/src/version.py +1 -0
  33. {ingestr-0.10.3 → ingestr-0.12.1}/pyproject.toml +8 -0
  34. {ingestr-0.10.3 → ingestr-0.12.1}/requirements-dev.txt +4 -3
  35. {ingestr-0.10.3 → ingestr-0.12.1}/requirements.txt +2 -1
  36. ingestr-0.10.3/ingestr/src/version.py +0 -1
  37. {ingestr-0.10.3 → ingestr-0.12.1}/.dockerignore +0 -0
  38. {ingestr-0.10.3 → ingestr-0.12.1}/.githooks/pre-commit-hook.sh +0 -0
  39. {ingestr-0.10.3 → ingestr-0.12.1}/.github/workflows/deploy-docs.yml +0 -0
  40. {ingestr-0.10.3 → ingestr-0.12.1}/.github/workflows/secrets-scan.yml +0 -0
  41. {ingestr-0.10.3 → ingestr-0.12.1}/.github/workflows/tests.yml +0 -0
  42. {ingestr-0.10.3 → ingestr-0.12.1}/.gitignore +0 -0
  43. {ingestr-0.10.3 → ingestr-0.12.1}/.gitleaksignore +0 -0
  44. {ingestr-0.10.3 → ingestr-0.12.1}/.python-version +0 -0
  45. {ingestr-0.10.3 → ingestr-0.12.1}/.vale.ini +0 -0
  46. {ingestr-0.10.3 → ingestr-0.12.1}/Dockerfile +0 -0
  47. {ingestr-0.10.3 → ingestr-0.12.1}/LICENSE.md +0 -0
  48. {ingestr-0.10.3 → ingestr-0.12.1}/docs/.vitepress/theme/custom.css +0 -0
  49. {ingestr-0.10.3 → ingestr-0.12.1}/docs/.vitepress/theme/index.js +0 -0
  50. {ingestr-0.10.3 → ingestr-0.12.1}/docs/commands/example-uris.md +0 -0
  51. {ingestr-0.10.3 → ingestr-0.12.1}/docs/commands/ingest.md +0 -0
  52. {ingestr-0.10.3 → ingestr-0.12.1}/docs/getting-started/core-concepts.md +0 -0
  53. {ingestr-0.10.3 → ingestr-0.12.1}/docs/getting-started/incremental-loading.md +0 -0
  54. {ingestr-0.10.3 → ingestr-0.12.1}/docs/getting-started/quickstart.md +0 -0
  55. {ingestr-0.10.3 → ingestr-0.12.1}/docs/getting-started/telemetry.md +0 -0
  56. {ingestr-0.10.3 → ingestr-0.12.1}/docs/index.md +0 -0
  57. {ingestr-0.10.3 → ingestr-0.12.1}/docs/media/athena.png +0 -0
  58. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/airtable.md +0 -0
  59. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/appsflyer.md +0 -0
  60. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/bigquery.md +0 -0
  61. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/chess.md +0 -0
  62. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/csv.md +0 -0
  63. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/databricks.md +0 -0
  64. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/duckdb.md +0 -0
  65. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/facebook-ads.md +0 -0
  66. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/hubspot.md +0 -0
  67. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/mongodb.md +0 -0
  68. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/mssql.md +0 -0
  69. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/mysql.md +0 -0
  70. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/oracle.md +0 -0
  71. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/postgres.md +0 -0
  72. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/redshift.md +0 -0
  73. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/s3.md +0 -0
  74. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/sap-hana.md +0 -0
  75. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/slack.md +0 -0
  76. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/snowflake.md +0 -0
  77. {ingestr-0.10.3 → ingestr-0.12.1}/docs/supported-sources/sqlite.md +0 -0
  78. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/.gitignore +0 -0
  79. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/adjust/adjust_helpers.py +0 -0
  80. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/airtable/__init__.py +0 -0
  81. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/appsflyer/_init_.py +0 -0
  82. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/appsflyer/client.py +0 -0
  83. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/arrow/__init__.py +0 -0
  84. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/chess/helpers.py +0 -0
  85. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/chess/settings.py +0 -0
  86. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/facebook_ads/__init__.py +0 -0
  87. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/facebook_ads/exceptions.py +0 -0
  88. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/facebook_ads/helpers.py +0 -0
  89. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/facebook_ads/settings.py +0 -0
  90. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/filesystem/__init__.py +0 -0
  91. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/filesystem/helpers.py +0 -0
  92. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/filesystem/readers.py +0 -0
  93. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/filters.py +0 -0
  94. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/google_sheets/README.md +0 -0
  95. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/google_sheets/__init__.py +0 -0
  96. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/google_sheets/helpers/__init__.py +0 -0
  97. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/google_sheets/helpers/api_calls.py +0 -0
  98. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/google_sheets/helpers/data_processing.py +0 -0
  99. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/gorgias/__init__.py +0 -0
  100. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/gorgias/helpers.py +0 -0
  101. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/hubspot/helpers.py +0 -0
  102. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/hubspot/settings.py +0 -0
  103. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/kafka/__init__.py +0 -0
  104. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/kafka/helpers.py +0 -0
  105. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/klaviyo/_init_.py +0 -0
  106. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/klaviyo/client.py +0 -0
  107. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/klaviyo/helpers.py +0 -0
  108. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/mongodb/__init__.py +0 -0
  109. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/mongodb/helpers.py +0 -0
  110. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/notion/__init__.py +0 -0
  111. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/notion/helpers/__init__.py +0 -0
  112. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/notion/helpers/client.py +0 -0
  113. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/notion/helpers/database.py +0 -0
  114. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/notion/settings.py +0 -0
  115. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/shopify/__init__.py +0 -0
  116. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/shopify/exceptions.py +0 -0
  117. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/shopify/helpers.py +0 -0
  118. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/shopify/settings.py +0 -0
  119. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/slack/__init__.py +0 -0
  120. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/slack/helpers.py +0 -0
  121. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/slack/settings.py +0 -0
  122. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/stripe_analytics/helpers.py +0 -0
  123. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/stripe_analytics/settings.py +0 -0
  124. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/table_definition.py +0 -0
  125. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/telemetry/event.py +0 -0
  126. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/testdata/fakebqcredentials.json +0 -0
  127. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/zendesk/__init__.py +0 -0
  128. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/zendesk/helpers/__init__.py +0 -0
  129. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/zendesk/helpers/api_helpers.py +0 -0
  130. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/zendesk/helpers/credentials.py +0 -0
  131. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/zendesk/helpers/talk_api.py +0 -0
  132. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/src/zendesk/settings.py +0 -0
  133. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/testdata/.gitignore +0 -0
  134. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/testdata/create_replace.csv +0 -0
  135. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/testdata/delete_insert_expected.csv +0 -0
  136. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/testdata/delete_insert_part1.csv +0 -0
  137. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/testdata/delete_insert_part2.csv +0 -0
  138. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/testdata/merge_expected.csv +0 -0
  139. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/testdata/merge_part1.csv +0 -0
  140. {ingestr-0.10.3 → ingestr-0.12.1}/ingestr/testdata/merge_part2.csv +0 -0
  141. {ingestr-0.10.3 → ingestr-0.12.1}/package-lock.json +0 -0
  142. {ingestr-0.10.3 → ingestr-0.12.1}/package.json +0 -0
  143. {ingestr-0.10.3 → ingestr-0.12.1}/resources/demo.gif +0 -0
  144. {ingestr-0.10.3 → ingestr-0.12.1}/resources/demo.tape +0 -0
  145. {ingestr-0.10.3 → ingestr-0.12.1}/resources/ingestr.svg +0 -0
  146. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/AMPM.yml +0 -0
  147. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Acronyms.yml +0 -0
  148. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Colons.yml +0 -0
  149. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Contractions.yml +0 -0
  150. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/DateFormat.yml +0 -0
  151. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Ellipses.yml +0 -0
  152. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/EmDash.yml +0 -0
  153. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Exclamation.yml +0 -0
  154. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/FirstPerson.yml +0 -0
  155. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Gender.yml +0 -0
  156. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/GenderBias.yml +0 -0
  157. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/HeadingPunctuation.yml +0 -0
  158. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Headings.yml +0 -0
  159. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Latin.yml +0 -0
  160. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/LyHyphens.yml +0 -0
  161. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/OptionalPlurals.yml +0 -0
  162. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Ordinal.yml +0 -0
  163. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/OxfordComma.yml +0 -0
  164. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Parens.yml +0 -0
  165. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Passive.yml +0 -0
  166. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Periods.yml +0 -0
  167. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Quotes.yml +0 -0
  168. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Ranges.yml +0 -0
  169. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Semicolons.yml +0 -0
  170. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Slang.yml +0 -0
  171. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Spacing.yml +0 -0
  172. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Spelling.yml +0 -0
  173. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Units.yml +0 -0
  174. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/We.yml +0 -0
  175. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/Will.yml +0 -0
  176. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/WordList.yml +0 -0
  177. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/meta.json +0 -0
  178. {ingestr-0.10.3 → ingestr-0.12.1}/styles/Google/vocab.txt +0 -0
  179. {ingestr-0.10.3 → ingestr-0.12.1}/styles/bruin/Ingestr.yml +0 -0
  180. {ingestr-0.10.3 → ingestr-0.12.1}/styles/config/vocabularies/bruin/accept.txt +0 -0
@@ -1,5 +1,5 @@
1
1
  .ONESHELL:
2
- .PHONY: test lint format test-ci lint-ci build upload-release setup
2
+ .PHONY: test lint format test-ci lint-ci build upload-release setup docker-shell
3
3
 
4
4
  venv: venv/touchfile
5
5
 
@@ -43,4 +43,8 @@ upload-release:
43
43
 
44
44
  setup:
45
45
  @echo "installing git hooks ..."
46
- @install -m 755 .githooks/pre-commit-hook.sh .git/hooks/pre-commit
46
+ @install -m 755 .githooks/pre-commit-hook.sh .git/hooks/pre-commit
47
+
48
+ docker-shell:
49
+ # run a docker container to build and run ingestr
50
+ @docker run -v $(PWD):/root/code -w /root/code -it --rm --entrypoint /bin/bash python:3.11
@@ -1,10 +1,11 @@
1
- Metadata-Version: 2.3
1
+ Metadata-Version: 2.4
2
2
  Name: ingestr
3
- Version: 0.10.3
3
+ Version: 0.12.1
4
4
  Summary: ingestr is a command-line application that ingests data from various sources and stores them in any database.
5
5
  Project-URL: Homepage, https://github.com/bruin-data/ingestr
6
6
  Project-URL: Issues, https://github.com/bruin-data/ingestr/issues
7
7
  Author-email: Burak Karakan <burak.karakan@getbruin.com>
8
+ License-File: LICENSE.md
8
9
  Classifier: Development Status :: 4 - Beta
9
10
  Classifier: Environment :: Console
10
11
  Classifier: Intended Audience :: Developers
@@ -13,6 +14,7 @@ Classifier: Operating System :: OS Independent
13
14
  Classifier: Programming Language :: Python :: 3
14
15
  Classifier: Topic :: Database
15
16
  Requires-Python: >=3.9
17
+ Requires-Dist: asana==3.2.3
16
18
  Requires-Dist: confluent-kafka>=2.6.1
17
19
  Requires-Dist: databricks-sql-connector==2.9.3
18
20
  Requires-Dist: dlt==1.4.0
@@ -199,7 +201,7 @@ Pull requests are welcome. However, please open an issue first to discuss what y
199
201
  <tr>
200
202
  <td colspan="3" style='text-align:center;'><strong>Platforms</strong></td>
201
203
  </tr>
202
- <td>Adjust</td>
204
+ <td>Adjust</td>
203
205
  <td>✅</td>
204
206
  <td>-</td>
205
207
  <tr>
@@ -207,17 +209,27 @@ Pull requests are welcome. However, please open an issue first to discuss what y
207
209
  <td>✅</td>
208
210
  <td>-</td>
209
211
  </tr>
210
- <tr>
212
+ <tr>
211
213
  <td>AppsFlyer</td>
212
214
  <td>✅</td>
213
215
  <td>-</td>
214
216
  </tr>
217
+ <tr>
218
+ <td>Asana</td>
219
+ <td>✅</td>
220
+ <td>-</td>
221
+ </tr>
215
222
  <tr>
216
223
  <td>Chess.com</td>
217
224
  <td>✅</td>
218
225
  <td>-</td>
219
226
  </tr>
220
- <tr>
227
+ <tr>
228
+ <td>DynamoDB</td>
229
+ <td>✅</td>
230
+ <td>-</td>
231
+ </tr>
232
+ <tr>
221
233
  <td>Facebook Ads</td>
222
234
  <td>✅</td>
223
235
  <td>-</td>
@@ -146,7 +146,7 @@ Pull requests are welcome. However, please open an issue first to discuss what y
146
146
  <tr>
147
147
  <td colspan="3" style='text-align:center;'><strong>Platforms</strong></td>
148
148
  </tr>
149
- <td>Adjust</td>
149
+ <td>Adjust</td>
150
150
  <td>✅</td>
151
151
  <td>-</td>
152
152
  <tr>
@@ -154,17 +154,27 @@ Pull requests are welcome. However, please open an issue first to discuss what y
154
154
  <td>✅</td>
155
155
  <td>-</td>
156
156
  </tr>
157
- <tr>
157
+ <tr>
158
158
  <td>AppsFlyer</td>
159
159
  <td>✅</td>
160
160
  <td>-</td>
161
161
  </tr>
162
+ <tr>
163
+ <td>Asana</td>
164
+ <td>✅</td>
165
+ <td>-</td>
166
+ </tr>
162
167
  <tr>
163
168
  <td>Chess.com</td>
164
169
  <td>✅</td>
165
170
  <td>-</td>
166
171
  </tr>
167
- <tr>
172
+ <tr>
173
+ <td>DynamoDB</td>
174
+ <td>✅</td>
175
+ <td>-</td>
176
+ </tr>
177
+ <tr>
168
178
  <td>Facebook Ads</td>
169
179
  <td>✅</td>
170
180
  <td>-</td>
@@ -57,7 +57,7 @@ export default defineConfig({
57
57
  text: "Databases",
58
58
  collapsed: false,
59
59
  items: [
60
- { text: "Athena", link: "/supported-sources/athena.md" },
60
+ { text: "AWS Athena", link: "/supported-sources/athena.md" },
61
61
  { text: "AWS Redshift", link: "/supported-sources/redshift.md" },
62
62
  { text: "Databricks", link: "/supported-sources/databricks.md" },
63
63
  { text: "DuckDB", link: "/supported-sources/duckdb.md" },
@@ -88,7 +88,9 @@ export default defineConfig({
88
88
  { text: "Adjust", link: "/supported-sources/adjust.md" },
89
89
  { text: "Airtable", link: "/supported-sources/airtable.md" },
90
90
  { text: "AppsFlyer", link: "/supported-sources/appsflyer.md" },
91
+ { text: "Asana", link: "/supported-sources/asana.md" },
91
92
  { text: "Chess.com", link: "/supported-sources/chess.md" },
93
+ { text: "DynamoDB", link: "/supported-sources/dynamodb.md" },
92
94
  {
93
95
  text: "Facebook Ads",
94
96
  link: "/supported-sources/facebook-ads.md",
@@ -62,7 +62,7 @@ ingestr ingest \
62
62
  --source-uri 'adjust://?api_key=nr_123' \
63
63
  --source-table 'campaigns' \
64
64
  --dest-uri duckdb:///adjust.duckdb \
65
- --dest-table 'adjust.output'
65
+ --dest-table 'dest.output'
66
66
  ```
67
67
 
68
68
  Copy creatives data from Adjust into a DuckDB database:
@@ -71,7 +71,7 @@ ingestr ingest \
71
71
  --source-uri 'adjust://?api_key=nr_123' \
72
72
  --source-table 'creatives' \
73
73
  --dest-uri duckdb:///adjust.duckdb \
74
- --dest-table 'adjust.output'
74
+ --dest-table 'dest.output'
75
75
  ```
76
76
 
77
77
  Copy custom data from Adjust into a DuckDB database:
@@ -0,0 +1,58 @@
1
+ # Asana
2
+ [Asana](https://asana.com/) is a software-as-a-service platform designed for team collaboration and work management. Teams can create projects, assign tasks, set deadlines, and communicate directly within Asana. It also includes reporting tools, file attachments, calendars, and goal tracking.
3
+
4
+ ## URI format
5
+
6
+ The URI format for Asana is as follows:
7
+ ```
8
+ asana://<workspace_id>?access_token=<access_token>
9
+ ```
10
+
11
+ URI parameters:
12
+ - `workspace_id` is the `gid` of the workspace.
13
+ - `access_token` is a personal access token.
14
+
15
+ You can obtain `workspace_id` by going to the [admin console](https://help.asana.com/s/article/how-to-access-the-admin-console). The URL in your browser will look something like this:
16
+
17
+ ```
18
+ https://app.asana.com/admin/fake-123456789/
19
+ ```
20
+
21
+ In this example `fake-123456789` is your workspace id.
22
+
23
+ ## Setting up an Asana Integration
24
+
25
+ You can obtain a personal access token from the [developer console](https://app.asana.com/0/my-apps). For more information, see [Asana developers documentation](https://developers.asana.com/docs/personal-access-token).
26
+
27
+ ## Example
28
+ Let's say you have a workspace with id `workspace-1337` and you want to ingest all tasks into a duckdb database called `work.db`. For this example the value of `access_token` will be `fake_token`
29
+
30
+ You can run the following to achieve this:
31
+ ```sh
32
+ ingestr ingest \
33
+ --source-uri "asana://workspace-1337?access_token=fake_token" \
34
+ --source-table "tasks" \
35
+ --dest-uri "duckdb://./work.db" \
36
+ --dest-table "public.tasks"
37
+ ```
38
+
39
+
40
+ ## Tables
41
+
42
+ Asana source allows ingesting the following sources into separate tables:
43
+
44
+ | **Table** | **Description** |
45
+ |---------------|---------------------------------------------------------------------------------|
46
+ | `workspaces` | Information about people, materials, or assets required to complete a task or project successfully. |
47
+ | `projects` | Collections of tasks and related information. |
48
+ | `tasks` | Tasks within a project. Only tasks that belong to a project can be ingested. Users private tasks are not ingested, for example. |
49
+ | `projects` | Collections of tasks and related information. |
50
+ | `tags` | Labels that can be attached to tasks, projects, or conversations to help categorize and organize them. |
51
+ | `stories` | Updates or comments that team members can add to a task or project. |
52
+ | `teams` | Groups of individuals who work together to complete projects and tasks. |
53
+ | `users` | Individuals who have access to the Asana platform. |
54
+
55
+ Use these as `--source-table` parameter in the `ingestr ingest` command.
56
+
57
+ > [!WARNING]
58
+ > Asana does not support incremental loading for many endpoints in its APIs, which means ingestr will load endpoints incrementally if they support it, and do a full-refresh if not.
@@ -1,4 +1,4 @@
1
- # Athena
1
+ # AWS Athena
2
2
  [Athena](https://aws.amazon.com/athena/) is an interactive query service that allows users to analyze data directly in Amazon S3 using standard SQL.
3
3
 
4
4
  The Athena destination stores data as Parquet files in S3 buckets and creates external tables in AWS Glue Catalog.
@@ -0,0 +1,90 @@
1
+ # DynamoDB
2
+
3
+ Amazon [DynamoDB](https://aws.amazon.com/dynamodb/) is a managed NoSQL database service provided by Amazon Web Services (AWS). It supports key-value and document data structures and is designed to handle a wide range of applications requiring scalability and performance.
4
+
5
+ ## URI format
6
+
7
+ The URI format for DynamoDB is as follows:
8
+ ```plaintext
9
+ dynamodb://dynamodb.<region>.amazonaws.com?access_key_id=<aws_access_key_id>&secret_access_key=<aws_secret_access_key>
10
+ ```
11
+
12
+ URI parameters:
13
+
14
+ - `access_key_id`: Identifes an IAM account.
15
+ - `secret_access_key`: Password for the IAM account.
16
+
17
+
18
+ ## Setting up a DynamoDB integration
19
+
20
+ ### Prerequisites
21
+ * AWS IAM access key pair.
22
+ * A DynamoDB Table that you will to load data from
23
+
24
+ To obtain the access keys, use the IAM console on AWS. See [IAM Documentation](https://docs.aws.amazon.com/IAM/latest/UserGuide/id_credentials_access-keys.html) for more information.
25
+
26
+
27
+ ### Configuring Permissions
28
+ To use DynamoDB source, the user account must have the following IAM permissions:
29
+ * `dynamodb:DescribeTable`
30
+ * `dynamodb:Scan`
31
+
32
+ Following AWS Best practices, you can create an IAM policy that you can assign to the user account you wish to use with `ingestr`.
33
+ Below is a sample policy:
34
+ ```json
35
+ {
36
+ "Version": "2012-10-17",
37
+ "Statement": [
38
+ {
39
+ "Sid": "Statement1",
40
+ "Effect": "Allow",
41
+ "Action": [
42
+ "dynamodb:DescribeTable",
43
+ "dynamodb:Scan"
44
+ ],
45
+ "Resource": [
46
+ "<TABLE_ARN>"
47
+ ]
48
+ }
49
+ ]
50
+ }
51
+ ```
52
+
53
+ Replace `TABLE_ARN` with the DynamoDB [Amazon Resource Name](https://docs.aws.amazon.com/IAM/latest/UserGuide/reference-arns.html) of your Table. You can find the ARN for your table in the [DynamoDB console](https://console.aws.amazon.com/dynamodb/home). You can add as many tables you want in the `Resource` field. Alternatively, if you'd like to give access to all tables that you own, you can set `Resource` to `["*"]`.
54
+
55
+ ### Example: Simple load
56
+
57
+ For this example, we'll assume the value of `access_key_id` and `secret_access_key` are `user` and `pass` respectively.
58
+
59
+ Say you have a table called `absolute-armadillo` in the region `ap-south-1` and you want to load this data to a duckdb database called `animal.db`.
60
+
61
+ You run the following to achieve this:
62
+ ```sh
63
+ ingestr ingest \
64
+ --source-uri "dynamodb://dynamodb.ap-south-1.amazonaws.com?access_key_id=user&secret_access_key=pass" \
65
+ --source-table "absolute-armadillo" \
66
+ --dest-uri "duckdb://./animal.db" \
67
+ --dest-table "public.armadillo"
68
+ ```
69
+
70
+ ### Example: Incremental load
71
+ `ingestr` supports incremental loading. Incremental loading is a technique whereby only rows or fields that are changed are fetched. This reduces load times of subsequent runs and improves efficiency of your pipelines.
72
+
73
+ Assuming the same setup from [Simple Load](#example-simple-load), we can run incremental load with:
74
+ ```sh
75
+ ingestr ingest \
76
+ --source-uri "dynamodb://dynamodb.ap-south-1.amazonaws.com?access_key_id=user&secret_access_key=pass" \
77
+ --source-table "absolute-armadillo" \
78
+ --dest-uri "duckdb://./animal.db" \
79
+ --dest-table "public.armadillo" \
80
+ --incremental-strategy "replace" \
81
+ --incremental-key "updated_at"
82
+ ```
83
+
84
+ Assuming that `absolute-armadillo` table has a datetime field called `updated_at`, whenever you run this command, only rows with value greater than `MAX(updated_at)` from previous load will be fetched from DynamoDB.
85
+
86
+ > [!WARNING]
87
+ > DynamoDB doesn't support indexed range scans.
88
+ > Whenever you run `ingestr ingest`, the whole table is scanned.
89
+ > Although `ingestr` does specify a filter critiera, DynamoDB only applies
90
+ > this _after_ running the table scan.
@@ -23,7 +23,7 @@ The URI is used to connect to the Gorgias API for extracting data.
23
23
  ingestr ingest --source-table 'tickets' --source-uri $GORGIAS_URI --dest-uri $BIGQUERY_URI --interval-start 2024-06-19 --dest-table 'gorgias.ticket_messages' --loader-file-format jsonl
24
24
 
25
25
  # get all the customers and write them to `gorgias.customers` table on DuckDB
26
- ingestr ingest --source-table 'customers' --source-uri $GORGIAS_URI --dest-uri duckdb:///gorgias.duckdb --interval-start 2024-01-01 --dest-table 'gorgias.customers'
26
+ ingestr ingest --source-table 'customers' --source-uri $GORGIAS_URI --dest-uri duckdb:///gorgias.duckdb --interval-start 2024-01-01 --dest-table 'dest.customers'
27
27
  ```
28
28
 
29
29
  ## Supported entities
@@ -37,7 +37,7 @@ Once you complete the guide, you should have a service account JSON file and the
37
37
  Based on this assumption, here's a sample command that will copy the data from the Google Sheets spreadsheet into a DuckDB database:
38
38
 
39
39
  ```sh
40
- ingestr ingest --source-uri 'gsheets://?credentials_path=/path/to/file.json' --source-table 'fkdUQ2bjdNfUq2CA.Sheet1' --dest-uri duckdb:///gsheets.duckdb --dest-table 'gsheets.output'
40
+ ingestr ingest --source-uri 'gsheets://?credentials_path=/path/to/file.json' --source-table 'fkdUQ2bjdNfUq2CA.Sheet1' --dest-uri duckdb:///gsheets.duckdb --dest-table 'dest.output'
41
41
  ```
42
42
 
43
43
  The result of this command will be a table in the `gsheets.duckdb` database.
@@ -32,7 +32,7 @@ ingestr ingest \
32
32
  --source-uri 'kafka://?bootstrap_servers=localhost:9092&group_id=test_group' \
33
33
  --source-table 'my-topic' \
34
34
  --dest-uri duckdb:///kafka.duckdb \
35
- --dest-table 'kafka.my_topic'
35
+ --dest-table 'dest.my_topic'
36
36
  ```
37
37
 
38
38
  The result of this command will be a table in the `kafka.duckdb` database with JSON columns.
@@ -19,10 +19,10 @@ URI parameters:
19
19
  The URI is used to connect to the Klaviyo API for extracting data.
20
20
 
21
21
  ```bash
22
- ingestr ingest --source-table 'events' --source-uri 'klaviyo://?api_key=pk_test' --dest-uri duckdb:///klaviyo.duckdb --interval-start 2022-01-01 --dest-table 'klaviyo.events' --extract-parallelism 20
22
+ ingestr ingest --source-table 'events' --source-uri 'klaviyo://?api_key=pk_test' --dest-uri duckdb:///klaviyo.duckdb --interval-start 2022-01-01 --dest-table 'dest.events' --extract-parallelism 20
23
23
  ```
24
24
 
25
- This command fetches all the events that are created/updated since 2022-01-01 and writes them to `klaviyo.events` table on DuckDB, using 20 parallel threads to improve performance and efficiently handle large data .
25
+ This command fetches all the events that are created/updated since 2022-01-01 and writes them to `dest.events` table on DuckDB, using 20 parallel threads to improve performance and efficiently handle large data .
26
26
 
27
27
  ## Tables
28
28
 
@@ -22,7 +22,7 @@ Notion requires a few steps to set up an integration, please follow the guide dl
22
22
  Once you complete the guide, you should have an API key, and the table ID to connect to. Let's say your API token is `secret_12345` and the database you'd like to connect to is `bfeaafc0c25f40a9asdasd672a9456f3`, here's a sample command that will copy the data from the Notion table into a DuckDB database:
23
23
 
24
24
  ```sh
25
- ingestr ingest --source-uri 'notion://?api_key=secret_12345' --source-table 'bfeaafc0c25f40a9asdasd672a9456f3' --dest-uri duckdb:///notion.duckdb --dest-table 'notion.output'
25
+ ingestr ingest --source-uri 'notion://?api_key=secret_12345' --source-table 'bfeaafc0c25f40a9asdasd672a9456f3' --dest-uri duckdb:///notion.duckdb --dest-table 'dest.output'
26
26
  ```
27
27
 
28
28
  The result of this command will be a table in the `notion.duckdb` database with JSON columns.
@@ -23,7 +23,7 @@ Shopify requires a few steps to set up an integration, please follow the guide d
23
23
  Once you complete the guide, you should have an API key and the store name to connect to. Let's say your API key is `shpkey_12345` and the store you'd like to connect to is `my-store`, here's a sample command that will copy the data from the Shopify store into a DuckDB database:
24
24
 
25
25
  ```sh
26
- ingestr ingest --source-uri 'shopify://my-store.myshopify.com?api_key=shpkey_12345' --source-table 'orders' --dest-uri duckdb:///shopify.duckdb --dest-table 'shopify.orders'
26
+ ingestr ingest --source-uri 'shopify://my-store.myshopify.com?api_key=shpkey_12345' --source-table 'orders' --dest-uri duckdb:///shopify.duckdb --dest-table 'dest.orders'
27
27
  ```
28
28
 
29
29
  The result of this command will be a table in the `shopify.duckdb` database with JSON columns.
@@ -25,7 +25,7 @@ Stripe requires a few steps to set up an integration, please follow the guide dl
25
25
  Once you complete the guide, you should have an API key. Let's say your API key is `sk_test_12345`, here's a sample command that will copy the data from Stripe into a DuckDB database:
26
26
 
27
27
  ```sh
28
- ingestr ingest --source-uri 'stripe://?api_key=sk_test_12345' --source-table 'charges' --dest-uri duckdb:///stripe.duckdb --dest-table 'stripe.charges'
28
+ ingestr ingest --source-uri 'stripe://?api_key=sk_test_12345' --source-table 'charges' --dest-uri duckdb:///stripe.duckdb --dest-table 'dest.charges'
29
29
  ```
30
30
 
31
31
  The result of this command will be a table in the `stripe.duckdb` database with JSON columns.
@@ -39,7 +39,7 @@ Once you complete the guide, if you decide to use an OAuth token, you should hav
39
39
  ingestr ingest --source-uri "zendesk://:qVsbdiasVt@mycompany" \
40
40
  --source-table 'tickets' \
41
41
  --dest-uri 'duckdb:///zendesk.duckdb' \
42
- --dest-table 'zendesk.tickets' \
42
+ --dest-table 'dest.tickets' \
43
43
  --interval-start '2024-01-01'
44
44
  ```
45
45
 
@@ -49,7 +49,7 @@ If you decide to use an API Token, you should have a subdomain, email, and API t
49
49
  ingestr ingest --source-uri "zendesk://john@get.com:nbs123@mycompany" \
50
50
  --source-table 'tickets' \
51
51
  --dest-uri 'duckdb:///zendesk.duckdb' \
52
- --dest-table 'zendesk.tickets' \
52
+ --dest-table 'dest.tickets' \
53
53
  --interval-start '2024-01-01'
54
54
  ```
55
55
 
@@ -288,7 +288,6 @@ def ingest(
288
288
  ),
289
289
  ] = [], # type: ignore
290
290
  ):
291
-
292
291
  # TODO(turtledev): can't we move this to the top of this file?
293
292
  import hashlib
294
293
  import tempfile
@@ -386,7 +385,7 @@ def ingest(
386
385
 
387
386
  factory = SourceDestinationFactory(source_uri, dest_uri)
388
387
  track(
389
- "command_running",
388
+ "command_running",
390
389
  {
391
390
  "command": "ingest",
392
391
  "source_type": factory.source_scheme,
@@ -67,13 +67,16 @@ def adjust_source(
67
67
  filters=filters,
68
68
  )
69
69
 
70
+ if not dimensions:
71
+ return campaigns, creatives
72
+
70
73
  merge_key = merge_key
74
+ type_hints = {}
71
75
  for dimension in REQUIRED_CUSTOM_DIMENSIONS:
72
76
  if dimension in dimensions:
73
77
  merge_key = dimension
74
78
  break
75
79
 
76
- type_hints = {}
77
80
  for dimension in dimensions:
78
81
  if dimension in KNOWN_TYPE_HINTS:
79
82
  type_hints[dimension] = KNOWN_TYPE_HINTS[dimension]