airbyte-cdk 0.72.0__py3-none-any.whl → 6.17.1.dev0__py3-none-any.whl

Sign up to get free protection for your applications and to get access to all the features.
Files changed (518) hide show
  1. airbyte_cdk/__init__.py +355 -6
  2. airbyte_cdk/cli/__init__.py +1 -0
  3. airbyte_cdk/cli/source_declarative_manifest/__init__.py +5 -0
  4. airbyte_cdk/cli/source_declarative_manifest/_run.py +230 -0
  5. airbyte_cdk/cli/source_declarative_manifest/spec.json +17 -0
  6. airbyte_cdk/config_observation.py +29 -10
  7. airbyte_cdk/connector.py +24 -24
  8. airbyte_cdk/connector_builder/README.md +53 -0
  9. airbyte_cdk/connector_builder/connector_builder_handler.py +37 -11
  10. airbyte_cdk/connector_builder/main.py +45 -13
  11. airbyte_cdk/connector_builder/message_grouper.py +189 -50
  12. airbyte_cdk/connector_builder/models.py +3 -2
  13. airbyte_cdk/destinations/__init__.py +4 -3
  14. airbyte_cdk/destinations/destination.py +54 -20
  15. airbyte_cdk/destinations/vector_db_based/README.md +37 -0
  16. airbyte_cdk/destinations/vector_db_based/config.py +40 -17
  17. airbyte_cdk/destinations/vector_db_based/document_processor.py +56 -17
  18. airbyte_cdk/destinations/vector_db_based/embedder.py +57 -15
  19. airbyte_cdk/destinations/vector_db_based/test_utils.py +14 -4
  20. airbyte_cdk/destinations/vector_db_based/utils.py +8 -2
  21. airbyte_cdk/destinations/vector_db_based/writer.py +24 -5
  22. airbyte_cdk/entrypoint.py +153 -44
  23. airbyte_cdk/exception_handler.py +21 -3
  24. airbyte_cdk/logger.py +30 -44
  25. airbyte_cdk/models/__init__.py +13 -2
  26. airbyte_cdk/models/airbyte_protocol.py +86 -1
  27. airbyte_cdk/models/airbyte_protocol_serializers.py +44 -0
  28. airbyte_cdk/models/file_transfer_record_message.py +13 -0
  29. airbyte_cdk/models/well_known_types.py +1 -1
  30. airbyte_cdk/sources/__init__.py +5 -1
  31. airbyte_cdk/sources/abstract_source.py +125 -79
  32. airbyte_cdk/sources/concurrent_source/__init__.py +7 -2
  33. airbyte_cdk/sources/concurrent_source/concurrent_read_processor.py +102 -36
  34. airbyte_cdk/sources/concurrent_source/concurrent_source.py +29 -36
  35. airbyte_cdk/sources/concurrent_source/concurrent_source_adapter.py +94 -10
  36. airbyte_cdk/sources/concurrent_source/stream_thread_exception.py +25 -0
  37. airbyte_cdk/sources/concurrent_source/thread_pool_manager.py +20 -14
  38. airbyte_cdk/sources/config.py +3 -2
  39. airbyte_cdk/sources/connector_state_manager.py +49 -83
  40. airbyte_cdk/sources/declarative/async_job/job.py +52 -0
  41. airbyte_cdk/sources/declarative/async_job/job_orchestrator.py +497 -0
  42. airbyte_cdk/sources/declarative/async_job/job_tracker.py +75 -0
  43. airbyte_cdk/sources/declarative/async_job/repository.py +35 -0
  44. airbyte_cdk/sources/declarative/async_job/status.py +24 -0
  45. airbyte_cdk/sources/declarative/async_job/timer.py +39 -0
  46. airbyte_cdk/sources/declarative/auth/__init__.py +2 -3
  47. airbyte_cdk/sources/declarative/auth/declarative_authenticator.py +3 -1
  48. airbyte_cdk/sources/declarative/auth/jwt.py +191 -0
  49. airbyte_cdk/sources/declarative/auth/oauth.py +60 -20
  50. airbyte_cdk/sources/declarative/auth/selective_authenticator.py +10 -2
  51. airbyte_cdk/sources/declarative/auth/token.py +28 -10
  52. airbyte_cdk/sources/declarative/auth/token_provider.py +9 -8
  53. airbyte_cdk/sources/declarative/checks/check_stream.py +16 -8
  54. airbyte_cdk/sources/declarative/checks/connection_checker.py +4 -2
  55. airbyte_cdk/sources/declarative/concurrency_level/__init__.py +7 -0
  56. airbyte_cdk/sources/declarative/concurrency_level/concurrency_level.py +50 -0
  57. airbyte_cdk/sources/declarative/concurrent_declarative_source.py +490 -0
  58. airbyte_cdk/sources/declarative/datetime/datetime_parser.py +4 -0
  59. airbyte_cdk/sources/declarative/datetime/min_max_datetime.py +26 -6
  60. airbyte_cdk/sources/declarative/declarative_component_schema.yaml +1213 -88
  61. airbyte_cdk/sources/declarative/declarative_source.py +5 -2
  62. airbyte_cdk/sources/declarative/declarative_stream.py +95 -9
  63. airbyte_cdk/sources/declarative/decoders/__init__.py +23 -2
  64. airbyte_cdk/sources/declarative/decoders/composite_raw_decoder.py +97 -0
  65. airbyte_cdk/sources/declarative/decoders/decoder.py +11 -4
  66. airbyte_cdk/sources/declarative/decoders/json_decoder.py +92 -5
  67. airbyte_cdk/sources/declarative/decoders/noop_decoder.py +21 -0
  68. airbyte_cdk/sources/declarative/decoders/pagination_decoder_decorator.py +39 -0
  69. airbyte_cdk/sources/declarative/decoders/xml_decoder.py +98 -0
  70. airbyte_cdk/sources/declarative/extractors/__init__.py +12 -1
  71. airbyte_cdk/sources/declarative/extractors/dpath_extractor.py +29 -24
  72. airbyte_cdk/sources/declarative/extractors/http_selector.py +4 -5
  73. airbyte_cdk/sources/declarative/extractors/record_extractor.py +2 -3
  74. airbyte_cdk/sources/declarative/extractors/record_filter.py +63 -8
  75. airbyte_cdk/sources/declarative/extractors/record_selector.py +85 -26
  76. airbyte_cdk/sources/declarative/extractors/response_to_file_extractor.py +177 -0
  77. airbyte_cdk/sources/declarative/extractors/type_transformer.py +55 -0
  78. airbyte_cdk/sources/declarative/incremental/__init__.py +31 -3
  79. airbyte_cdk/sources/declarative/incremental/concurrent_partition_cursor.py +346 -0
  80. airbyte_cdk/sources/declarative/incremental/datetime_based_cursor.py +156 -48
  81. airbyte_cdk/sources/declarative/incremental/declarative_cursor.py +13 -0
  82. airbyte_cdk/sources/declarative/incremental/global_substream_cursor.py +350 -0
  83. airbyte_cdk/sources/declarative/incremental/per_partition_cursor.py +173 -74
  84. airbyte_cdk/sources/declarative/incremental/per_partition_with_global.py +200 -0
  85. airbyte_cdk/sources/declarative/incremental/resumable_full_refresh_cursor.py +122 -0
  86. airbyte_cdk/sources/declarative/interpolation/filters.py +27 -1
  87. airbyte_cdk/sources/declarative/interpolation/interpolated_boolean.py +23 -5
  88. airbyte_cdk/sources/declarative/interpolation/interpolated_mapping.py +12 -8
  89. airbyte_cdk/sources/declarative/interpolation/interpolated_nested_mapping.py +13 -6
  90. airbyte_cdk/sources/declarative/interpolation/interpolated_string.py +21 -6
  91. airbyte_cdk/sources/declarative/interpolation/interpolation.py +9 -3
  92. airbyte_cdk/sources/declarative/interpolation/jinja.py +72 -37
  93. airbyte_cdk/sources/declarative/interpolation/macros.py +72 -17
  94. airbyte_cdk/sources/declarative/manifest_declarative_source.py +193 -52
  95. airbyte_cdk/sources/declarative/migrations/legacy_to_per_partition_state_migration.py +98 -0
  96. airbyte_cdk/sources/declarative/migrations/state_migration.py +24 -0
  97. airbyte_cdk/sources/declarative/models/__init__.py +1 -1
  98. airbyte_cdk/sources/declarative/models/declarative_component_schema.py +1329 -595
  99. airbyte_cdk/sources/declarative/parsers/custom_exceptions.py +2 -2
  100. airbyte_cdk/sources/declarative/parsers/manifest_component_transformer.py +26 -4
  101. airbyte_cdk/sources/declarative/parsers/manifest_reference_resolver.py +26 -15
  102. airbyte_cdk/sources/declarative/parsers/model_to_component_factory.py +1763 -226
  103. airbyte_cdk/sources/declarative/partition_routers/__init__.py +24 -4
  104. airbyte_cdk/sources/declarative/partition_routers/async_job_partition_router.py +65 -0
  105. airbyte_cdk/sources/declarative/partition_routers/cartesian_product_stream_slicer.py +176 -0
  106. airbyte_cdk/sources/declarative/partition_routers/list_partition_router.py +39 -9
  107. airbyte_cdk/sources/declarative/partition_routers/partition_router.py +62 -0
  108. airbyte_cdk/sources/declarative/partition_routers/single_partition_router.py +15 -3
  109. airbyte_cdk/sources/declarative/partition_routers/substream_partition_router.py +222 -39
  110. airbyte_cdk/sources/declarative/requesters/error_handlers/__init__.py +19 -5
  111. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/__init__.py +3 -1
  112. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/constant_backoff_strategy.py +19 -7
  113. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/exponential_backoff_strategy.py +19 -7
  114. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/header_helper.py +4 -2
  115. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/wait_time_from_header_backoff_strategy.py +41 -9
  116. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/wait_until_time_from_header_backoff_strategy.py +29 -14
  117. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategy.py +5 -13
  118. airbyte_cdk/sources/declarative/requesters/error_handlers/composite_error_handler.py +32 -16
  119. airbyte_cdk/sources/declarative/requesters/error_handlers/default_error_handler.py +46 -56
  120. airbyte_cdk/sources/declarative/requesters/error_handlers/default_http_response_filter.py +40 -0
  121. airbyte_cdk/sources/declarative/requesters/error_handlers/error_handler.py +6 -32
  122. airbyte_cdk/sources/declarative/requesters/error_handlers/http_response_filter.py +119 -41
  123. airbyte_cdk/sources/declarative/requesters/http_job_repository.py +228 -0
  124. airbyte_cdk/sources/declarative/requesters/http_requester.py +98 -344
  125. airbyte_cdk/sources/declarative/requesters/paginators/__init__.py +14 -3
  126. airbyte_cdk/sources/declarative/requesters/paginators/default_paginator.py +105 -46
  127. airbyte_cdk/sources/declarative/requesters/paginators/no_pagination.py +14 -8
  128. airbyte_cdk/sources/declarative/requesters/paginators/paginator.py +19 -8
  129. airbyte_cdk/sources/declarative/requesters/paginators/strategies/__init__.py +9 -3
  130. airbyte_cdk/sources/declarative/requesters/paginators/strategies/cursor_pagination_strategy.py +53 -21
  131. airbyte_cdk/sources/declarative/requesters/paginators/strategies/offset_increment.py +42 -19
  132. airbyte_cdk/sources/declarative/requesters/paginators/strategies/page_increment.py +25 -12
  133. airbyte_cdk/sources/declarative/requesters/paginators/strategies/pagination_strategy.py +13 -10
  134. airbyte_cdk/sources/declarative/requesters/paginators/strategies/stop_condition.py +26 -13
  135. airbyte_cdk/sources/declarative/requesters/request_options/__init__.py +15 -2
  136. airbyte_cdk/sources/declarative/requesters/request_options/datetime_based_request_options_provider.py +91 -0
  137. airbyte_cdk/sources/declarative/requesters/request_options/default_request_options_provider.py +60 -0
  138. airbyte_cdk/sources/declarative/requesters/request_options/interpolated_nested_request_input_provider.py +31 -14
  139. airbyte_cdk/sources/declarative/requesters/request_options/interpolated_request_input_provider.py +27 -15
  140. airbyte_cdk/sources/declarative/requesters/request_options/interpolated_request_options_provider.py +63 -10
  141. airbyte_cdk/sources/declarative/requesters/request_options/request_options_provider.py +1 -1
  142. airbyte_cdk/sources/declarative/requesters/requester.py +9 -17
  143. airbyte_cdk/sources/declarative/resolvers/__init__.py +41 -0
  144. airbyte_cdk/sources/declarative/resolvers/components_resolver.py +55 -0
  145. airbyte_cdk/sources/declarative/resolvers/config_components_resolver.py +136 -0
  146. airbyte_cdk/sources/declarative/resolvers/http_components_resolver.py +112 -0
  147. airbyte_cdk/sources/declarative/retrievers/__init__.py +6 -2
  148. airbyte_cdk/sources/declarative/retrievers/async_retriever.py +100 -0
  149. airbyte_cdk/sources/declarative/retrievers/retriever.py +1 -3
  150. airbyte_cdk/sources/declarative/retrievers/simple_retriever.py +229 -73
  151. airbyte_cdk/sources/declarative/schema/__init__.py +14 -1
  152. airbyte_cdk/sources/declarative/schema/default_schema_loader.py +5 -3
  153. airbyte_cdk/sources/declarative/schema/dynamic_schema_loader.py +236 -0
  154. airbyte_cdk/sources/declarative/schema/json_file_schema_loader.py +8 -8
  155. airbyte_cdk/sources/declarative/spec/spec.py +12 -5
  156. airbyte_cdk/sources/declarative/stream_slicers/__init__.py +1 -2
  157. airbyte_cdk/sources/declarative/stream_slicers/declarative_partition_generator.py +88 -0
  158. airbyte_cdk/sources/declarative/stream_slicers/stream_slicer.py +9 -14
  159. airbyte_cdk/sources/declarative/transformations/add_fields.py +19 -11
  160. airbyte_cdk/sources/declarative/transformations/flatten_fields.py +52 -0
  161. airbyte_cdk/sources/declarative/transformations/keys_replace_transformation.py +61 -0
  162. airbyte_cdk/sources/declarative/transformations/keys_to_lower_transformation.py +22 -0
  163. airbyte_cdk/sources/declarative/transformations/keys_to_snake_transformation.py +68 -0
  164. airbyte_cdk/sources/declarative/transformations/remove_fields.py +13 -10
  165. airbyte_cdk/sources/declarative/transformations/transformation.py +5 -5
  166. airbyte_cdk/sources/declarative/types.py +19 -110
  167. airbyte_cdk/sources/declarative/yaml_declarative_source.py +31 -10
  168. airbyte_cdk/sources/embedded/base_integration.py +16 -5
  169. airbyte_cdk/sources/embedded/catalog.py +16 -4
  170. airbyte_cdk/sources/embedded/runner.py +19 -3
  171. airbyte_cdk/sources/embedded/tools.py +5 -2
  172. airbyte_cdk/sources/file_based/README.md +152 -0
  173. airbyte_cdk/sources/file_based/__init__.py +24 -0
  174. airbyte_cdk/sources/file_based/availability_strategy/__init__.py +9 -2
  175. airbyte_cdk/sources/file_based/availability_strategy/abstract_file_based_availability_strategy.py +22 -6
  176. airbyte_cdk/sources/file_based/availability_strategy/default_file_based_availability_strategy.py +46 -10
  177. airbyte_cdk/sources/file_based/config/abstract_file_based_spec.py +47 -10
  178. airbyte_cdk/sources/file_based/config/avro_format.py +2 -1
  179. airbyte_cdk/sources/file_based/config/csv_format.py +29 -10
  180. airbyte_cdk/sources/file_based/config/excel_format.py +18 -0
  181. airbyte_cdk/sources/file_based/config/file_based_stream_config.py +16 -4
  182. airbyte_cdk/sources/file_based/config/jsonl_format.py +2 -1
  183. airbyte_cdk/sources/file_based/config/parquet_format.py +2 -1
  184. airbyte_cdk/sources/file_based/config/unstructured_format.py +13 -5
  185. airbyte_cdk/sources/file_based/discovery_policy/__init__.py +6 -2
  186. airbyte_cdk/sources/file_based/discovery_policy/abstract_discovery_policy.py +2 -4
  187. airbyte_cdk/sources/file_based/discovery_policy/default_discovery_policy.py +7 -2
  188. airbyte_cdk/sources/file_based/exceptions.py +18 -15
  189. airbyte_cdk/sources/file_based/file_based_source.py +140 -33
  190. airbyte_cdk/sources/file_based/file_based_stream_reader.py +69 -5
  191. airbyte_cdk/sources/file_based/file_types/__init__.py +14 -1
  192. airbyte_cdk/sources/file_based/file_types/avro_parser.py +75 -24
  193. airbyte_cdk/sources/file_based/file_types/csv_parser.py +116 -34
  194. airbyte_cdk/sources/file_based/file_types/excel_parser.py +196 -0
  195. airbyte_cdk/sources/file_based/file_types/file_transfer.py +37 -0
  196. airbyte_cdk/sources/file_based/file_types/file_type_parser.py +4 -1
  197. airbyte_cdk/sources/file_based/file_types/jsonl_parser.py +24 -8
  198. airbyte_cdk/sources/file_based/file_types/parquet_parser.py +60 -18
  199. airbyte_cdk/sources/file_based/file_types/unstructured_parser.py +141 -41
  200. airbyte_cdk/sources/file_based/remote_file.py +1 -1
  201. airbyte_cdk/sources/file_based/schema_helpers.py +38 -10
  202. airbyte_cdk/sources/file_based/schema_validation_policies/__init__.py +3 -1
  203. airbyte_cdk/sources/file_based/schema_validation_policies/abstract_schema_validation_policy.py +3 -1
  204. airbyte_cdk/sources/file_based/schema_validation_policies/default_schema_validation_policies.py +16 -5
  205. airbyte_cdk/sources/file_based/stream/abstract_file_based_stream.py +50 -13
  206. airbyte_cdk/sources/file_based/stream/concurrent/adapters.py +67 -27
  207. airbyte_cdk/sources/file_based/stream/concurrent/cursor/__init__.py +5 -1
  208. airbyte_cdk/sources/file_based/stream/concurrent/cursor/abstract_concurrent_file_based_cursor.py +14 -23
  209. airbyte_cdk/sources/file_based/stream/concurrent/cursor/file_based_concurrent_cursor.py +54 -18
  210. airbyte_cdk/sources/file_based/stream/concurrent/cursor/file_based_final_state_cursor.py +21 -9
  211. airbyte_cdk/sources/file_based/stream/cursor/abstract_file_based_cursor.py +3 -1
  212. airbyte_cdk/sources/file_based/stream/cursor/default_file_based_cursor.py +27 -10
  213. airbyte_cdk/sources/file_based/stream/default_file_based_stream.py +147 -45
  214. airbyte_cdk/sources/http_logger.py +8 -3
  215. airbyte_cdk/sources/message/__init__.py +7 -1
  216. airbyte_cdk/sources/message/repository.py +18 -4
  217. airbyte_cdk/sources/source.py +42 -38
  218. airbyte_cdk/sources/streams/__init__.py +2 -2
  219. airbyte_cdk/sources/streams/availability_strategy.py +54 -3
  220. airbyte_cdk/sources/streams/call_rate.py +64 -21
  221. airbyte_cdk/sources/streams/checkpoint/__init__.py +26 -0
  222. airbyte_cdk/sources/streams/checkpoint/checkpoint_reader.py +335 -0
  223. airbyte_cdk/sources/{declarative/incremental → streams/checkpoint}/cursor.py +17 -14
  224. airbyte_cdk/sources/streams/checkpoint/per_partition_key_serializer.py +22 -0
  225. airbyte_cdk/sources/streams/checkpoint/resumable_full_refresh_cursor.py +51 -0
  226. airbyte_cdk/sources/streams/checkpoint/substream_resumable_full_refresh_cursor.py +110 -0
  227. airbyte_cdk/sources/streams/concurrent/README.md +7 -0
  228. airbyte_cdk/sources/streams/concurrent/abstract_stream.py +7 -2
  229. airbyte_cdk/sources/streams/concurrent/adapters.py +84 -75
  230. airbyte_cdk/sources/streams/concurrent/availability_strategy.py +30 -2
  231. airbyte_cdk/sources/streams/concurrent/cursor.py +298 -42
  232. airbyte_cdk/sources/streams/concurrent/default_stream.py +12 -3
  233. airbyte_cdk/sources/streams/concurrent/exceptions.py +3 -0
  234. airbyte_cdk/sources/streams/concurrent/helpers.py +14 -3
  235. airbyte_cdk/sources/streams/concurrent/partition_enqueuer.py +12 -3
  236. airbyte_cdk/sources/streams/concurrent/partition_reader.py +10 -3
  237. airbyte_cdk/sources/streams/concurrent/partitions/partition.py +1 -16
  238. airbyte_cdk/sources/streams/concurrent/partitions/stream_slicer.py +21 -0
  239. airbyte_cdk/sources/streams/concurrent/partitions/types.py +15 -5
  240. airbyte_cdk/sources/streams/concurrent/state_converters/abstract_stream_state_converter.py +109 -17
  241. airbyte_cdk/sources/streams/concurrent/state_converters/datetime_stream_state_converter.py +90 -72
  242. airbyte_cdk/sources/streams/core.py +412 -87
  243. airbyte_cdk/sources/streams/http/__init__.py +2 -1
  244. airbyte_cdk/sources/streams/http/availability_strategy.py +12 -101
  245. airbyte_cdk/sources/streams/http/error_handlers/__init__.py +22 -0
  246. airbyte_cdk/sources/streams/http/error_handlers/backoff_strategy.py +28 -0
  247. airbyte_cdk/sources/streams/http/error_handlers/default_backoff_strategy.py +17 -0
  248. airbyte_cdk/sources/streams/http/error_handlers/default_error_mapping.py +86 -0
  249. airbyte_cdk/sources/streams/http/error_handlers/error_handler.py +42 -0
  250. airbyte_cdk/sources/streams/http/error_handlers/error_message_parser.py +19 -0
  251. airbyte_cdk/sources/streams/http/error_handlers/http_status_error_handler.py +110 -0
  252. airbyte_cdk/sources/streams/http/error_handlers/json_error_message_parser.py +52 -0
  253. airbyte_cdk/sources/streams/http/error_handlers/response_models.py +65 -0
  254. airbyte_cdk/sources/streams/http/exceptions.py +27 -7
  255. airbyte_cdk/sources/streams/http/http.py +369 -246
  256. airbyte_cdk/sources/streams/http/http_client.py +531 -0
  257. airbyte_cdk/sources/streams/http/rate_limiting.py +76 -12
  258. airbyte_cdk/sources/streams/http/requests_native_auth/abstract_oauth.py +28 -9
  259. airbyte_cdk/sources/streams/http/requests_native_auth/abstract_token.py +2 -1
  260. airbyte_cdk/sources/streams/http/requests_native_auth/oauth.py +90 -35
  261. airbyte_cdk/sources/streams/http/requests_native_auth/token.py +13 -3
  262. airbyte_cdk/sources/types.py +154 -0
  263. airbyte_cdk/sources/utils/record_helper.py +36 -21
  264. airbyte_cdk/sources/utils/schema_helpers.py +13 -6
  265. airbyte_cdk/sources/utils/slice_logger.py +4 -1
  266. airbyte_cdk/sources/utils/transform.py +54 -20
  267. airbyte_cdk/sql/_util/hashing.py +34 -0
  268. airbyte_cdk/sql/_util/name_normalizers.py +92 -0
  269. airbyte_cdk/sql/constants.py +32 -0
  270. airbyte_cdk/sql/exceptions.py +235 -0
  271. airbyte_cdk/sql/secrets.py +123 -0
  272. airbyte_cdk/sql/shared/__init__.py +15 -0
  273. airbyte_cdk/sql/shared/catalog_providers.py +145 -0
  274. airbyte_cdk/sql/shared/sql_processor.py +786 -0
  275. airbyte_cdk/sql/types.py +160 -0
  276. airbyte_cdk/test/catalog_builder.py +70 -18
  277. airbyte_cdk/test/entrypoint_wrapper.py +117 -42
  278. airbyte_cdk/test/mock_http/__init__.py +1 -1
  279. airbyte_cdk/test/mock_http/matcher.py +6 -0
  280. airbyte_cdk/test/mock_http/mocker.py +57 -10
  281. airbyte_cdk/test/mock_http/request.py +19 -3
  282. airbyte_cdk/test/mock_http/response.py +3 -1
  283. airbyte_cdk/test/mock_http/response_builder.py +32 -16
  284. airbyte_cdk/test/state_builder.py +18 -10
  285. airbyte_cdk/test/utils/__init__.py +1 -0
  286. airbyte_cdk/test/utils/data.py +24 -0
  287. airbyte_cdk/test/utils/http_mocking.py +16 -0
  288. airbyte_cdk/test/utils/manifest_only_fixtures.py +60 -0
  289. airbyte_cdk/test/utils/reading.py +26 -0
  290. airbyte_cdk/utils/__init__.py +2 -1
  291. airbyte_cdk/utils/airbyte_secrets_utils.py +5 -3
  292. airbyte_cdk/utils/analytics_message.py +10 -2
  293. airbyte_cdk/utils/datetime_format_inferrer.py +4 -1
  294. airbyte_cdk/utils/event_timing.py +10 -10
  295. airbyte_cdk/utils/mapping_helpers.py +3 -1
  296. airbyte_cdk/utils/message_utils.py +20 -11
  297. airbyte_cdk/utils/print_buffer.py +75 -0
  298. airbyte_cdk/utils/schema_inferrer.py +198 -28
  299. airbyte_cdk/utils/slice_hasher.py +30 -0
  300. airbyte_cdk/utils/spec_schema_transformations.py +6 -3
  301. airbyte_cdk/utils/stream_status_utils.py +8 -1
  302. airbyte_cdk/utils/traced_exception.py +61 -21
  303. airbyte_cdk-6.17.1.dev0.dist-info/METADATA +109 -0
  304. airbyte_cdk-6.17.1.dev0.dist-info/RECORD +350 -0
  305. {airbyte_cdk-0.72.0.dist-info → airbyte_cdk-6.17.1.dev0.dist-info}/WHEEL +1 -2
  306. airbyte_cdk-6.17.1.dev0.dist-info/entry_points.txt +3 -0
  307. airbyte_cdk/sources/declarative/create_partial.py +0 -92
  308. airbyte_cdk/sources/declarative/parsers/class_types_registry.py +0 -102
  309. airbyte_cdk/sources/declarative/parsers/default_implementation_registry.py +0 -64
  310. airbyte_cdk/sources/declarative/requesters/error_handlers/response_action.py +0 -16
  311. airbyte_cdk/sources/declarative/requesters/error_handlers/response_status.py +0 -68
  312. airbyte_cdk/sources/declarative/stream_slicers/cartesian_product_stream_slicer.py +0 -114
  313. airbyte_cdk/sources/deprecated/base_source.py +0 -94
  314. airbyte_cdk/sources/deprecated/client.py +0 -99
  315. airbyte_cdk/sources/singer/__init__.py +0 -8
  316. airbyte_cdk/sources/singer/singer_helpers.py +0 -304
  317. airbyte_cdk/sources/singer/source.py +0 -186
  318. airbyte_cdk/sources/streams/concurrent/partitions/record.py +0 -23
  319. airbyte_cdk/sources/streams/http/auth/__init__.py +0 -17
  320. airbyte_cdk/sources/streams/http/auth/core.py +0 -29
  321. airbyte_cdk/sources/streams/http/auth/oauth.py +0 -113
  322. airbyte_cdk/sources/streams/http/auth/token.py +0 -47
  323. airbyte_cdk/sources/streams/utils/stream_helper.py +0 -40
  324. airbyte_cdk/sources/utils/catalog_helpers.py +0 -22
  325. airbyte_cdk/sources/utils/schema_models.py +0 -84
  326. airbyte_cdk-0.72.0.dist-info/METADATA +0 -243
  327. airbyte_cdk-0.72.0.dist-info/RECORD +0 -466
  328. airbyte_cdk-0.72.0.dist-info/top_level.txt +0 -3
  329. source_declarative_manifest/main.py +0 -29
  330. unit_tests/connector_builder/__init__.py +0 -3
  331. unit_tests/connector_builder/test_connector_builder_handler.py +0 -871
  332. unit_tests/connector_builder/test_message_grouper.py +0 -713
  333. unit_tests/connector_builder/utils.py +0 -27
  334. unit_tests/destinations/test_destination.py +0 -243
  335. unit_tests/singer/test_singer_helpers.py +0 -56
  336. unit_tests/singer/test_singer_source.py +0 -112
  337. unit_tests/sources/__init__.py +0 -0
  338. unit_tests/sources/concurrent_source/__init__.py +0 -3
  339. unit_tests/sources/concurrent_source/test_concurrent_source_adapter.py +0 -106
  340. unit_tests/sources/declarative/__init__.py +0 -3
  341. unit_tests/sources/declarative/auth/__init__.py +0 -3
  342. unit_tests/sources/declarative/auth/test_oauth.py +0 -331
  343. unit_tests/sources/declarative/auth/test_selective_authenticator.py +0 -39
  344. unit_tests/sources/declarative/auth/test_session_token_auth.py +0 -182
  345. unit_tests/sources/declarative/auth/test_token_auth.py +0 -200
  346. unit_tests/sources/declarative/auth/test_token_provider.py +0 -73
  347. unit_tests/sources/declarative/checks/__init__.py +0 -3
  348. unit_tests/sources/declarative/checks/test_check_stream.py +0 -146
  349. unit_tests/sources/declarative/decoders/__init__.py +0 -0
  350. unit_tests/sources/declarative/decoders/test_json_decoder.py +0 -16
  351. unit_tests/sources/declarative/external_component.py +0 -13
  352. unit_tests/sources/declarative/extractors/__init__.py +0 -3
  353. unit_tests/sources/declarative/extractors/test_dpath_extractor.py +0 -55
  354. unit_tests/sources/declarative/extractors/test_record_filter.py +0 -55
  355. unit_tests/sources/declarative/extractors/test_record_selector.py +0 -179
  356. unit_tests/sources/declarative/incremental/__init__.py +0 -0
  357. unit_tests/sources/declarative/incremental/test_datetime_based_cursor.py +0 -860
  358. unit_tests/sources/declarative/incremental/test_per_partition_cursor.py +0 -406
  359. unit_tests/sources/declarative/incremental/test_per_partition_cursor_integration.py +0 -332
  360. unit_tests/sources/declarative/interpolation/__init__.py +0 -3
  361. unit_tests/sources/declarative/interpolation/test_filters.py +0 -80
  362. unit_tests/sources/declarative/interpolation/test_interpolated_boolean.py +0 -40
  363. unit_tests/sources/declarative/interpolation/test_interpolated_mapping.py +0 -35
  364. unit_tests/sources/declarative/interpolation/test_interpolated_nested_mapping.py +0 -45
  365. unit_tests/sources/declarative/interpolation/test_interpolated_string.py +0 -25
  366. unit_tests/sources/declarative/interpolation/test_jinja.py +0 -240
  367. unit_tests/sources/declarative/interpolation/test_macros.py +0 -73
  368. unit_tests/sources/declarative/parsers/__init__.py +0 -3
  369. unit_tests/sources/declarative/parsers/test_manifest_component_transformer.py +0 -406
  370. unit_tests/sources/declarative/parsers/test_manifest_reference_resolver.py +0 -139
  371. unit_tests/sources/declarative/parsers/test_model_to_component_factory.py +0 -1841
  372. unit_tests/sources/declarative/parsers/testing_components.py +0 -36
  373. unit_tests/sources/declarative/partition_routers/__init__.py +0 -3
  374. unit_tests/sources/declarative/partition_routers/test_list_partition_router.py +0 -155
  375. unit_tests/sources/declarative/partition_routers/test_single_partition_router.py +0 -14
  376. unit_tests/sources/declarative/partition_routers/test_substream_partition_router.py +0 -404
  377. unit_tests/sources/declarative/requesters/__init__.py +0 -3
  378. unit_tests/sources/declarative/requesters/error_handlers/__init__.py +0 -3
  379. unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/__init__.py +0 -3
  380. unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/test_constant_backoff.py +0 -34
  381. unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/test_exponential_backoff.py +0 -36
  382. unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/test_header_helper.py +0 -38
  383. unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/test_wait_time_from_header.py +0 -35
  384. unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/test_wait_until_time_from_header.py +0 -64
  385. unit_tests/sources/declarative/requesters/error_handlers/test_composite_error_handler.py +0 -213
  386. unit_tests/sources/declarative/requesters/error_handlers/test_default_error_handler.py +0 -178
  387. unit_tests/sources/declarative/requesters/error_handlers/test_http_response_filter.py +0 -121
  388. unit_tests/sources/declarative/requesters/error_handlers/test_response_status.py +0 -44
  389. unit_tests/sources/declarative/requesters/paginators/__init__.py +0 -3
  390. unit_tests/sources/declarative/requesters/paginators/test_cursor_pagination_strategy.py +0 -64
  391. unit_tests/sources/declarative/requesters/paginators/test_default_paginator.py +0 -313
  392. unit_tests/sources/declarative/requesters/paginators/test_no_paginator.py +0 -12
  393. unit_tests/sources/declarative/requesters/paginators/test_offset_increment.py +0 -58
  394. unit_tests/sources/declarative/requesters/paginators/test_page_increment.py +0 -70
  395. unit_tests/sources/declarative/requesters/paginators/test_request_option.py +0 -43
  396. unit_tests/sources/declarative/requesters/paginators/test_stop_condition.py +0 -105
  397. unit_tests/sources/declarative/requesters/request_options/__init__.py +0 -3
  398. unit_tests/sources/declarative/requesters/request_options/test_interpolated_request_options_provider.py +0 -101
  399. unit_tests/sources/declarative/requesters/test_http_requester.py +0 -974
  400. unit_tests/sources/declarative/requesters/test_interpolated_request_input_provider.py +0 -32
  401. unit_tests/sources/declarative/retrievers/__init__.py +0 -3
  402. unit_tests/sources/declarative/retrievers/test_simple_retriever.py +0 -542
  403. unit_tests/sources/declarative/schema/__init__.py +0 -6
  404. unit_tests/sources/declarative/schema/source_test/SourceTest.py +0 -8
  405. unit_tests/sources/declarative/schema/source_test/__init__.py +0 -3
  406. unit_tests/sources/declarative/schema/test_default_schema_loader.py +0 -32
  407. unit_tests/sources/declarative/schema/test_inline_schema_loader.py +0 -19
  408. unit_tests/sources/declarative/schema/test_json_file_schema_loader.py +0 -26
  409. unit_tests/sources/declarative/states/__init__.py +0 -3
  410. unit_tests/sources/declarative/stream_slicers/__init__.py +0 -3
  411. unit_tests/sources/declarative/stream_slicers/test_cartesian_product_stream_slicer.py +0 -225
  412. unit_tests/sources/declarative/test_create_partial.py +0 -83
  413. unit_tests/sources/declarative/test_declarative_stream.py +0 -103
  414. unit_tests/sources/declarative/test_manifest_declarative_source.py +0 -1260
  415. unit_tests/sources/declarative/test_types.py +0 -39
  416. unit_tests/sources/declarative/test_yaml_declarative_source.py +0 -148
  417. unit_tests/sources/file_based/__init__.py +0 -0
  418. unit_tests/sources/file_based/availability_strategy/__init__.py +0 -0
  419. unit_tests/sources/file_based/availability_strategy/test_default_file_based_availability_strategy.py +0 -100
  420. unit_tests/sources/file_based/config/__init__.py +0 -0
  421. unit_tests/sources/file_based/config/test_abstract_file_based_spec.py +0 -28
  422. unit_tests/sources/file_based/config/test_csv_format.py +0 -34
  423. unit_tests/sources/file_based/config/test_file_based_stream_config.py +0 -84
  424. unit_tests/sources/file_based/discovery_policy/__init__.py +0 -0
  425. unit_tests/sources/file_based/discovery_policy/test_default_discovery_policy.py +0 -31
  426. unit_tests/sources/file_based/file_types/__init__.py +0 -0
  427. unit_tests/sources/file_based/file_types/test_avro_parser.py +0 -243
  428. unit_tests/sources/file_based/file_types/test_csv_parser.py +0 -546
  429. unit_tests/sources/file_based/file_types/test_jsonl_parser.py +0 -158
  430. unit_tests/sources/file_based/file_types/test_parquet_parser.py +0 -274
  431. unit_tests/sources/file_based/file_types/test_unstructured_parser.py +0 -593
  432. unit_tests/sources/file_based/helpers.py +0 -70
  433. unit_tests/sources/file_based/in_memory_files_source.py +0 -211
  434. unit_tests/sources/file_based/scenarios/__init__.py +0 -0
  435. unit_tests/sources/file_based/scenarios/avro_scenarios.py +0 -744
  436. unit_tests/sources/file_based/scenarios/check_scenarios.py +0 -220
  437. unit_tests/sources/file_based/scenarios/concurrent_incremental_scenarios.py +0 -2844
  438. unit_tests/sources/file_based/scenarios/csv_scenarios.py +0 -3105
  439. unit_tests/sources/file_based/scenarios/file_based_source_builder.py +0 -91
  440. unit_tests/sources/file_based/scenarios/incremental_scenarios.py +0 -1926
  441. unit_tests/sources/file_based/scenarios/jsonl_scenarios.py +0 -930
  442. unit_tests/sources/file_based/scenarios/parquet_scenarios.py +0 -754
  443. unit_tests/sources/file_based/scenarios/scenario_builder.py +0 -234
  444. unit_tests/sources/file_based/scenarios/unstructured_scenarios.py +0 -608
  445. unit_tests/sources/file_based/scenarios/user_input_schema_scenarios.py +0 -746
  446. unit_tests/sources/file_based/scenarios/validation_policy_scenarios.py +0 -726
  447. unit_tests/sources/file_based/stream/__init__.py +0 -0
  448. unit_tests/sources/file_based/stream/concurrent/__init__.py +0 -0
  449. unit_tests/sources/file_based/stream/concurrent/test_adapters.py +0 -362
  450. unit_tests/sources/file_based/stream/concurrent/test_file_based_concurrent_cursor.py +0 -458
  451. unit_tests/sources/file_based/stream/test_default_file_based_cursor.py +0 -310
  452. unit_tests/sources/file_based/stream/test_default_file_based_stream.py +0 -244
  453. unit_tests/sources/file_based/test_file_based_scenarios.py +0 -320
  454. unit_tests/sources/file_based/test_file_based_stream_reader.py +0 -272
  455. unit_tests/sources/file_based/test_scenarios.py +0 -253
  456. unit_tests/sources/file_based/test_schema_helpers.py +0 -346
  457. unit_tests/sources/fixtures/__init__.py +0 -3
  458. unit_tests/sources/fixtures/source_test_fixture.py +0 -153
  459. unit_tests/sources/message/__init__.py +0 -0
  460. unit_tests/sources/message/test_repository.py +0 -153
  461. unit_tests/sources/streams/__init__.py +0 -0
  462. unit_tests/sources/streams/concurrent/__init__.py +0 -3
  463. unit_tests/sources/streams/concurrent/scenarios/__init__.py +0 -3
  464. unit_tests/sources/streams/concurrent/scenarios/incremental_scenarios.py +0 -250
  465. unit_tests/sources/streams/concurrent/scenarios/stream_facade_builder.py +0 -140
  466. unit_tests/sources/streams/concurrent/scenarios/stream_facade_scenarios.py +0 -452
  467. unit_tests/sources/streams/concurrent/scenarios/test_concurrent_scenarios.py +0 -76
  468. unit_tests/sources/streams/concurrent/scenarios/thread_based_concurrent_stream_scenarios.py +0 -418
  469. unit_tests/sources/streams/concurrent/scenarios/thread_based_concurrent_stream_source_builder.py +0 -142
  470. unit_tests/sources/streams/concurrent/scenarios/utils.py +0 -55
  471. unit_tests/sources/streams/concurrent/test_adapters.py +0 -380
  472. unit_tests/sources/streams/concurrent/test_concurrent_read_processor.py +0 -684
  473. unit_tests/sources/streams/concurrent/test_cursor.py +0 -139
  474. unit_tests/sources/streams/concurrent/test_datetime_state_converter.py +0 -369
  475. unit_tests/sources/streams/concurrent/test_default_stream.py +0 -197
  476. unit_tests/sources/streams/concurrent/test_partition_enqueuer.py +0 -90
  477. unit_tests/sources/streams/concurrent/test_partition_reader.py +0 -67
  478. unit_tests/sources/streams/concurrent/test_thread_pool_manager.py +0 -106
  479. unit_tests/sources/streams/http/__init__.py +0 -0
  480. unit_tests/sources/streams/http/auth/__init__.py +0 -0
  481. unit_tests/sources/streams/http/auth/test_auth.py +0 -173
  482. unit_tests/sources/streams/http/requests_native_auth/__init__.py +0 -0
  483. unit_tests/sources/streams/http/requests_native_auth/test_requests_native_auth.py +0 -423
  484. unit_tests/sources/streams/http/test_availability_strategy.py +0 -180
  485. unit_tests/sources/streams/http/test_http.py +0 -635
  486. unit_tests/sources/streams/test_availability_strategy.py +0 -70
  487. unit_tests/sources/streams/test_call_rate.py +0 -300
  488. unit_tests/sources/streams/test_stream_read.py +0 -405
  489. unit_tests/sources/streams/test_streams_core.py +0 -184
  490. unit_tests/sources/test_abstract_source.py +0 -1442
  491. unit_tests/sources/test_concurrent_source.py +0 -112
  492. unit_tests/sources/test_config.py +0 -92
  493. unit_tests/sources/test_connector_state_manager.py +0 -482
  494. unit_tests/sources/test_http_logger.py +0 -252
  495. unit_tests/sources/test_integration_source.py +0 -86
  496. unit_tests/sources/test_source.py +0 -684
  497. unit_tests/sources/test_source_read.py +0 -460
  498. unit_tests/test/__init__.py +0 -0
  499. unit_tests/test/mock_http/__init__.py +0 -0
  500. unit_tests/test/mock_http/test_matcher.py +0 -53
  501. unit_tests/test/mock_http/test_mocker.py +0 -214
  502. unit_tests/test/mock_http/test_request.py +0 -117
  503. unit_tests/test/mock_http/test_response_builder.py +0 -177
  504. unit_tests/test/test_entrypoint_wrapper.py +0 -240
  505. unit_tests/utils/__init__.py +0 -0
  506. unit_tests/utils/test_datetime_format_inferrer.py +0 -60
  507. unit_tests/utils/test_mapping_helpers.py +0 -54
  508. unit_tests/utils/test_message_utils.py +0 -91
  509. unit_tests/utils/test_rate_limiting.py +0 -26
  510. unit_tests/utils/test_schema_inferrer.py +0 -202
  511. unit_tests/utils/test_secret_utils.py +0 -135
  512. unit_tests/utils/test_stream_status_utils.py +0 -61
  513. unit_tests/utils/test_traced_exception.py +0 -107
  514. /airbyte_cdk/sources/{deprecated → declarative/async_job}/__init__.py +0 -0
  515. {source_declarative_manifest → airbyte_cdk/sources/declarative/migrations}/__init__.py +0 -0
  516. {unit_tests/destinations → airbyte_cdk/sql}/__init__.py +0 -0
  517. {unit_tests/singer → airbyte_cdk/sql/_util}/__init__.py +0 -0
  518. {airbyte_cdk-0.72.0.dist-info → airbyte_cdk-6.17.1.dev0.dist-info}/LICENSE.txt +0 -0
@@ -7,8 +7,12 @@ version: 1.0.0
7
7
  required:
8
8
  - type
9
9
  - check
10
- - streams
11
10
  - version
11
+ anyOf:
12
+ - required:
13
+ - streams
14
+ - required:
15
+ - dynamic_streams
12
16
  properties:
13
17
  type:
14
18
  type: string
@@ -19,18 +23,28 @@ properties:
19
23
  type: array
20
24
  items:
21
25
  "$ref": "#/definitions/DeclarativeStream"
26
+ dynamic_streams:
27
+ type: array
28
+ items:
29
+ "$ref": "#/definitions/DynamicDeclarativeStream"
22
30
  version:
23
31
  type: string
32
+ description: The version of the Airbyte CDK used to build and test the source.
24
33
  schemas:
25
34
  "$ref": "#/definitions/Schemas"
26
35
  definitions:
27
36
  type: object
28
37
  spec:
29
38
  "$ref": "#/definitions/Spec"
39
+ concurrency_level:
40
+ "$ref": "#/definitions/ConcurrencyLevel"
30
41
  metadata:
31
42
  type: object
32
43
  description: For internal Airbyte use only - DO NOT modify manually. Used by consumers of declarative manifests for storing related metadata.
33
44
  additionalProperties: true
45
+ description:
46
+ type: string
47
+ description: A description of the connector. It will be presented on the Source documentation page.
34
48
  additionalProperties: false
35
49
  definitions:
36
50
  AddedFieldDefinition:
@@ -257,6 +271,7 @@ definitions:
257
271
  - "$ref": "#/definitions/BearerAuthenticator"
258
272
  - "$ref": "#/definitions/CustomAuthenticator"
259
273
  - "$ref": "#/definitions/OAuthAuthenticator"
274
+ - "$ref": "#/definitions/JwtAuthenticator"
260
275
  - "$ref": "#/definitions/NoAuth"
261
276
  - "$ref": "#/definitions/SessionTokenAuthenticator"
262
277
  - "$ref": "#/definitions/LegacySessionTokenAuthenticator"
@@ -264,6 +279,7 @@ definitions:
264
279
  - authenticators:
265
280
  token: "#/definitions/ApiKeyAuthenticator"
266
281
  oauth: "#/definitions/OAuthAuthenticator"
282
+ jwt: "#/definitions/JwtAuthenticator"
267
283
  $parameters:
268
284
  type: object
269
285
  additionalProperties: true
@@ -309,6 +325,37 @@ definitions:
309
325
  $parameters:
310
326
  type: object
311
327
  additionalProperties: true
328
+ ConcurrencyLevel:
329
+ title: Concurrency Level
330
+ description: Defines the amount of parallelization for the streams that are being synced. The factor of parallelization is how many partitions or streams are synced at the same time. For example, with a concurrency_level of 10, ten streams or partitions of data will processed at the same time. Note that a value of 1 could create deadlock if a stream has a very high number of partitions.
331
+ type: object
332
+ required:
333
+ - default_concurrency
334
+ properties:
335
+ type:
336
+ type: string
337
+ enum: [ConcurrencyLevel]
338
+ default_concurrency:
339
+ title: Default Concurrency
340
+ description: The amount of concurrency that will applied during a sync. This value can be hardcoded or user-defined in the config if different users have varying volume thresholds in the target API.
341
+ anyOf:
342
+ - type: integer
343
+ - type: string
344
+ interpolation_context:
345
+ - config
346
+ examples:
347
+ - 10
348
+ - "{{ config['num_workers'] or 10 }}"
349
+ max_concurrency:
350
+ title: Max Concurrency
351
+ description: The maximum level of concurrency that will be used during a sync. This becomes a required field when the default_concurrency derives from the config, because it serves as a safeguard against a user-defined threshold that is too high.
352
+ type: integer
353
+ examples:
354
+ - 20
355
+ - 100
356
+ $parameters:
357
+ type: object
358
+ additionalProperties: true
312
359
  ConstantBackoffStrategy:
313
360
  title: Constant Backoff
314
361
  description: Backoff strategy with a constant backoff interval.
@@ -353,11 +400,12 @@ definitions:
353
400
  interpolation_context:
354
401
  - config
355
402
  - headers
356
- - last_records
403
+ - last_page_size
404
+ - last_record
357
405
  - response
358
406
  examples:
359
407
  - "{{ headers.link.next.cursor }}"
360
- - "{{ last_records[-1]['key'] }}"
408
+ - "{{ last_record['key'] }}"
361
409
  - "{{ response['nextPage'] }}"
362
410
  page_size:
363
411
  title: Page Size
@@ -372,15 +420,11 @@ definitions:
372
420
  interpolation_context:
373
421
  - config
374
422
  - headers
375
- - last_records
423
+ - last_record
376
424
  - response
377
425
  examples:
378
426
  - "{{ response.data.has_more is false }}"
379
427
  - "{{ 'next' not in headers['link'] }}"
380
- decoder:
381
- title: Decoder
382
- description: Component decoding the response so records can be extracted.
383
- "$ref": "#/definitions/JsonDecoder"
384
428
  $parameters:
385
429
  type: object
386
430
  additionalProperties: true
@@ -623,6 +667,49 @@ definitions:
623
667
  $parameters:
624
668
  type: object
625
669
  additionalProperties: true
670
+ CustomSchemaNormalization:
671
+ title: Custom Schema Normalization
672
+ description: Schema normalization component whose behavior is derived from a custom code implementation of the connector.
673
+ type: object
674
+ additionalProperties: true
675
+ required:
676
+ - type
677
+ - class_name
678
+ properties:
679
+ type:
680
+ type: string
681
+ enum: [ CustomSchemaNormalization ]
682
+ class_name:
683
+ title: Class Name
684
+ description: Fully-qualified name of the class that will be implementing the custom normalization. The format is `source_<name>.<package>.<class_name>`.
685
+ type: string
686
+ additionalProperties: true
687
+ examples:
688
+ - "source_amazon_seller_partner.components.LedgerDetailedViewReportsTypeTransformer"
689
+ $parameters:
690
+ type: object
691
+ additionalProperties: true
692
+ CustomStateMigration:
693
+ title: Custom State Migration
694
+ description: Apply a custom transformation on the input state.
695
+ type: object
696
+ additionalProperties: true
697
+ required:
698
+ - type
699
+ - class_name
700
+ properties:
701
+ type:
702
+ type: string
703
+ enum: [CustomStateMigration]
704
+ class_name:
705
+ title: Class Name
706
+ description: Fully-qualified name of the class that will be implementing the custom state migration. The format is `source_<name>.<package>.<class_name>`.
707
+ type: string
708
+ examples:
709
+ - "source_railz.components.MyCustomStateMigration"
710
+ $parameters:
711
+ type: object
712
+ additionalProperties: true
626
713
  CustomTransformation:
627
714
  title: Custom Transformation
628
715
  description: Transformation component whose behavior is derived from a custom code implementation of the connector.
@@ -644,6 +731,29 @@ definitions:
644
731
  $parameters:
645
732
  type: object
646
733
  additionalProperties: true
734
+ LegacyToPerPartitionStateMigration:
735
+ title: Legacy To Per-partition-state Migration
736
+ description:
737
+ 'Transforms the input state for per-partitioned streams from the legacy format to the low-code format.
738
+ The cursor field and partition ID fields are automatically extracted from the stream''s DatetimebasedCursor and SubstreamPartitionRouter.
739
+
740
+ Example input state:
741
+ {
742
+ "13506132": {
743
+ "last_changed": "2022-12-27T08:34:39+00:00"
744
+ }
745
+ Example output state:
746
+ {
747
+ "partition": {"id": "13506132"},
748
+ "cursor": {"last_changed": "2022-12-27T08:34:39+00:00"}
749
+ }
750
+ '
751
+ type: object
752
+ additionalProperties: true
753
+ properties:
754
+ type:
755
+ type: string
756
+ enum: [LegacyToPerPartitionStateMigration]
647
757
  DatetimeBasedCursor:
648
758
  title: Datetime Based Cursor
649
759
  description: Cursor to provide incremental capabilities over datetime.
@@ -671,6 +781,7 @@ definitions:
671
781
  description: |
672
782
  The datetime format used to format the datetime values that are sent in outgoing requests to the API. Use placeholders starting with "%" to describe the format the API is using. The following placeholders are available:
673
783
  * **%s**: Epoch unix timestamp - `1686218963`
784
+ * **%s_as_float**: Epoch unix timestamp in seconds as float with microsecond precision - `1686218963.123456`
674
785
  * **%ms**: Epoch unix timestamp (milliseconds) - `1686218963123`
675
786
  * **%a**: Weekday (abbreviated) - `Sun`
676
787
  * **%A**: Weekday (full) - `Sunday`
@@ -704,6 +815,7 @@ definitions:
704
815
  - "%Y-%m-%d"
705
816
  - "%s"
706
817
  - "%ms"
818
+ - "%s_as_float"
707
819
  start_datetime:
708
820
  title: Start Datetime
709
821
  description: The datetime that determines the earliest record that should be synced.
@@ -753,6 +865,20 @@ definitions:
753
865
  title: Whether the target API is formatted as a data feed
754
866
  description: A data feed API is an API that does not allow filtering and paginates the content from the most recent to the least recent. Given this, the CDK needs to know when to stop paginating and this field will generate a stop condition for pagination.
755
867
  type: boolean
868
+ is_client_side_incremental:
869
+ title: Whether the target API does not support filtering and returns all data (the cursor filters records in the client instead of the API side)
870
+ description: If the target API endpoint does not take cursor values to filter records and returns all records anyway, the connector with this cursor will filter out records locally, and only emit new records from the last sync, hence incremental. This means that all records would be read from the API, but only new records will be emitted to the destination.
871
+ type: boolean
872
+ is_compare_strictly:
873
+ title: Whether to skip requests if the start time equals the end time
874
+ description: Set to True if the target API does not accept queries where the start time equal the end time.
875
+ type: boolean
876
+ default: False
877
+ global_substream_cursor:
878
+ title: Whether to store cursor as one value instead of per partition
879
+ description: This setting optimizes performance when the parent stream has thousands of partitions by storing the cursor as a single value rather than per partition. Notably, the substream state is updated only at the end of the sync, which helps prevent data loss in case of a sync failure. See more info in the [docs](https://docs.airbyte.com/connector-development/config-based/understanding-the-yaml-file/incremental-syncs).
880
+ type: boolean
881
+ default: false
756
882
  lookback_window:
757
883
  title: Lookback Window
758
884
  description: Time interval before the start_datetime to read data for, e.g. P1M for looking back one month.
@@ -788,6 +914,127 @@ definitions:
788
914
  $parameters:
789
915
  type: object
790
916
  additionalProperties: true
917
+ JwtAuthenticator:
918
+ title: JWT Authenticator
919
+ description: Authenticator for requests using JWT authentication flow.
920
+ type: object
921
+ required:
922
+ - type
923
+ - secret_key
924
+ - algorithm
925
+ properties:
926
+ type:
927
+ type: string
928
+ enum: [JwtAuthenticator]
929
+ secret_key:
930
+ type: string
931
+ description: Secret used to sign the JSON web token.
932
+ examples:
933
+ - "{{ config['secret_key'] }}"
934
+ base64_encode_secret_key:
935
+ type: boolean
936
+ description: When set to true, the secret key will be base64 encoded prior to being encoded as part of the JWT. Only set to "true" when required by the API.
937
+ default: False
938
+ algorithm:
939
+ type: string
940
+ description: Algorithm used to sign the JSON web token.
941
+ enum:
942
+ [
943
+ "HS256",
944
+ "HS384",
945
+ "HS512",
946
+ "ES256",
947
+ "ES256K",
948
+ "ES384",
949
+ "ES512",
950
+ "RS256",
951
+ "RS384",
952
+ "RS512",
953
+ "PS256",
954
+ "PS384",
955
+ "PS512",
956
+ "EdDSA",
957
+ ]
958
+ examples:
959
+ - ES256
960
+ - HS256
961
+ - RS256
962
+ - "{{ config['algorithm'] }}"
963
+ token_duration:
964
+ type: integer
965
+ title: Token Duration
966
+ description: The amount of time in seconds a JWT token can be valid after being issued.
967
+ default: 1200
968
+ examples:
969
+ - 1200
970
+ - 3600
971
+ header_prefix:
972
+ type: string
973
+ title: Header Prefix
974
+ description: The prefix to be used within the Authentication header.
975
+ examples:
976
+ - "Bearer"
977
+ - "Basic"
978
+ jwt_headers:
979
+ type: object
980
+ title: JWT Headers
981
+ description: JWT headers used when signing JSON web token.
982
+ additionalProperties: false
983
+ properties:
984
+ kid:
985
+ type: string
986
+ title: Key Identifier
987
+ description: Private key ID for user account.
988
+ examples:
989
+ - "{{ config['kid'] }}"
990
+ typ:
991
+ type: string
992
+ title: Type
993
+ description: The media type of the complete JWT.
994
+ default: JWT
995
+ examples:
996
+ - JWT
997
+ cty:
998
+ type: string
999
+ title: Content Type
1000
+ description: Content type of JWT header.
1001
+ examples:
1002
+ - JWT
1003
+ additional_jwt_headers:
1004
+ type: object
1005
+ title: Additional JWT Headers
1006
+ description: Additional headers to be included with the JWT headers object.
1007
+ additionalProperties: true
1008
+ jwt_payload:
1009
+ type: object
1010
+ title: JWT Payload
1011
+ description: JWT Payload used when signing JSON web token.
1012
+ additionalProperties: false
1013
+ properties:
1014
+ iss:
1015
+ type: string
1016
+ title: Issuer
1017
+ description: The user/principal that issued the JWT. Commonly a value unique to the user.
1018
+ examples:
1019
+ - "{{ config['iss'] }}"
1020
+ sub:
1021
+ type: string
1022
+ title: Subject
1023
+ description: The subject of the JWT. Commonly defined by the API.
1024
+ aud:
1025
+ type: string
1026
+ title: Audience
1027
+ description: The recipient that the JWT is intended for. Commonly defined by the API.
1028
+ examples:
1029
+ - "appstoreconnect-v1"
1030
+ additional_jwt_payload:
1031
+ type: object
1032
+ title: Additional JWT Payload Properties
1033
+ description: Additional properties to be added to the JWT payload.
1034
+ additionalProperties: true
1035
+ $parameters:
1036
+ type: object
1037
+ additionalProperties: true
791
1038
  OAuthAuthenticator:
792
1039
  title: OAuth2
793
1040
  description: Authenticator for requests using OAuth 2.0 authorization flow.
@@ -796,7 +1043,6 @@ definitions:
796
1043
  - type
797
1044
  - client_id
798
1045
  - client_secret
799
- - token_refresh_endpoint
800
1046
  properties:
801
1047
  type:
802
1048
  type: string
@@ -835,6 +1081,12 @@ definitions:
835
1081
  default: "access_token"
836
1082
  examples:
837
1083
  - access_token
1084
+ access_token_value:
1085
+ title: Access Token Value
1086
+ description: The value of the access_token to bypass the token refreshing using `refresh_token`.
1087
+ type: string
1088
+ examples:
1089
+ - secret_access_token_value
838
1090
  expires_in_name:
839
1091
  title: Token Expiry Property Name
840
1092
  description: The name of the property which contains the expiry date in the response from the token refresh endpoint.
@@ -924,6 +1176,31 @@ definitions:
924
1176
  default: ["credentials", "token_expiry_date"]
925
1177
  examples:
926
1178
  - ["credentials", "token_expiry_date"]
1179
+ refresh_token_error_status_codes:
1180
+ title: Refresh Token Error Status Codes
1181
+ description: Status Codes to Identify refresh token error in response (Refresh Token Error Key and Refresh Token Error Values should be also specified). Responses with one of the error status code and containing an error value will be flagged as a config error
1182
+ type: array
1183
+ items:
1184
+ type: integer
1185
+ default: []
1186
+ examples:
1187
+ - [400, 500]
1188
+ refresh_token_error_key:
1189
+ title: Refresh Token Error Key
1190
+ description: Key to Identify refresh token error in response (Refresh Token Error Status Codes and Refresh Token Error Values should be also specified).
1191
+ type: string
1192
+ default: ""
1193
+ examples:
1194
+ - "error"
1195
+ refresh_token_error_values:
1196
+ title: Refresh Token Error Values
1197
+ description: 'List of values to check for exception during token refresh process. Used to check if the error found in the response matches the key from the Refresh Token Error Key field (e.g. response={"error": "invalid_grant"}). Only responses with one of the error status code and containing an error value will be flagged as a config error'
1198
+ type: array
1199
+ items:
1200
+ type: string
1201
+ default: []
1202
+ examples:
1203
+ - ["invalid_grant", "invalid_permissions"]
927
1204
  $parameters:
928
1205
  type: object
929
1206
  additionalProperties: true
@@ -943,6 +1220,7 @@ definitions:
943
1220
  title: Retriever
944
1221
  description: Component used to coordinate how records are extracted across stream slices and request pages.
945
1222
  anyOf:
1223
+ - "$ref": "#/definitions/AsyncRetriever"
946
1224
  - "$ref": "#/definitions/CustomRetriever"
947
1225
  - "$ref": "#/definitions/SimpleRetriever"
948
1226
  incremental_sync:
@@ -967,6 +1245,7 @@ definitions:
967
1245
  title: Schema Loader
968
1246
  description: Component used to retrieve the schema for the current stream.
969
1247
  anyOf:
1248
+ - "$ref": "#/definitions/DynamicSchemaLoader"
970
1249
  - "$ref": "#/definitions/InlineSchemaLoader"
971
1250
  - "$ref": "#/definitions/JsonFileSchemaLoader"
972
1251
  - "$ref": "#/definitions/CustomSchemaLoader"
@@ -981,6 +1260,19 @@ definitions:
981
1260
  - "$ref": "#/definitions/AddFields"
982
1261
  - "$ref": "#/definitions/CustomTransformation"
983
1262
  - "$ref": "#/definitions/RemoveFields"
1263
+ - "$ref": "#/definitions/KeysToLower"
1264
+ - "$ref": "#/definitions/KeysToSnakeCase"
1265
+ - "$ref": "#/definitions/FlattenFields"
1266
+ - "$ref": "#/definitions/KeysReplace"
1267
+ state_migrations:
1268
+ title: State Migrations
1269
+ description: Array of state migrations to be applied on the input state
1270
+ type: array
1271
+ items:
1272
+ anyOf:
1273
+ - "$ref": "#/definitions/LegacyToPerPartitionStateMigration"
1274
+ - "$ref": "#/definitions/CustomStateMigration"
1275
+ default: []
984
1276
  $parameters:
985
1277
  type: object
986
1278
  additional_properties: true
@@ -1042,10 +1334,6 @@ definitions:
1042
1334
  - "$ref": "#/definitions/CustomPaginationStrategy"
1043
1335
  - "$ref": "#/definitions/OffsetIncrement"
1044
1336
  - "$ref": "#/definitions/PageIncrement"
1045
- decoder:
1046
- title: Decoder
1047
- description: Component decoding the response so records can be extracted.
1048
- "$ref": "#/definitions/JsonDecoder"
1049
1337
  page_size_option:
1050
1338
  "$ref": "#/definitions/RequestOption"
1051
1339
  page_token_option:
@@ -1072,17 +1360,26 @@ definitions:
1072
1360
  type: array
1073
1361
  items:
1074
1362
  - type: string
1075
- interpolation_content:
1363
+ interpolation_context:
1076
1364
  - config
1077
1365
  examples:
1078
1366
  - ["data"]
1079
1367
  - ["data", "records"]
1080
1368
  - ["data", "{{ parameters.name }}"]
1081
1369
  - ["data", "*", "record"]
1082
- decoder:
1083
- title: Decoder
1084
- description: Component decoding the response so records can be extracted.
1085
- "$ref": "#/definitions/JsonDecoder"
1370
+ $parameters:
1371
+ type: object
1372
+ additionalProperties: true
1373
+ ResponseToFileExtractor:
1374
+ title: CSV To File Extractor
1375
+ description: A record extractor designed for handling large responses that may exceed memory limits (to prevent OOM issues). It downloads a CSV file to disk, reads the data from disk, and deletes the file once it has been fully processed.
1376
+ type: object
1377
+ required:
1378
+ - type
1379
+ properties:
1380
+ type:
1381
+ type: string
1382
+ enum: [ResponseToFileExtractor]
1086
1383
  $parameters:
1087
1384
  type: object
1088
1385
  additionalProperties: true
@@ -1157,6 +1454,12 @@ definitions:
1157
1454
  anyOf:
1158
1455
  - "$ref": "#/definitions/SessionTokenRequestApiKeyAuthenticator"
1159
1456
  - "$ref": "#/definitions/SessionTokenRequestBearerAuthenticator"
1457
+ decoder:
1458
+ title: Decoder
1459
+ description: Component used to decode the response.
1460
+ anyOf:
1461
+ - "$ref": "#/definitions/JsonDecoder"
1462
+ - "$ref": "#/definitions/XmlDecoder"
1160
1463
  $parameters:
1161
1464
  type: object
1162
1465
  additionalProperties: true
@@ -1232,6 +1535,7 @@ definitions:
1232
1535
  - "$ref": "#/definitions/BearerAuthenticator"
1233
1536
  - "$ref": "#/definitions/CustomAuthenticator"
1234
1537
  - "$ref": "#/definitions/OAuthAuthenticator"
1538
+ - "$ref": "#/definitions/JwtAuthenticator"
1235
1539
  - "$ref": "#/definitions/NoAuth"
1236
1540
  - "$ref": "#/definitions/SessionTokenAuthenticator"
1237
1541
  - "$ref": "#/definitions/LegacySessionTokenAuthenticator"
@@ -1342,7 +1646,6 @@ definitions:
1342
1646
  type: object
1343
1647
  required:
1344
1648
  - type
1345
- - action
1346
1649
  properties:
1347
1650
  type:
1348
1651
  type: string
@@ -1356,11 +1659,25 @@ definitions:
1356
1659
  - FAIL
1357
1660
  - RETRY
1358
1661
  - IGNORE
1662
+ - RATE_LIMITED
1359
1663
  examples:
1360
1664
  - SUCCESS
1361
1665
  - FAIL
1362
1666
  - RETRY
1363
1667
  - IGNORE
1668
+ - RATE_LIMITED
1669
+ failure_type:
1670
+ title: Failure Type
1671
+ description: Failure type of traced exception if a response matches the filter.
1672
+ type: string
1673
+ enum:
1674
+ - system_error
1675
+ - config_error
1676
+ - transient_error
1677
+ examples:
1678
+ - system_error
1679
+ - config_error
1680
+ - transient_error
1364
1681
  error_message:
1365
1682
  title: Error Message
1366
1683
  description: Error Message to display if the response matches the filter.
@@ -1398,6 +1715,105 @@ definitions:
1398
1715
  $parameters:
1399
1716
  type: object
1400
1717
  additionalProperties: true
1718
+ TypesMap:
1719
+ title: Types Map
1720
+ description: (This component is experimental. Use at your own risk.) Represents a mapping between a current type and its corresponding target type.
1721
+ type: object
1722
+ required:
1723
+ - target_type
1724
+ - current_type
1725
+ properties:
1726
+ target_type:
1727
+ anyOf:
1728
+ - type: string
1729
+ - type: array
1730
+ items:
1731
+ type: string
1732
+ current_type:
1733
+ anyOf:
1734
+ - type: string
1735
+ - type: array
1736
+ items:
1737
+ type: string
1738
+ SchemaTypeIdentifier:
1739
+ title: Schema Type Identifier
1740
+ description: (This component is experimental. Use at your own risk.) Identifies schema details for dynamic schema extraction and processing.
1741
+ type: object
1742
+ required:
1743
+ - key_pointer
1744
+ properties:
1745
+ type:
1746
+ type: string
1747
+ enum: [SchemaTypeIdentifier]
1748
+ schema_pointer:
1749
+ title: Schema Path
1750
+ description: List of nested fields defining the schema field path to extract. Defaults to [].
1751
+ type: array
1752
+ default: []
1753
+ items:
1754
+ - type: string
1755
+ interpolation_context:
1756
+ - config
1757
+ key_pointer:
1758
+ title: Key Path
1759
+ description: List of potentially nested fields describing the full path of the field key to extract.
1760
+ type: array
1761
+ items:
1762
+ - type: string
1763
+ interpolation_context:
1764
+ - config
1765
+ type_pointer:
1766
+ title: Type Path
1767
+ description: List of potentially nested fields describing the full path of the field type to extract.
1768
+ type: array
1769
+ items:
1770
+ - type: string
1771
+ interpolation_context:
1772
+ - config
1773
+ types_mapping:
1774
+ type: array
1775
+ items:
1776
+ - "$ref": "#/definitions/TypesMap"
1777
+ $parameters:
1778
+ type: object
1779
+ additionalProperties: true
1780
+ DynamicSchemaLoader:
1781
+ title: Dynamic Schema Loader
1782
+ description: (This component is experimental. Use at your own risk.) Loads a schema by extracting data from retrieved records.
1783
+ type: object
1784
+ required:
1785
+ - type
1786
+ - retriever
1787
+ - schema_type_identifier
1788
+ properties:
1789
+ type:
1790
+ type: string
1791
+ enum: [DynamicSchemaLoader]
1792
+ retriever:
1793
+ title: Retriever
1794
+ description: Component used to coordinate how records are extracted across stream slices and request pages.
1795
+ anyOf:
1796
+ - "$ref": "#/definitions/AsyncRetriever"
1797
+ - "$ref": "#/definitions/CustomRetriever"
1798
+ - "$ref": "#/definitions/SimpleRetriever"
1799
+ schema_transformations:
1800
+ title: Schema Transformations
1801
+ description: A list of transformations to be applied to the schema.
1802
+ type: array
1803
+ items:
1804
+ anyOf:
1805
+ - "$ref": "#/definitions/AddFields"
1806
+ - "$ref": "#/definitions/CustomTransformation"
1807
+ - "$ref": "#/definitions/RemoveFields"
1808
+ - "$ref": "#/definitions/KeysToLower"
1809
+ - "$ref": "#/definitions/KeysToSnakeCase"
1810
+ - "$ref": "#/definitions/FlattenFields"
1811
+ - "$ref": "#/definitions/KeysReplace"
1812
+ schema_type_identifier:
1813
+ "$ref": "#/definitions/SchemaTypeIdentifier"
1814
+ $parameters:
1815
+ type: object
1816
+ additionalProperties: true
1401
1817
  InlineSchemaLoader:
1402
1818
  title: Inline Schema Loader
1403
1819
  description: Loads a schema that is defined directly in the manifest file.
@@ -1442,66 +1858,222 @@ definitions:
1442
1858
  type:
1443
1859
  type: string
1444
1860
  enum: [JsonDecoder]
1445
- ListPartitionRouter:
1446
- title: List Partition Router
1447
- description: A Partition router that specifies a list of attributes where each attribute describes a portion of the complete data set for a stream. During a sync, each value is iterated over and can be used as input to outbound API requests.
1861
+ JsonlDecoder:
1862
+ title: JSONL Decoder
1863
+ description: Use this if the response consists of JSON objects separated by new lines (`\n`) in JSONL format.
1448
1864
  type: object
1449
1865
  required:
1450
1866
  - type
1451
- - cursor_field
1452
- - values
1453
1867
  properties:
1454
1868
  type:
1455
1869
  type: string
1456
- enum: [ListPartitionRouter]
1457
- cursor_field:
1458
- title: Current Partition Value Identifier
1459
- description: While iterating over list values, the name of field used to reference a list value. The partition value can be accessed with string interpolation. e.g. "{{ stream_partition['my_key'] }}" where "my_key" is the value of the cursor_field.
1870
+ enum: [JsonlDecoder]
1871
+ KeysToLower:
1872
+ title: Keys to Lower Case
1873
+ description: A transformation that renames all keys to lower case.
1874
+ type: object
1875
+ required:
1876
+ - type
1877
+ properties:
1878
+ type:
1460
1879
  type: string
1461
- interpolation_context:
1462
- - config
1463
- examples:
1464
- - "section"
1465
- - "{{ config['section_key'] }}"
1466
- values:
1467
- title: Partition Values
1468
- description: The list of attributes being iterated over and used as input for the requests made to the source API.
1469
- anyOf:
1470
- - type: string
1471
- - type: array
1472
- items:
1473
- type: string
1474
- interpolation_context:
1475
- - config
1476
- examples:
1477
- - ["section_a", "section_b", "section_c"]
1478
- - "{{ config['sections'] }}"
1479
- request_option:
1480
- title: Inject Partition Value Into Outgoing HTTP Request
1481
- description: A request option describing where the list value should be injected into and under what field name if applicable.
1482
- "$ref": "#/definitions/RequestOption"
1880
+ enum: [KeysToLower]
1483
1881
  $parameters:
1484
1882
  type: object
1485
1883
  additionalProperties: true
1486
- MinMaxDatetime:
1487
- title: Min-Max Datetime
1488
- description: Compares the provided date against optional minimum or maximum times. The max_datetime serves as the ceiling and will be returned when datetime exceeds it. The min_datetime serves as the floor.
1884
+ KeysToSnakeCase:
1885
+ title: Key to Snake Case
1886
+ description: A transformation that renames all keys to snake case.
1489
1887
  type: object
1490
1888
  required:
1491
1889
  - type
1492
- - datetime
1493
1890
  properties:
1494
1891
  type:
1495
1892
  type: string
1496
- enum: [MinMaxDatetime]
1497
- datetime:
1498
- title: Datetime
1499
- description: Datetime value.
1893
+ enum: [KeysToSnakeCase]
1894
+ $parameters:
1895
+ type: object
1896
+ additionalProperties: true
1897
+ FlattenFields:
1898
+ title: Flatten Fields
1899
+ description: A transformation that flatten record to single level format.
1900
+ type: object
1901
+ required:
1902
+ - type
1903
+ properties:
1904
+ type:
1500
1905
  type: string
1501
- interpolation_context:
1502
- - config
1503
- examples:
1504
- - 2021-01-01
1906
+ enum: [FlattenFields]
1907
+ flatten_lists:
1908
+ title: Flatten Lists
1909
+ description: Whether to flatten lists or leave it as is. Default is True.
1910
+ type: boolean
1911
+ default: true
1912
+ $parameters:
1913
+ type: object
1914
+ additionalProperties: true
1915
+ KeysReplace:
1916
+ title: Keys Replace
1917
+ description: A transformation that replaces symbols in keys.
1918
+ type: object
1919
+ required:
1920
+ - type
1921
+ - old
1922
+ - new
1923
+ properties:
1924
+ type:
1925
+ type: string
1926
+ enum: [KeysReplace]
1927
+ old:
1928
+ type: string
1929
+ title: Old value
1930
+ description: Old value to replace.
1931
+ examples:
1932
+ - " "
1933
+ - "{{ record.id }}"
1934
+ - "{{ config['id'] }}"
1935
+ - "{{ stream_slice['id'] }}"
1936
+ interpolation_context:
1937
+ - config
1938
+ - record
1939
+ - stream_state
1940
+ - stream_slice
1941
+ new:
1942
+ type: string
1943
+ title: New value
1944
+ description: New value to set.
1945
+ examples:
1946
+ - "_"
1947
+ - "{{ record.id }}"
1948
+ - "{{ config['id'] }}"
1949
+ - "{{ stream_slice['id'] }}"
1950
+ interpolation_context:
1951
+ - config
1952
+ - record
1953
+ - stream_state
1954
+ - stream_slice
1955
+ $parameters:
1956
+ type: object
1957
+ additionalProperties: true
1958
+ IterableDecoder:
1959
+ title: Iterable Decoder
1960
+ description: Use this if the response consists of strings separated by new lines (`\n`). The Decoder will wrap each row into a JSON object with the `record` key.
1961
+ type: object
1962
+ required:
1963
+ - type
1964
+ properties:
1965
+ type:
1966
+ type: string
1967
+ enum: [IterableDecoder]
1968
+ XmlDecoder:
1969
+ title: XML Decoder
1970
+ description: Use this if the response is XML.
1971
+ type: object
1972
+ required:
1973
+ - type
1974
+ properties:
1975
+ type:
1976
+ type: string
1977
+ enum: [XmlDecoder]
1978
+ CustomDecoder:
1979
+ title: Custom Decoder
1980
+ description: Use this to implement custom decoder logic.
1981
+ type: object
1982
+ additionalProperties: true
1983
+ required:
1984
+ - type
1985
+ - class_name
1986
+ properties:
1987
+ type:
1988
+ type: string
1989
+ enum: [CustomDecoder]
1990
+ class_name:
1991
+ title: Class Name
1992
+ description: Fully-qualified name of the class that will be implementing the custom decoding. Has to be a sub class of Decoder. The format is `source_<name>.<package>.<class_name>`.
1993
+ type: string
1994
+ additionalProperties: true
1995
+ examples:
1996
+ - "source_amazon_ads.components.GzipJsonlDecoder"
1997
+ $parameters:
1998
+ type: object
1999
+ additionalProperties: true
2000
+ GzipJsonDecoder:
2001
+ title: GzipJson Decoder
2002
+ description: Use this if the response is Gzip compressed Json.
2003
+ type: object
2004
+ additionalProperties: true
2005
+ required:
2006
+ - type
2007
+ properties:
2008
+ type:
2009
+ type: string
2010
+ enum: [GzipJsonDecoder]
2011
+ encoding:
2012
+ type: string
2013
+ default: utf-8
2014
+ $parameters:
2015
+ type: object
2016
+ additionalProperties: true
2017
+ ListPartitionRouter:
2018
+ title: List Partition Router
2019
+ description: A Partition router that specifies a list of attributes where each attribute describes a portion of the complete data set for a stream. During a sync, each value is iterated over and can be used as input to outbound API requests.
2020
+ type: object
2021
+ required:
2022
+ - type
2023
+ - cursor_field
2024
+ - values
2025
+ properties:
2026
+ type:
2027
+ type: string
2028
+ enum: [ListPartitionRouter]
2029
+ cursor_field:
2030
+ title: Current Partition Value Identifier
2031
+ description: While iterating over list values, the name of field used to reference a list value. The partition value can be accessed with string interpolation. e.g. "{{ stream_partition['my_key'] }}" where "my_key" is the value of the cursor_field.
2032
+ type: string
2033
+ interpolation_context:
2034
+ - config
2035
+ examples:
2036
+ - "section"
2037
+ - "{{ config['section_key'] }}"
2038
+ values:
2039
+ title: Partition Values
2040
+ description: The list of attributes being iterated over and used as input for the requests made to the source API.
2041
+ anyOf:
2042
+ - type: string
2043
+ - type: array
2044
+ items:
2045
+ type: string
2046
+ interpolation_context:
2047
+ - config
2048
+ examples:
2049
+ - ["section_a", "section_b", "section_c"]
2050
+ - "{{ config['sections'] }}"
2051
+ request_option:
2052
+ title: Inject Partition Value Into Outgoing HTTP Request
2053
+ description: A request option describing where the list value should be injected into and under what field name if applicable.
2054
+ "$ref": "#/definitions/RequestOption"
2055
+ $parameters:
2056
+ type: object
2057
+ additionalProperties: true
2058
+ MinMaxDatetime:
2059
+ title: Min-Max Datetime
2060
+ description: Compares the provided date against optional minimum or maximum times. The max_datetime serves as the ceiling and will be returned when datetime exceeds it. The min_datetime serves as the floor.
2061
+ type: object
2062
+ required:
2063
+ - type
2064
+ - datetime
2065
+ properties:
2066
+ type:
2067
+ type: string
2068
+ enum: [MinMaxDatetime]
2069
+ datetime:
2070
+ title: Datetime
2071
+ description: Datetime value.
2072
+ type: string
2073
+ interpolation_context:
2074
+ - config
2075
+ examples:
2076
+ - 2021-01-01
1505
2077
  - 2021-01-01T00:00:00Z
1506
2078
  - "{{ config['start_time'] }}"
1507
2079
  datetime_format:
@@ -1509,6 +2081,7 @@ definitions:
1509
2081
  description: |
1510
2082
  Format of the datetime value. Defaults to "%Y-%m-%dT%H:%M:%S.%f%z" if left empty. Use placeholders starting with "%" to describe the format the API is using. The following placeholders are available:
1511
2083
  * **%s**: Epoch unix timestamp - `1686218963`
2084
+ * **%s_as_float**: Epoch unix timestamp in seconds as float with microsecond precision - `1686218963.123456`
1512
2085
  * **%ms**: Epoch unix timestamp - `1686218963123`
1513
2086
  * **%a**: Weekday (abbreviated) - `Sun`
1514
2087
  * **%A**: Weekday (full) - `Sunday`
@@ -1624,6 +2197,170 @@ definitions:
1624
2197
  - app_id:
1625
2198
  type: string
1626
2199
  path_in_connector_config: ["info", "app_id"]
2200
+ oauth_connector_input_specification:
2201
+ title: DeclarativeOAuth Connector Specification
2202
+ description: |-
2203
+ The DeclarativeOAuth specific blob.
2204
+ Pertains to the fields defined by the connector relating to the OAuth flow.
2205
+
2206
+ Interpolation capabilities:
2207
+ - The variables placeholders are declared as `{my_var}`.
2208
+ - The nested resolution variables like `{{my_nested_var}}` is allowed as well.
2209
+
2210
+ - The allowed interpolation context is:
2211
+ + base64Encoder - encode to `base64`, {base64Encoder:{my_var_a}:{my_var_b}}
2212
+ + base64Decorer - decode from `base64` encoded string, {base64Decoder:{my_string_variable_or_string_value}}
2213
+ + urlEncoder - encode the input string to URL-like format, {urlEncoder:https://test.host.com/endpoint}
2214
+ + urlDecorer - decode the input url-encoded string into text format, {urlDecoder:https%3A%2F%2Fairbyte.io}
2215
+ + codeChallengeS256 - get the `codeChallenge` encoded value to provide additional data-provider specific authorisation values, {codeChallengeS256:{state_value}}
2216
+
2217
+ Examples:
2218
+ - The TikTok Marketing DeclarativeOAuth spec:
2219
+ {
2220
+ "oauth_connector_input_specification": {
2221
+ "type": "object",
2222
+ "additionalProperties": false,
2223
+ "properties": {
2224
+ "consent_url": "https://ads.tiktok.com/marketing_api/auth?{client_id_key}={{client_id_key}}&{redirect_uri_key}={urlEncoder:{{redirect_uri_key}}}&{state_key}={{state_key}}",
2225
+ "access_token_url": "https://business-api.tiktok.com/open_api/v1.3/oauth2/access_token/",
2226
+ "access_token_params": {
2227
+ "{auth_code_key}": "{{auth_code_key}}",
2228
+ "{client_id_key}": "{{client_id_key}}",
2229
+ "{client_secret_key}": "{{client_secret_key}}"
2230
+ },
2231
+ "access_token_headers": {
2232
+ "Content-Type": "application/json",
2233
+ "Accept": "application/json"
2234
+ },
2235
+ "extract_output": ["data.access_token"],
2236
+ "client_id_key": "app_id",
2237
+ "client_secret_key": "secret",
2238
+ "auth_code_key": "auth_code"
2239
+ }
2240
+ }
2241
+ }
2242
+ type: object
2243
+ additionalProperties: true
2244
+ required:
2245
+ - consent_url
2246
+ - access_token_url
2247
+ - extract_output
2248
+ properties:
2249
+ consent_url:
2250
+ title: Consent URL
2251
+ type: string
2252
+ description: |-
2253
+ The DeclarativeOAuth Specific string URL string template to initiate the authentication.
2254
+ The placeholders are replaced during the processing to provide neccessary values.
2255
+ examples:
2256
+ - https://domain.host.com/marketing_api/auth?{client_id_key}={{client_id_key}}&{redirect_uri_key}={urlEncoder:{{redirect_uri_key}}}&{state_key}={{state_key}}
2257
+ - https://endpoint.host.com/oauth2/authorize?{client_id_key}={{client_id_key}}&{redirect_uri_key}={urlEncoder:{{redirect_uri_key}}}&{scope_key}={urlEncoder:{{scope_key}}}&{state_key}={{state_key}}&subdomain={subdomain}
2258
+ scope:
2259
+ title: Scopes
2260
+ type: string
2261
+ description: |-
2262
+ The DeclarativeOAuth Specific string of the scopes needed to be grant for authenticated user.
2263
+ examples:
2264
+ - user:read user:read_orders workspaces:read
2265
+ access_token_url:
2266
+ title: Access Token URL
2267
+ type: string
2268
+ description: |-
2269
+ The DeclarativeOAuth Specific URL templated string to obtain the `access_token`, `refresh_token` etc.
2270
+ The placeholders are replaced during the processing to provide neccessary values.
2271
+ examples:
2272
+ - https://auth.host.com/oauth2/token?{client_id_key}={{client_id_key}}&{client_secret_key}={{client_secret_key}}&{auth_code_key}={{auth_code_key}}&{redirect_uri_key}={urlEncoder:{{redirect_uri_key}}}
2273
+ access_token_headers:
2274
+ title: Access Token Headers
2275
+ type: object
2276
+ additionalProperties: true
2277
+ description: |-
2278
+ The DeclarativeOAuth Specific optional headers to inject while exchanging the `auth_code` to `access_token` during `completeOAuthFlow` step.
2279
+ examples:
2280
+ - {
2281
+ "Authorization": "Basic {base64Encoder:{client_id}:{client_secret}}",
2282
+ }
2283
+ access_token_params:
2284
+ title: Access Token Query Params (Json Encoded)
2285
+ type: object
2286
+ additionalProperties: true
2287
+ description: |-
2288
+ The DeclarativeOAuth Specific optional query parameters to inject while exchanging the `auth_code` to `access_token` during `completeOAuthFlow` step.
2289
+ When this property is provided, the query params will be encoded as `Json` and included in the outgoing API request.
2290
+ examples:
2291
+ - {
2292
+ "{auth_code_key}": "{{auth_code_key}}",
2293
+ "{client_id_key}": "{{client_id_key}}",
2294
+ "{client_secret_key}": "{{client_secret_key}}",
2295
+ }
2296
+ extract_output:
2297
+ title: Extract Output
2298
+ type: array
2299
+ items:
2300
+ type: string
2301
+ description: |-
2302
+ The DeclarativeOAuth Specific list of strings to indicate which keys should be extracted and returned back to the input config.
2303
+ examples:
2304
+ - ["access_token", "refresh_token", "other_field"]
2305
+ state:
2306
+ title: Configurable State Query Param
2307
+ type: object
2308
+ additionalProperties: true
2309
+ required:
2310
+ - min
2311
+ - max
2312
+ description: |-
2313
+ The DeclarativeOAuth Specific object to provide the criteria of how the `state` query param should be constructed,
2314
+ including length and complexity.
2315
+ properties:
2316
+ min:
2317
+ type: integer
2318
+ max:
2319
+ type: integer
2320
+ examples:
2321
+ - { "min": 7, "max": 128 }
2322
+ client_id_key:
2323
+ title: Client ID Key Override
2324
+ type: string
2325
+ description: |-
2326
+ The DeclarativeOAuth Specific optional override to provide the custom `client_id` key name, if required by data-provider.
2327
+ examples:
2328
+ - "my_custom_client_id_key_name"
2329
+ client_secret_key:
2330
+ title: Client Secret Key Override
2331
+ type: string
2332
+ description: |-
2333
+ The DeclarativeOAuth Specific optional override to provide the custom `client_secret` key name, if required by data-provider.
2334
+ examples:
2335
+ - "my_custom_client_secret_key_name"
2336
+ scope_key:
2337
+ title: Scopes Key Override
2338
+ type: string
2339
+ description: |-
2340
+ The DeclarativeOAuth Specific optional override to provide the custom `scope` key name, if required by data-provider.
2341
+ examples:
2342
+ - "my_custom_scope_key_key_name"
2343
+ state_key:
2344
+ title: State Key Override
2345
+ type: string
2346
+ description: |-
2347
+ The DeclarativeOAuth Specific optional override to provide the custom `state` key name, if required by data-provider.
2348
+ examples:
2349
+ - "my_custom_state_key_key_name"
2350
+ auth_code_key:
2351
+ title: Auth Code Key Override
2352
+ type: string
2353
+ description: |-
2354
+ The DeclarativeOAuth Specific optional override to provide the custom `code` key name to something like `auth_code` or `custom_auth_code`, if required by data-provider.
2355
+ examples:
2356
+ - "my_custom_auth_code_key_name"
2357
+ redirect_uri_key:
2358
+ title: Redirect URI Key Override
2359
+ type: string
2360
+ description: |-
2361
+ The DeclarativeOAuth Specific optional override to provide the custom `redirect_uri` key name to something like `callback_uri`, if required by data-provider.
2362
+ examples:
2363
+ - "my_custom_redirect_uri_key_name"
1627
2364
  complete_oauth_output_specification:
1628
2365
  title: "OAuth output specification"
1629
2366
  description: |-
@@ -1801,6 +2538,25 @@ definitions:
1801
2538
  title: Request Option
1802
2539
  description: A request option describing where the parent key value should be injected into and under what field name if applicable.
1803
2540
  "$ref": "#/definitions/RequestOption"
2541
+ incremental_dependency:
2542
+ title: Incremental Dependency
2543
+ description: Indicates whether the parent stream should be read incrementally based on updates in the child stream.
2544
+ type: boolean
2545
+ default: false
2546
+ extra_fields:
2547
+ title: Extra Fields
2548
+ description: Array of field paths to include as additional fields in the stream slice. Each path is an array of strings representing keys to access fields in the respective parent record. Accessible via `stream_slice.extra_fields`. Missing fields are set to `None`.
2549
+ interpolation_context:
2550
+ - config
2551
+ type: array
2552
+ items:
2553
+ type: array
2554
+ items:
2555
+ type: string
2556
+ description: Defines a field path as an array of strings.
2557
+ examples:
2558
+ - ["field1"]
2559
+ - ["nested", "field2"]
1804
2560
  $parameters:
1805
2561
  type: object
1806
2562
  additionalProperties: true
@@ -1871,7 +2627,11 @@ definitions:
1871
2627
  - "$ref": "#/definitions/CustomRecordFilter"
1872
2628
  - "$ref": "#/definitions/RecordFilter"
1873
2629
  schema_normalization:
1874
- "$ref": "#/definitions/SchemaNormalization"
2630
+ title: Schema Normalization
2631
+ description: Responsible for normalization according to the schema.
2632
+ anyOf:
2633
+ - "$ref": "#/definitions/SchemaNormalization"
2634
+ - "$ref": "#/definitions/CustomSchemaNormalization"
1875
2635
  default: None
1876
2636
  $parameters:
1877
2637
  type: object
@@ -2072,6 +2832,205 @@ definitions:
2072
2832
  - "$ref": "#/definitions/CustomPartitionRouter"
2073
2833
  - "$ref": "#/definitions/ListPartitionRouter"
2074
2834
  - "$ref": "#/definitions/SubstreamPartitionRouter"
2835
+ decoder:
2836
+ title: Decoder
2837
+ description: Component decoding the response so records can be extracted.
2838
+ anyOf:
2839
+ - "$ref": "#/definitions/CustomDecoder"
2840
+ - "$ref": "#/definitions/JsonDecoder"
2841
+ - "$ref": "#/definitions/JsonlDecoder"
2842
+ - "$ref": "#/definitions/IterableDecoder"
2843
+ - "$ref": "#/definitions/XmlDecoder"
2844
+ - "$ref": "#/definitions/GzipJsonDecoder"
2845
+ - "$ref": "#/definitions/CompositeRawDecoder"
2846
+ $parameters:
2847
+ type: object
2848
+ additionalProperties: true
2849
+ CompositeRawDecoder:
2850
+ description: "(This is experimental, use at your own risk)"
2851
+ type: object
2852
+ required:
2853
+ - type
2854
+ - parser
2855
+ properties:
2856
+ type:
2857
+ type: string
2858
+ enum: [CompositeRawDecoder]
2859
+ parser:
2860
+ anyOf:
2861
+ - "$ref": "#/definitions/GzipParser"
2862
+ - "$ref": "#/definitions/JsonLineParser"
2863
+ - "$ref": "#/definitions/CsvParser"
2864
+ # PARSERS
2865
+ GzipParser:
2866
+ type: object
2867
+ required:
2868
+ - type
2869
+ - inner_parser
2870
+ properties:
2871
+ type:
2872
+ type: string
2873
+ enum: [GzipParser]
2874
+ inner_parser:
2875
+ anyOf:
2876
+ - "$ref": "#/definitions/JsonLineParser"
2877
+ - "$ref": "#/definitions/CsvParser"
2878
+ JsonLineParser:
2879
+ type: object
2880
+ required:
2881
+ - type
2882
+ properties:
2883
+ type:
2884
+ type: string
2885
+ enum: [JsonLineParser]
2886
+ encoding:
2887
+ type: string
2888
+ default: utf-8
2889
+ CsvParser:
2890
+ type: object
2891
+ required:
2892
+ - type
2893
+ properties:
2894
+ type:
2895
+ type: string
2896
+ enum: [CsvParser]
2897
+ encoding:
2898
+ type: string
2899
+ default: utf-8
2900
+ delimiter:
2901
+ type: string
2902
+ default: ","
2903
+ AsyncJobStatusMap:
2904
+ description: Matches the api job status to Async Job Status.
2905
+ type: object
2906
+ required:
2907
+ - running
2908
+ - completed
2909
+ - failed
2910
+ - timeout
2911
+ properties:
2912
+ type:
2913
+ type: string
2914
+ enum: [AsyncJobStatusMap]
2915
+ running:
2916
+ type: array
2917
+ items:
2918
+ type: string
2919
+ completed:
2920
+ type: array
2921
+ items:
2922
+ type: string
2923
+ failed:
2924
+ type: array
2925
+ items:
2926
+ type: string
2927
+ timeout:
2928
+ type: array
2929
+ items:
2930
+ type: string
2931
+ AsyncRetriever:
2932
+ description: "[Experimental - We expect the interface to change shortly and we reserve the right to not consider this a breaking change] Retrieves records by Asynchronously sending requests to fetch records. The retriever acts as an orchestrator between the requester, the record selector, the paginator, and the partition router."
2933
+ type: object
2934
+ required:
2935
+ - type
2936
+ - record_selector
2937
+ - status_mapping
2938
+ - creation_requester
2939
+ - polling_requester
2940
+ - download_requester
2941
+ - status_extractor
2942
+ - urls_extractor
2943
+ properties:
2944
+ type:
2945
+ type: string
2946
+ enum: [AsyncRetriever]
2947
+ record_selector:
2948
+ description: Component that describes how to extract records from a HTTP response.
2949
+ "$ref": "#/definitions/RecordSelector"
2950
+ status_mapping:
2951
+ description: Async Job Status to Airbyte CDK Async Job Status mapping.
2952
+ anyOf:
2953
+ - "$ref": "#/definitions/AsyncJobStatusMap"
2954
+ status_extractor:
2955
+ description: Responsible for fetching the actual status of the async job.
2956
+ anyOf:
2957
+ - "$ref": "#/definitions/CustomRecordExtractor"
2958
+ - "$ref": "#/definitions/DpathExtractor"
2959
+ urls_extractor:
2960
+ description: Responsible for fetching the final result `urls` provided by the completed / finished / ready async job.
2961
+ anyOf:
2962
+ - "$ref": "#/definitions/CustomRecordExtractor"
2963
+ - "$ref": "#/definitions/DpathExtractor"
2964
+ download_extractor:
2965
+ description: Responsible for fetching the records from provided urls.
2966
+ anyOf:
2967
+ - "$ref": "#/definitions/CustomRecordExtractor"
2968
+ - "$ref": "#/definitions/DpathExtractor"
2969
+ - "$ref": "#/definitions/ResponseToFileExtractor"
2970
+ creation_requester:
2971
+ description: Requester component that describes how to prepare HTTP requests to send to the source API to create the async server-side job.
2972
+ anyOf:
2973
+ - "$ref": "#/definitions/CustomRequester"
2974
+ - "$ref": "#/definitions/HttpRequester"
2975
+ polling_requester:
2976
+ description: Requester component that describes how to prepare HTTP requests to send to the source API to fetch the status of the running async job.
2977
+ anyOf:
2978
+ - "$ref": "#/definitions/CustomRequester"
2979
+ - "$ref": "#/definitions/HttpRequester"
2980
+ download_requester:
2981
+ description: Requester component that describes how to prepare HTTP requests to send to the source API to download the data provided by the completed async job.
2982
+ anyOf:
2983
+ - "$ref": "#/definitions/CustomRequester"
2984
+ - "$ref": "#/definitions/HttpRequester"
2985
+ download_paginator:
2986
+ description: Paginator component that describes how to navigate through the API's pages during download.
2987
+ anyOf:
2988
+ - "$ref": "#/definitions/DefaultPaginator"
2989
+ - "$ref": "#/definitions/NoPagination"
2990
+ abort_requester:
2991
+ description: Requester component that describes how to prepare HTTP requests to send to the source API to abort a job once it is timed out from the source's perspective.
2992
+ anyOf:
2993
+ - "$ref": "#/definitions/CustomRequester"
2994
+ - "$ref": "#/definitions/HttpRequester"
2995
+ delete_requester:
2996
+ description: Requester component that describes how to prepare HTTP requests to send to the source API to delete a job once the records are extracted.
2997
+ anyOf:
2998
+ - "$ref": "#/definitions/CustomRequester"
2999
+ - "$ref": "#/definitions/HttpRequester"
3000
+ partition_router:
3001
+ title: Partition Router
3002
+ description: PartitionRouter component that describes how to partition the stream, enabling incremental syncs and checkpointing.
3003
+ default: []
3004
+ anyOf:
3005
+ - "$ref": "#/definitions/CustomPartitionRouter"
3006
+ - "$ref": "#/definitions/ListPartitionRouter"
3007
+ - "$ref": "#/definitions/SubstreamPartitionRouter"
3008
+ - type: array
3009
+ items:
3010
+ anyOf:
3011
+ - "$ref": "#/definitions/CustomPartitionRouter"
3012
+ - "$ref": "#/definitions/ListPartitionRouter"
3013
+ - "$ref": "#/definitions/SubstreamPartitionRouter"
3014
+ decoder:
3015
+ title: Decoder
3016
+ description: Component decoding the response so records can be extracted.
3017
+ anyOf:
3018
+ - "$ref": "#/definitions/CustomDecoder"
3019
+ - "$ref": "#/definitions/JsonDecoder"
3020
+ - "$ref": "#/definitions/JsonlDecoder"
3021
+ - "$ref": "#/definitions/IterableDecoder"
3022
+ - "$ref": "#/definitions/XmlDecoder"
3023
+ - "$ref": "#/definitions/GzipJsonDecoder"
3024
+ download_decoder:
3025
+ title: Download Decoder
3026
+ description: Component decoding the download response so records can be extracted.
3027
+ anyOf:
3028
+ - "$ref": "#/definitions/CustomDecoder"
3029
+ - "$ref": "#/definitions/JsonDecoder"
3030
+ - "$ref": "#/definitions/JsonlDecoder"
3031
+ - "$ref": "#/definitions/IterableDecoder"
3032
+ - "$ref": "#/definitions/XmlDecoder"
3033
+ - "$ref": "#/definitions/GzipJsonDecoder"
2075
3034
  $parameters:
2076
3035
  type: object
2077
3036
  additionalProperties: true
@@ -2155,6 +3114,12 @@ definitions:
2155
3114
  type: string
2156
3115
  examples:
2157
3116
  - "([-+]?\\d+)"
3117
+ max_waiting_time_in_seconds:
3118
+ title: Max Waiting Time in Seconds
3119
+ description: Given the value extracted from the header is greater than this value, stop the stream.
3120
+ type: number
3121
+ examples:
3122
+ - 3600
2158
3123
  $parameters:
2159
3124
  type: object
2160
3125
  additionalProperties: true
@@ -2199,6 +3164,150 @@ definitions:
2199
3164
  $parameters:
2200
3165
  type: object
2201
3166
  additionalProperties: true
3167
+ ComponentMappingDefinition:
3168
+ title: Component Mapping Definition
3169
+ description: (This component is experimental. Use at your own risk.) Specifies a mapping definition to update or add fields in a record or configuration. This allows dynamic mapping of data by interpolating values into the template based on provided contexts.
3170
+ type: object
3171
+ required:
3172
+ - type
3173
+ - field_path
3174
+ - value
3175
+ properties:
3176
+ type:
3177
+ type: string
3178
+ enum: [ComponentMappingDefinition]
3179
+ field_path:
3180
+ title: Field Path
3181
+ description: A list of potentially nested fields indicating the full path where value will be added or updated.
3182
+ type: array
3183
+ items:
3184
+ - type: string
3185
+ interpolation_context:
3186
+ - config
3187
+ - components_values
3188
+ - stream_slice
3189
+ - stream_template_config
3190
+ examples:
3191
+ - ["data"]
3192
+ - ["data", "records"]
3193
+ - ["data", 1, "name"]
3194
+ - ["data", "{{ components_values.name }}"]
3195
+ - ["data", "*", "record"]
3196
+ - ["*", "**", "name"]
3197
+ value:
3198
+ title: Value
3199
+ description: The dynamic or static value to assign to the key. Interpolated values can be used to dynamically determine the value during runtime.
3200
+ type: string
3201
+ interpolation_context:
3202
+ - config
3203
+ - stream_template_config
3204
+ - components_values
3205
+ - stream_slice
3206
+ examples:
3207
+ - "{{ components_values['updates'] }}"
3208
+ - "{{ components_values['MetaData']['LastUpdatedTime'] }}"
3209
+ - "{{ config['segment_id'] }}"
3210
+ - "{{ stream_slice['parent_id'] }}"
3211
+ - "{{ stream_slice['extra_fields']['name'] }}"
3212
+ value_type:
3213
+ title: Value Type
3214
+ description: The expected data type of the value. If omitted, the type will be inferred from the value provided.
3215
+ "$ref": "#/definitions/ValueType"
3216
+ $parameters:
3217
+ type: object
3218
+ additionalProperties: true
3219
+ HttpComponentsResolver:
3220
+ type: object
3221
+ description: (This component is experimental. Use at your own risk.) Component resolve and populates stream templates with components fetched via an HTTP retriever.
3222
+ properties:
3223
+ type:
3224
+ type: string
3225
+ enum: [HttpComponentsResolver]
3226
+ retriever:
3227
+ title: Retriever
3228
+ description: Component used to coordinate how records are extracted across stream slices and request pages.
3229
+ anyOf:
3230
+ - "$ref": "#/definitions/AsyncRetriever"
3231
+ - "$ref": "#/definitions/CustomRetriever"
3232
+ - "$ref": "#/definitions/SimpleRetriever"
3233
+ components_mapping:
3234
+ type: array
3235
+ items:
3236
+ "$ref": "#/definitions/ComponentMappingDefinition"
3237
+ $parameters:
3238
+ type: object
3239
+ additionalProperties: true
3240
+ required:
3241
+ - type
3242
+ - retriever
3243
+ - components_mapping
3244
+ StreamConfig:
3245
+ title: Stream Config
3246
+ description: (This component is experimental. Use at your own risk.) Describes how to get streams config from the source config.
3247
+ type: object
3248
+ required:
3249
+ - type
3250
+ - configs_pointer
3251
+ properties:
3252
+ type:
3253
+ type: string
3254
+ enum: [StreamConfig]
3255
+ configs_pointer:
3256
+ title: Configs Pointer
3257
+ description: A list of potentially nested fields indicating the full path in source config file where streams configs located.
3258
+ type: array
3259
+ items:
3260
+ - type: string
3261
+ interpolation_context:
3262
+ - parameters
3263
+ examples:
3264
+ - ["data"]
3265
+ - ["data", "streams"]
3266
+ - ["data", "{{ parameters.name }}"]
3267
+ $parameters:
3268
+ type: object
3269
+ additionalProperties: true
3270
+ ConfigComponentsResolver:
3271
+ type: object
3272
+ description: (This component is experimental. Use at your own risk.) Resolves and populates stream templates with components fetched from the source config.
3273
+ properties:
3274
+ type:
3275
+ type: string
3276
+ enum: [ConfigComponentsResolver]
3277
+ stream_config:
3278
+ "$ref": "#/definitions/StreamConfig"
3279
+ components_mapping:
3280
+ type: array
3281
+ items:
3282
+ "$ref": "#/definitions/ComponentMappingDefinition"
3283
+ $parameters:
3284
+ type: object
3285
+ additionalProperties: true
3286
+ required:
3287
+ - type
3288
+ - stream_config
3289
+ - components_mapping
3290
+ DynamicDeclarativeStream:
3291
+ type: object
3292
+ description: (This component is experimental. Use at your own risk.) A component that described how will be created declarative streams based on stream template.
3293
+ properties:
3294
+ type:
3295
+ type: string
3296
+ enum: [DynamicDeclarativeStream]
3297
+ stream_template:
3298
+ title: Stream Template
3299
+ description: Reference to the stream template.
3300
+ "$ref": "#/definitions/DeclarativeStream"
3301
+ components_resolver:
3302
+ title: Components Resolver
3303
+ description: Component resolve and populates stream templates with components values.
3304
+ anyOf:
3305
+ - "$ref": "#/definitions/HttpComponentsResolver"
3306
+ - "$ref": "#/definitions/ConfigComponentsResolver"
3307
+ required:
3308
+ - type
3309
+ - stream_template
3310
+ - components_resolver
2202
3311
  interpolation:
2203
3312
  variables:
2204
3313
  - title: config
@@ -2228,20 +3337,20 @@ interpolation:
2228
3337
  x-ratelimit-limit: "600"
2229
3338
  x-ratelimit-remaining: "598"
2230
3339
  x-ratelimit-reset: "39"
2231
- - title: last_records
2232
- description: List of records extracted from the last response received from the API.
2233
- type: list
3340
+ - title: last_record
3341
+ description: Last record extracted from the response received from the API.
3342
+ type: object
3343
+ examples:
3344
+ - name: "Test List: 19"
3345
+ id: 0236d6d2
3346
+ contact_count: 20
3347
+ _metadata:
3348
+ self: https://api.sendgrid.com/v3/marketing/lists/0236d6d2
3349
+ - title: last_page_size
3350
+ description: Number of records extracted from the last response received from the API.
3351
+ type: object
2234
3352
  examples:
2235
- - - name: "Test List: 19"
2236
- id: 0236d6d2
2237
- contact_count: 20
2238
- _metadata:
2239
- self: https://api.sendgrid.com/v3/marketing/lists/0236d6d2
2240
- - name: List for CI tests, number 30
2241
- id: 041ee031
2242
- contact_count: 0
2243
- _metadata:
2244
- self: https://api.sendgrid.com/v3/marketing/lists/041ee031
3353
+ - 2
2245
3354
  - title: next_page_token
2246
3355
  description: Object describing the token to fetch the next page of records. The object has a single key "next_page_token".
2247
3356
  type: object
@@ -2289,21 +3398,21 @@ interpolation:
2289
3398
  - created_at: "2020-01-01 00:00:00.000+00:00"
2290
3399
  - updated_at: "2020-01-02 00:00:00.000+00:00"
2291
3400
  macros:
2292
- - title: Now (UTC)
3401
+ - title: now_utc
2293
3402
  description: Returns the current date and time in the UTC timezone.
2294
3403
  arguments: {}
2295
3404
  return_type: Datetime
2296
3405
  examples:
2297
3406
  - "'{{ now_utc() }}' -> '2021-09-01 00:00:00+00:00'"
2298
3407
  - "'{{ now_utc().strftime('%Y-%m-%d') }}' -> '2021-09-01'"
2299
- - title: Today (UTC)
3408
+ - title: today_utc
2300
3409
  description: Returns the current date in UTC timezone. The output is a date object.
2301
3410
  arguments: {}
2302
3411
  return_type: Date
2303
3412
  examples:
2304
3413
  - "'{{ today_utc() }}' -> '2021-09-01'"
2305
3414
  - "'{{ today_utc().strftime('%Y/%m/%d')}}' -> '2021/09/01'"
2306
- - title: Timestamp
3415
+ - title: timestamp
2307
3416
  description: Converts a number or a string representing a datetime (formatted as ISO8601) to a timestamp. If the input is a number, it is converted to an int. If no timezone is specified, the string is interpreted as UTC.
2308
3417
  arguments:
2309
3418
  datetime: A string formatted as ISO8601 or an integer representing a unix timestamp
@@ -2314,7 +3423,7 @@ interpolation:
2314
3423
  - "'{{ timestamp('2022-02-28T00:00:00Z') }}' -> 1646006400"
2315
3424
  - "'{{ timestamp('2022-02-28 00:00:00Z') }}' -> 1646006400"
2316
3425
  - "'{{ timestamp('2022-02-28T00:00:00-08:00') }}' -> 1646035200"
2317
- - title: Max
3426
+ - title: max
2318
3427
  description: Returns the largest object of a iterable, or or two or more arguments.
2319
3428
  arguments:
2320
3429
  args: iterable or a sequence of two or more arguments
@@ -2322,7 +3431,7 @@ interpolation:
2322
3431
  examples:
2323
3432
  - "'{{ max(2, 3) }}' -> 3"
2324
3433
  - "'{{ max([2, 3]) }}' -> 3"
2325
- - title: Day Delta
3434
+ - title: day_delta
2326
3435
  description: Returns the datetime of now() + num_days.
2327
3436
  arguments:
2328
3437
  num_days: The number of days to add to now
@@ -2332,8 +3441,8 @@ interpolation:
2332
3441
  - "'{{ day_delta(1) }}' -> '2021-09-02T00:00:00.000000+0000'"
2333
3442
  - "'{{ day_delta(-1) }}' -> '2021-08-31:00:00.000000+0000'"
2334
3443
  - "'{{ day_delta(25, format='%Y-%m-%d') }}' -> '2021-09-02'"
2335
- - title: Duration
2336
- description: Converts an ISO8601 duratioin to datetime.timedelta.
3444
+ - title: duration
3445
+ description: Converts an ISO8601 duration to datetime timedelta.
2337
3446
  arguments:
2338
3447
  duration_string: "A string representing an ISO8601 duration. See https://www.digi.com/resources/documentation/digidocs//90001488-13/reference/r_iso_8601_duration_format.htm for more details."
2339
3448
  return_type: datetime.timedelta
@@ -2341,17 +3450,19 @@ interpolation:
2341
3450
  - "'{{ duration('P1D') }}' -> '1 day, 0:00:00'"
2342
3451
  - "'{{ duration('P6DT23H') }}' -> '6 days, 23:00:00'"
2343
3452
  - "'{{ (now_utc() - duration('P1D')).strftime('%Y-%m-%dT%H:%M:%SZ') }}' -> '2021-08-31T00:00:00Z'"
2344
- - title: Format Datetime
3453
+ - title: format_datetime
2345
3454
  description: Converts a datetime or a datetime-string to the specified format.
2346
3455
  arguments:
2347
3456
  datetime: The datetime object or a string to convert. If datetime is a string, it must be formatted as ISO8601.
2348
- format: The datetime format
3457
+ format: The datetime format.
3458
+ input_format: (optional) The datetime format in the case it is an string.
2349
3459
  return_type: str
2350
3460
  examples:
2351
3461
  - "{{ format_datetime(config['start_time'], '%Y-%m-%d') }}"
2352
3462
  - "{{ format_datetime(config['start_date'], '%Y-%m-%dT%H:%M:%S.%fZ') }}"
3463
+ - "{{ format_datetime(config['start_date'], '%Y-%m-%dT%H:%M:%S.%fZ', '%a, %d %b %Y %H:%M:%S %z') }}"
2353
3464
  filters:
2354
- - title: Hash
3465
+ - title: hash
2355
3466
  description: Convert the specified value to a hashed string.
2356
3467
  arguments:
2357
3468
  hash_type: Valid hash type for converts ('md5' as default value).
@@ -2361,15 +3472,29 @@ interpolation:
2361
3472
  - "{{ 'Test client_secret' | hash() }} -> '3032d57a12f76b61a820e47b9a5a0cbb'"
2362
3473
  - "{{ 'Test client_secret' | hash('md5') }} -> '3032d57a12f76b61a820e47b9a5a0cbb'"
2363
3474
  - "{{ 'Test client_secret' | hash('md5', salt='salt') }} -> '5011a0168579c2d94cbbe1c6ad14327c'"
2364
- - title: Base64 encoder
3475
+ - title: base64encode
2365
3476
  description: Convert the specified value to a string in the base64 format.
2366
3477
  arguments: {}
2367
3478
  return_type: str
2368
3479
  examples:
2369
3480
  - "{{ 'Test client_secret' | base64encode }} -> 'VGVzdCBjbGllbnRfc2VjcmV0'"
2370
- - title: Base64 decoder
3481
+ - title: base64decode
2371
3482
  description: Decodes the specified base64 format value into a common string.
2372
3483
  arguments: {}
2373
3484
  return_type: str
2374
3485
  examples:
2375
3486
  - "{{ 'ZmFrZSByZWZyZXNoX3Rva2VuIHZhbHVl' | base64decode }} -> 'fake refresh_token value'"
3487
+ - title: string
3488
+ description: Converts the specified value to a string.
3489
+ arguments: {}
3490
+ return_type: str
3491
+ examples:
3492
+ - '{{ 1 | string }} -> "1"'
3493
+ - '{{ ["hello", "world" | string }} -> "["hello", "world"]"'
3494
+ - title: regex_search
3495
+ description: Match the input string against a regular expression and return the first match.
3496
+ arguments:
3497
+ regex: The regular expression to search for. It must include a capture group.
3498
+ return_type: str
3499
+ examples:
3500
+ - '{{ "goodbye, cruel world" | regex_search("goodbye,\s(.*)$") }} -> "cruel world"'