airbyte-cdk: 0.72.0 (py3-none-any.whl) → 6.13.1.dev4106 (py3-none-any.whl)

Sign up to get free protection for your applications and to get access to all the features.
Files changed (517)
  1. airbyte_cdk/__init__.py +355 -6
  2. airbyte_cdk/cli/__init__.py +1 -0
  3. airbyte_cdk/cli/source_declarative_manifest/__init__.py +5 -0
  4. airbyte_cdk/cli/source_declarative_manifest/_run.py +230 -0
  5. airbyte_cdk/cli/source_declarative_manifest/spec.json +17 -0
  6. airbyte_cdk/config_observation.py +29 -10
  7. airbyte_cdk/connector.py +24 -24
  8. airbyte_cdk/connector_builder/README.md +53 -0
  9. airbyte_cdk/connector_builder/connector_builder_handler.py +37 -11
  10. airbyte_cdk/connector_builder/main.py +45 -13
  11. airbyte_cdk/connector_builder/message_grouper.py +189 -50
  12. airbyte_cdk/connector_builder/models.py +3 -2
  13. airbyte_cdk/destinations/__init__.py +4 -3
  14. airbyte_cdk/destinations/destination.py +54 -20
  15. airbyte_cdk/destinations/vector_db_based/README.md +37 -0
  16. airbyte_cdk/destinations/vector_db_based/config.py +40 -17
  17. airbyte_cdk/destinations/vector_db_based/document_processor.py +56 -17
  18. airbyte_cdk/destinations/vector_db_based/embedder.py +57 -15
  19. airbyte_cdk/destinations/vector_db_based/test_utils.py +14 -4
  20. airbyte_cdk/destinations/vector_db_based/utils.py +8 -2
  21. airbyte_cdk/destinations/vector_db_based/writer.py +24 -5
  22. airbyte_cdk/entrypoint.py +153 -44
  23. airbyte_cdk/exception_handler.py +21 -3
  24. airbyte_cdk/logger.py +30 -44
  25. airbyte_cdk/models/__init__.py +13 -2
  26. airbyte_cdk/models/airbyte_protocol.py +86 -1
  27. airbyte_cdk/models/airbyte_protocol_serializers.py +44 -0
  28. airbyte_cdk/models/file_transfer_record_message.py +13 -0
  29. airbyte_cdk/models/well_known_types.py +1 -1
  30. airbyte_cdk/sources/__init__.py +5 -1
  31. airbyte_cdk/sources/abstract_source.py +125 -79
  32. airbyte_cdk/sources/concurrent_source/__init__.py +7 -2
  33. airbyte_cdk/sources/concurrent_source/concurrent_read_processor.py +102 -36
  34. airbyte_cdk/sources/concurrent_source/concurrent_source.py +29 -36
  35. airbyte_cdk/sources/concurrent_source/concurrent_source_adapter.py +94 -10
  36. airbyte_cdk/sources/concurrent_source/stream_thread_exception.py +25 -0
  37. airbyte_cdk/sources/concurrent_source/thread_pool_manager.py +20 -14
  38. airbyte_cdk/sources/config.py +3 -2
  39. airbyte_cdk/sources/connector_state_manager.py +49 -83
  40. airbyte_cdk/sources/declarative/async_job/job.py +52 -0
  41. airbyte_cdk/sources/declarative/async_job/job_orchestrator.py +497 -0
  42. airbyte_cdk/sources/declarative/async_job/job_tracker.py +75 -0
  43. airbyte_cdk/sources/declarative/async_job/repository.py +35 -0
  44. airbyte_cdk/sources/declarative/async_job/status.py +24 -0
  45. airbyte_cdk/sources/declarative/async_job/timer.py +39 -0
  46. airbyte_cdk/sources/declarative/auth/__init__.py +2 -3
  47. airbyte_cdk/sources/declarative/auth/declarative_authenticator.py +3 -1
  48. airbyte_cdk/sources/declarative/auth/jwt.py +191 -0
  49. airbyte_cdk/sources/declarative/auth/oauth.py +60 -20
  50. airbyte_cdk/sources/declarative/auth/selective_authenticator.py +10 -2
  51. airbyte_cdk/sources/declarative/auth/token.py +28 -10
  52. airbyte_cdk/sources/declarative/auth/token_provider.py +9 -8
  53. airbyte_cdk/sources/declarative/checks/check_stream.py +16 -8
  54. airbyte_cdk/sources/declarative/checks/connection_checker.py +4 -2
  55. airbyte_cdk/sources/declarative/concurrency_level/__init__.py +7 -0
  56. airbyte_cdk/sources/declarative/concurrency_level/concurrency_level.py +50 -0
  57. airbyte_cdk/sources/declarative/concurrent_declarative_source.py +421 -0
  58. airbyte_cdk/sources/declarative/datetime/datetime_parser.py +4 -0
  59. airbyte_cdk/sources/declarative/datetime/min_max_datetime.py +26 -6
  60. airbyte_cdk/sources/declarative/declarative_component_schema.yaml +1213 -88
  61. airbyte_cdk/sources/declarative/declarative_source.py +5 -2
  62. airbyte_cdk/sources/declarative/declarative_stream.py +95 -9
  63. airbyte_cdk/sources/declarative/decoders/__init__.py +23 -2
  64. airbyte_cdk/sources/declarative/decoders/composite_raw_decoder.py +97 -0
  65. airbyte_cdk/sources/declarative/decoders/decoder.py +11 -4
  66. airbyte_cdk/sources/declarative/decoders/json_decoder.py +92 -5
  67. airbyte_cdk/sources/declarative/decoders/noop_decoder.py +21 -0
  68. airbyte_cdk/sources/declarative/decoders/pagination_decoder_decorator.py +39 -0
  69. airbyte_cdk/sources/declarative/decoders/xml_decoder.py +98 -0
  70. airbyte_cdk/sources/declarative/extractors/__init__.py +12 -1
  71. airbyte_cdk/sources/declarative/extractors/dpath_extractor.py +29 -24
  72. airbyte_cdk/sources/declarative/extractors/http_selector.py +4 -5
  73. airbyte_cdk/sources/declarative/extractors/record_extractor.py +2 -3
  74. airbyte_cdk/sources/declarative/extractors/record_filter.py +65 -8
  75. airbyte_cdk/sources/declarative/extractors/record_selector.py +85 -26
  76. airbyte_cdk/sources/declarative/extractors/response_to_file_extractor.py +177 -0
  77. airbyte_cdk/sources/declarative/extractors/type_transformer.py +55 -0
  78. airbyte_cdk/sources/declarative/incremental/__init__.py +25 -3
  79. airbyte_cdk/sources/declarative/incremental/datetime_based_cursor.py +156 -48
  80. airbyte_cdk/sources/declarative/incremental/declarative_cursor.py +13 -0
  81. airbyte_cdk/sources/declarative/incremental/global_substream_cursor.py +350 -0
  82. airbyte_cdk/sources/declarative/incremental/per_partition_cursor.py +159 -74
  83. airbyte_cdk/sources/declarative/incremental/per_partition_with_global.py +200 -0
  84. airbyte_cdk/sources/declarative/incremental/resumable_full_refresh_cursor.py +122 -0
  85. airbyte_cdk/sources/declarative/interpolation/filters.py +27 -1
  86. airbyte_cdk/sources/declarative/interpolation/interpolated_boolean.py +23 -5
  87. airbyte_cdk/sources/declarative/interpolation/interpolated_mapping.py +12 -8
  88. airbyte_cdk/sources/declarative/interpolation/interpolated_nested_mapping.py +13 -6
  89. airbyte_cdk/sources/declarative/interpolation/interpolated_string.py +21 -6
  90. airbyte_cdk/sources/declarative/interpolation/interpolation.py +9 -3
  91. airbyte_cdk/sources/declarative/interpolation/jinja.py +72 -37
  92. airbyte_cdk/sources/declarative/interpolation/macros.py +72 -17
  93. airbyte_cdk/sources/declarative/manifest_declarative_source.py +193 -52
  94. airbyte_cdk/sources/declarative/migrations/legacy_to_per_partition_state_migration.py +98 -0
  95. airbyte_cdk/sources/declarative/migrations/state_migration.py +24 -0
  96. airbyte_cdk/sources/declarative/models/__init__.py +1 -1
  97. airbyte_cdk/sources/declarative/models/declarative_component_schema.py +1329 -595
  98. airbyte_cdk/sources/declarative/parsers/custom_exceptions.py +2 -2
  99. airbyte_cdk/sources/declarative/parsers/manifest_component_transformer.py +26 -4
  100. airbyte_cdk/sources/declarative/parsers/manifest_reference_resolver.py +26 -15
  101. airbyte_cdk/sources/declarative/parsers/model_to_component_factory.py +1699 -226
  102. airbyte_cdk/sources/declarative/partition_routers/__init__.py +24 -4
  103. airbyte_cdk/sources/declarative/partition_routers/async_job_partition_router.py +65 -0
  104. airbyte_cdk/sources/declarative/partition_routers/cartesian_product_stream_slicer.py +176 -0
  105. airbyte_cdk/sources/declarative/partition_routers/list_partition_router.py +39 -9
  106. airbyte_cdk/sources/declarative/partition_routers/partition_router.py +62 -0
  107. airbyte_cdk/sources/declarative/partition_routers/single_partition_router.py +15 -3
  108. airbyte_cdk/sources/declarative/partition_routers/substream_partition_router.py +222 -39
  109. airbyte_cdk/sources/declarative/requesters/error_handlers/__init__.py +19 -5
  110. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/__init__.py +3 -1
  111. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/constant_backoff_strategy.py +19 -7
  112. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/exponential_backoff_strategy.py +19 -7
  113. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/header_helper.py +4 -2
  114. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/wait_time_from_header_backoff_strategy.py +41 -9
  115. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/wait_until_time_from_header_backoff_strategy.py +29 -14
  116. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategy.py +5 -13
  117. airbyte_cdk/sources/declarative/requesters/error_handlers/composite_error_handler.py +32 -16
  118. airbyte_cdk/sources/declarative/requesters/error_handlers/default_error_handler.py +46 -56
  119. airbyte_cdk/sources/declarative/requesters/error_handlers/default_http_response_filter.py +40 -0
  120. airbyte_cdk/sources/declarative/requesters/error_handlers/error_handler.py +6 -32
  121. airbyte_cdk/sources/declarative/requesters/error_handlers/http_response_filter.py +119 -41
  122. airbyte_cdk/sources/declarative/requesters/http_job_repository.py +228 -0
  123. airbyte_cdk/sources/declarative/requesters/http_requester.py +98 -344
  124. airbyte_cdk/sources/declarative/requesters/paginators/__init__.py +14 -3
  125. airbyte_cdk/sources/declarative/requesters/paginators/default_paginator.py +105 -46
  126. airbyte_cdk/sources/declarative/requesters/paginators/no_pagination.py +14 -8
  127. airbyte_cdk/sources/declarative/requesters/paginators/paginator.py +19 -8
  128. airbyte_cdk/sources/declarative/requesters/paginators/strategies/__init__.py +9 -3
  129. airbyte_cdk/sources/declarative/requesters/paginators/strategies/cursor_pagination_strategy.py +53 -21
  130. airbyte_cdk/sources/declarative/requesters/paginators/strategies/offset_increment.py +42 -19
  131. airbyte_cdk/sources/declarative/requesters/paginators/strategies/page_increment.py +25 -12
  132. airbyte_cdk/sources/declarative/requesters/paginators/strategies/pagination_strategy.py +13 -10
  133. airbyte_cdk/sources/declarative/requesters/paginators/strategies/stop_condition.py +26 -13
  134. airbyte_cdk/sources/declarative/requesters/request_options/__init__.py +15 -2
  135. airbyte_cdk/sources/declarative/requesters/request_options/datetime_based_request_options_provider.py +91 -0
  136. airbyte_cdk/sources/declarative/requesters/request_options/default_request_options_provider.py +60 -0
  137. airbyte_cdk/sources/declarative/requesters/request_options/interpolated_nested_request_input_provider.py +31 -14
  138. airbyte_cdk/sources/declarative/requesters/request_options/interpolated_request_input_provider.py +27 -15
  139. airbyte_cdk/sources/declarative/requesters/request_options/interpolated_request_options_provider.py +63 -10
  140. airbyte_cdk/sources/declarative/requesters/request_options/request_options_provider.py +1 -1
  141. airbyte_cdk/sources/declarative/requesters/requester.py +9 -17
  142. airbyte_cdk/sources/declarative/resolvers/__init__.py +41 -0
  143. airbyte_cdk/sources/declarative/resolvers/components_resolver.py +55 -0
  144. airbyte_cdk/sources/declarative/resolvers/config_components_resolver.py +136 -0
  145. airbyte_cdk/sources/declarative/resolvers/http_components_resolver.py +112 -0
  146. airbyte_cdk/sources/declarative/retrievers/__init__.py +6 -2
  147. airbyte_cdk/sources/declarative/retrievers/async_retriever.py +100 -0
  148. airbyte_cdk/sources/declarative/retrievers/retriever.py +1 -3
  149. airbyte_cdk/sources/declarative/retrievers/simple_retriever.py +228 -72
  150. airbyte_cdk/sources/declarative/schema/__init__.py +14 -1
  151. airbyte_cdk/sources/declarative/schema/default_schema_loader.py +5 -3
  152. airbyte_cdk/sources/declarative/schema/dynamic_schema_loader.py +236 -0
  153. airbyte_cdk/sources/declarative/schema/json_file_schema_loader.py +8 -8
  154. airbyte_cdk/sources/declarative/spec/spec.py +12 -5
  155. airbyte_cdk/sources/declarative/stream_slicers/__init__.py +1 -2
  156. airbyte_cdk/sources/declarative/stream_slicers/declarative_partition_generator.py +88 -0
  157. airbyte_cdk/sources/declarative/stream_slicers/stream_slicer.py +9 -14
  158. airbyte_cdk/sources/declarative/transformations/add_fields.py +19 -11
  159. airbyte_cdk/sources/declarative/transformations/flatten_fields.py +52 -0
  160. airbyte_cdk/sources/declarative/transformations/keys_replace_transformation.py +61 -0
  161. airbyte_cdk/sources/declarative/transformations/keys_to_lower_transformation.py +22 -0
  162. airbyte_cdk/sources/declarative/transformations/keys_to_snake_transformation.py +68 -0
  163. airbyte_cdk/sources/declarative/transformations/remove_fields.py +13 -10
  164. airbyte_cdk/sources/declarative/transformations/transformation.py +5 -5
  165. airbyte_cdk/sources/declarative/types.py +19 -110
  166. airbyte_cdk/sources/declarative/yaml_declarative_source.py +31 -10
  167. airbyte_cdk/sources/embedded/base_integration.py +16 -5
  168. airbyte_cdk/sources/embedded/catalog.py +16 -4
  169. airbyte_cdk/sources/embedded/runner.py +19 -3
  170. airbyte_cdk/sources/embedded/tools.py +5 -2
  171. airbyte_cdk/sources/file_based/README.md +152 -0
  172. airbyte_cdk/sources/file_based/__init__.py +24 -0
  173. airbyte_cdk/sources/file_based/availability_strategy/__init__.py +9 -2
  174. airbyte_cdk/sources/file_based/availability_strategy/abstract_file_based_availability_strategy.py +22 -6
  175. airbyte_cdk/sources/file_based/availability_strategy/default_file_based_availability_strategy.py +46 -10
  176. airbyte_cdk/sources/file_based/config/abstract_file_based_spec.py +58 -10
  177. airbyte_cdk/sources/file_based/config/avro_format.py +2 -1
  178. airbyte_cdk/sources/file_based/config/csv_format.py +29 -10
  179. airbyte_cdk/sources/file_based/config/excel_format.py +18 -0
  180. airbyte_cdk/sources/file_based/config/file_based_stream_config.py +16 -4
  181. airbyte_cdk/sources/file_based/config/jsonl_format.py +2 -1
  182. airbyte_cdk/sources/file_based/config/parquet_format.py +2 -1
  183. airbyte_cdk/sources/file_based/config/unstructured_format.py +13 -5
  184. airbyte_cdk/sources/file_based/discovery_policy/__init__.py +6 -2
  185. airbyte_cdk/sources/file_based/discovery_policy/abstract_discovery_policy.py +2 -4
  186. airbyte_cdk/sources/file_based/discovery_policy/default_discovery_policy.py +7 -2
  187. airbyte_cdk/sources/file_based/exceptions.py +52 -15
  188. airbyte_cdk/sources/file_based/file_based_source.py +163 -33
  189. airbyte_cdk/sources/file_based/file_based_stream_reader.py +83 -5
  190. airbyte_cdk/sources/file_based/file_types/__init__.py +14 -1
  191. airbyte_cdk/sources/file_based/file_types/avro_parser.py +75 -24
  192. airbyte_cdk/sources/file_based/file_types/csv_parser.py +116 -34
  193. airbyte_cdk/sources/file_based/file_types/excel_parser.py +196 -0
  194. airbyte_cdk/sources/file_based/file_types/file_transfer.py +37 -0
  195. airbyte_cdk/sources/file_based/file_types/file_type_parser.py +4 -1
  196. airbyte_cdk/sources/file_based/file_types/jsonl_parser.py +24 -8
  197. airbyte_cdk/sources/file_based/file_types/parquet_parser.py +60 -18
  198. airbyte_cdk/sources/file_based/file_types/unstructured_parser.py +145 -41
  199. airbyte_cdk/sources/file_based/remote_file.py +1 -1
  200. airbyte_cdk/sources/file_based/schema_helpers.py +38 -10
  201. airbyte_cdk/sources/file_based/schema_validation_policies/__init__.py +3 -1
  202. airbyte_cdk/sources/file_based/schema_validation_policies/abstract_schema_validation_policy.py +3 -1
  203. airbyte_cdk/sources/file_based/schema_validation_policies/default_schema_validation_policies.py +16 -5
  204. airbyte_cdk/sources/file_based/stream/abstract_file_based_stream.py +50 -13
  205. airbyte_cdk/sources/file_based/stream/concurrent/adapters.py +67 -27
  206. airbyte_cdk/sources/file_based/stream/concurrent/cursor/__init__.py +5 -1
  207. airbyte_cdk/sources/file_based/stream/concurrent/cursor/abstract_concurrent_file_based_cursor.py +14 -23
  208. airbyte_cdk/sources/file_based/stream/concurrent/cursor/file_based_concurrent_cursor.py +54 -18
  209. airbyte_cdk/sources/file_based/stream/concurrent/cursor/file_based_final_state_cursor.py +21 -9
  210. airbyte_cdk/sources/file_based/stream/cursor/abstract_file_based_cursor.py +3 -1
  211. airbyte_cdk/sources/file_based/stream/cursor/default_file_based_cursor.py +27 -10
  212. airbyte_cdk/sources/file_based/stream/default_file_based_stream.py +175 -45
  213. airbyte_cdk/sources/http_logger.py +8 -3
  214. airbyte_cdk/sources/message/__init__.py +7 -1
  215. airbyte_cdk/sources/message/repository.py +18 -4
  216. airbyte_cdk/sources/source.py +42 -38
  217. airbyte_cdk/sources/streams/__init__.py +2 -2
  218. airbyte_cdk/sources/streams/availability_strategy.py +54 -3
  219. airbyte_cdk/sources/streams/call_rate.py +64 -21
  220. airbyte_cdk/sources/streams/checkpoint/__init__.py +26 -0
  221. airbyte_cdk/sources/streams/checkpoint/checkpoint_reader.py +335 -0
  222. airbyte_cdk/sources/{declarative/incremental → streams/checkpoint}/cursor.py +17 -14
  223. airbyte_cdk/sources/streams/checkpoint/per_partition_key_serializer.py +22 -0
  224. airbyte_cdk/sources/streams/checkpoint/resumable_full_refresh_cursor.py +51 -0
  225. airbyte_cdk/sources/streams/checkpoint/substream_resumable_full_refresh_cursor.py +110 -0
  226. airbyte_cdk/sources/streams/concurrent/README.md +7 -0
  227. airbyte_cdk/sources/streams/concurrent/abstract_stream.py +7 -2
  228. airbyte_cdk/sources/streams/concurrent/adapters.py +84 -75
  229. airbyte_cdk/sources/streams/concurrent/availability_strategy.py +30 -2
  230. airbyte_cdk/sources/streams/concurrent/cursor.py +298 -42
  231. airbyte_cdk/sources/streams/concurrent/default_stream.py +12 -3
  232. airbyte_cdk/sources/streams/concurrent/exceptions.py +3 -0
  233. airbyte_cdk/sources/streams/concurrent/helpers.py +14 -3
  234. airbyte_cdk/sources/streams/concurrent/partition_enqueuer.py +12 -3
  235. airbyte_cdk/sources/streams/concurrent/partition_reader.py +10 -3
  236. airbyte_cdk/sources/streams/concurrent/partitions/partition.py +1 -16
  237. airbyte_cdk/sources/streams/concurrent/partitions/stream_slicer.py +21 -0
  238. airbyte_cdk/sources/streams/concurrent/partitions/types.py +15 -5
  239. airbyte_cdk/sources/streams/concurrent/state_converters/abstract_stream_state_converter.py +109 -17
  240. airbyte_cdk/sources/streams/concurrent/state_converters/datetime_stream_state_converter.py +90 -72
  241. airbyte_cdk/sources/streams/core.py +412 -87
  242. airbyte_cdk/sources/streams/http/__init__.py +2 -1
  243. airbyte_cdk/sources/streams/http/availability_strategy.py +12 -101
  244. airbyte_cdk/sources/streams/http/error_handlers/__init__.py +22 -0
  245. airbyte_cdk/sources/streams/http/error_handlers/backoff_strategy.py +28 -0
  246. airbyte_cdk/sources/streams/http/error_handlers/default_backoff_strategy.py +17 -0
  247. airbyte_cdk/sources/streams/http/error_handlers/default_error_mapping.py +86 -0
  248. airbyte_cdk/sources/streams/http/error_handlers/error_handler.py +42 -0
  249. airbyte_cdk/sources/streams/http/error_handlers/error_message_parser.py +19 -0
  250. airbyte_cdk/sources/streams/http/error_handlers/http_status_error_handler.py +110 -0
  251. airbyte_cdk/sources/streams/http/error_handlers/json_error_message_parser.py +52 -0
  252. airbyte_cdk/sources/streams/http/error_handlers/response_models.py +65 -0
  253. airbyte_cdk/sources/streams/http/exceptions.py +27 -7
  254. airbyte_cdk/sources/streams/http/http.py +369 -246
  255. airbyte_cdk/sources/streams/http/http_client.py +531 -0
  256. airbyte_cdk/sources/streams/http/rate_limiting.py +76 -12
  257. airbyte_cdk/sources/streams/http/requests_native_auth/abstract_oauth.py +28 -9
  258. airbyte_cdk/sources/streams/http/requests_native_auth/abstract_token.py +2 -1
  259. airbyte_cdk/sources/streams/http/requests_native_auth/oauth.py +90 -35
  260. airbyte_cdk/sources/streams/http/requests_native_auth/token.py +13 -3
  261. airbyte_cdk/sources/types.py +154 -0
  262. airbyte_cdk/sources/utils/record_helper.py +36 -21
  263. airbyte_cdk/sources/utils/schema_helpers.py +13 -6
  264. airbyte_cdk/sources/utils/slice_logger.py +4 -1
  265. airbyte_cdk/sources/utils/transform.py +54 -20
  266. airbyte_cdk/sql/_util/hashing.py +34 -0
  267. airbyte_cdk/sql/_util/name_normalizers.py +92 -0
  268. airbyte_cdk/sql/constants.py +32 -0
  269. airbyte_cdk/sql/exceptions.py +235 -0
  270. airbyte_cdk/sql/secrets.py +123 -0
  271. airbyte_cdk/sql/shared/__init__.py +15 -0
  272. airbyte_cdk/sql/shared/catalog_providers.py +145 -0
  273. airbyte_cdk/sql/shared/sql_processor.py +786 -0
  274. airbyte_cdk/sql/types.py +160 -0
  275. airbyte_cdk/test/catalog_builder.py +70 -18
  276. airbyte_cdk/test/entrypoint_wrapper.py +117 -42
  277. airbyte_cdk/test/mock_http/__init__.py +1 -1
  278. airbyte_cdk/test/mock_http/matcher.py +6 -0
  279. airbyte_cdk/test/mock_http/mocker.py +57 -10
  280. airbyte_cdk/test/mock_http/request.py +19 -3
  281. airbyte_cdk/test/mock_http/response.py +3 -1
  282. airbyte_cdk/test/mock_http/response_builder.py +32 -16
  283. airbyte_cdk/test/state_builder.py +18 -10
  284. airbyte_cdk/test/utils/__init__.py +1 -0
  285. airbyte_cdk/test/utils/data.py +24 -0
  286. airbyte_cdk/test/utils/http_mocking.py +16 -0
  287. airbyte_cdk/test/utils/manifest_only_fixtures.py +60 -0
  288. airbyte_cdk/test/utils/reading.py +26 -0
  289. airbyte_cdk/utils/__init__.py +2 -1
  290. airbyte_cdk/utils/airbyte_secrets_utils.py +5 -3
  291. airbyte_cdk/utils/analytics_message.py +10 -2
  292. airbyte_cdk/utils/datetime_format_inferrer.py +4 -1
  293. airbyte_cdk/utils/event_timing.py +10 -10
  294. airbyte_cdk/utils/mapping_helpers.py +3 -1
  295. airbyte_cdk/utils/message_utils.py +20 -11
  296. airbyte_cdk/utils/print_buffer.py +75 -0
  297. airbyte_cdk/utils/schema_inferrer.py +198 -28
  298. airbyte_cdk/utils/slice_hasher.py +30 -0
  299. airbyte_cdk/utils/spec_schema_transformations.py +6 -3
  300. airbyte_cdk/utils/stream_status_utils.py +8 -1
  301. airbyte_cdk/utils/traced_exception.py +61 -21
  302. airbyte_cdk-6.13.1.dev4106.dist-info/METADATA +109 -0
  303. airbyte_cdk-6.13.1.dev4106.dist-info/RECORD +349 -0
  304. {airbyte_cdk-0.72.0.dist-info → airbyte_cdk-6.13.1.dev4106.dist-info}/WHEEL +1 -2
  305. airbyte_cdk-6.13.1.dev4106.dist-info/entry_points.txt +3 -0
  306. airbyte_cdk/sources/declarative/create_partial.py +0 -92
  307. airbyte_cdk/sources/declarative/parsers/class_types_registry.py +0 -102
  308. airbyte_cdk/sources/declarative/parsers/default_implementation_registry.py +0 -64
  309. airbyte_cdk/sources/declarative/requesters/error_handlers/response_action.py +0 -16
  310. airbyte_cdk/sources/declarative/requesters/error_handlers/response_status.py +0 -68
  311. airbyte_cdk/sources/declarative/stream_slicers/cartesian_product_stream_slicer.py +0 -114
  312. airbyte_cdk/sources/deprecated/base_source.py +0 -94
  313. airbyte_cdk/sources/deprecated/client.py +0 -99
  314. airbyte_cdk/sources/singer/__init__.py +0 -8
  315. airbyte_cdk/sources/singer/singer_helpers.py +0 -304
  316. airbyte_cdk/sources/singer/source.py +0 -186
  317. airbyte_cdk/sources/streams/concurrent/partitions/record.py +0 -23
  318. airbyte_cdk/sources/streams/http/auth/__init__.py +0 -17
  319. airbyte_cdk/sources/streams/http/auth/core.py +0 -29
  320. airbyte_cdk/sources/streams/http/auth/oauth.py +0 -113
  321. airbyte_cdk/sources/streams/http/auth/token.py +0 -47
  322. airbyte_cdk/sources/streams/utils/stream_helper.py +0 -40
  323. airbyte_cdk/sources/utils/catalog_helpers.py +0 -22
  324. airbyte_cdk/sources/utils/schema_models.py +0 -84
  325. airbyte_cdk-0.72.0.dist-info/METADATA +0 -243
  326. airbyte_cdk-0.72.0.dist-info/RECORD +0 -466
  327. airbyte_cdk-0.72.0.dist-info/top_level.txt +0 -3
  328. source_declarative_manifest/main.py +0 -29
  329. unit_tests/connector_builder/__init__.py +0 -3
  330. unit_tests/connector_builder/test_connector_builder_handler.py +0 -871
  331. unit_tests/connector_builder/test_message_grouper.py +0 -713
  332. unit_tests/connector_builder/utils.py +0 -27
  333. unit_tests/destinations/test_destination.py +0 -243
  334. unit_tests/singer/test_singer_helpers.py +0 -56
  335. unit_tests/singer/test_singer_source.py +0 -112
  336. unit_tests/sources/__init__.py +0 -0
  337. unit_tests/sources/concurrent_source/__init__.py +0 -3
  338. unit_tests/sources/concurrent_source/test_concurrent_source_adapter.py +0 -106
  339. unit_tests/sources/declarative/__init__.py +0 -3
  340. unit_tests/sources/declarative/auth/__init__.py +0 -3
  341. unit_tests/sources/declarative/auth/test_oauth.py +0 -331
  342. unit_tests/sources/declarative/auth/test_selective_authenticator.py +0 -39
  343. unit_tests/sources/declarative/auth/test_session_token_auth.py +0 -182
  344. unit_tests/sources/declarative/auth/test_token_auth.py +0 -200
  345. unit_tests/sources/declarative/auth/test_token_provider.py +0 -73
  346. unit_tests/sources/declarative/checks/__init__.py +0 -3
  347. unit_tests/sources/declarative/checks/test_check_stream.py +0 -146
  348. unit_tests/sources/declarative/decoders/__init__.py +0 -0
  349. unit_tests/sources/declarative/decoders/test_json_decoder.py +0 -16
  350. unit_tests/sources/declarative/external_component.py +0 -13
  351. unit_tests/sources/declarative/extractors/__init__.py +0 -3
  352. unit_tests/sources/declarative/extractors/test_dpath_extractor.py +0 -55
  353. unit_tests/sources/declarative/extractors/test_record_filter.py +0 -55
  354. unit_tests/sources/declarative/extractors/test_record_selector.py +0 -179
  355. unit_tests/sources/declarative/incremental/__init__.py +0 -0
  356. unit_tests/sources/declarative/incremental/test_datetime_based_cursor.py +0 -860
  357. unit_tests/sources/declarative/incremental/test_per_partition_cursor.py +0 -406
  358. unit_tests/sources/declarative/incremental/test_per_partition_cursor_integration.py +0 -332
  359. unit_tests/sources/declarative/interpolation/__init__.py +0 -3
  360. unit_tests/sources/declarative/interpolation/test_filters.py +0 -80
  361. unit_tests/sources/declarative/interpolation/test_interpolated_boolean.py +0 -40
  362. unit_tests/sources/declarative/interpolation/test_interpolated_mapping.py +0 -35
  363. unit_tests/sources/declarative/interpolation/test_interpolated_nested_mapping.py +0 -45
  364. unit_tests/sources/declarative/interpolation/test_interpolated_string.py +0 -25
  365. unit_tests/sources/declarative/interpolation/test_jinja.py +0 -240
  366. unit_tests/sources/declarative/interpolation/test_macros.py +0 -73
  367. unit_tests/sources/declarative/parsers/__init__.py +0 -3
  368. unit_tests/sources/declarative/parsers/test_manifest_component_transformer.py +0 -406
  369. unit_tests/sources/declarative/parsers/test_manifest_reference_resolver.py +0 -139
  370. unit_tests/sources/declarative/parsers/test_model_to_component_factory.py +0 -1841
  371. unit_tests/sources/declarative/parsers/testing_components.py +0 -36
  372. unit_tests/sources/declarative/partition_routers/__init__.py +0 -3
  373. unit_tests/sources/declarative/partition_routers/test_list_partition_router.py +0 -155
  374. unit_tests/sources/declarative/partition_routers/test_single_partition_router.py +0 -14
  375. unit_tests/sources/declarative/partition_routers/test_substream_partition_router.py +0 -404
  376. unit_tests/sources/declarative/requesters/__init__.py +0 -3
  377. unit_tests/sources/declarative/requesters/error_handlers/__init__.py +0 -3
  378. unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/__init__.py +0 -3
  379. unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/test_constant_backoff.py +0 -34
  380. unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/test_exponential_backoff.py +0 -36
  381. unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/test_header_helper.py +0 -38
  382. unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/test_wait_time_from_header.py +0 -35
  383. unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/test_wait_until_time_from_header.py +0 -64
  384. unit_tests/sources/declarative/requesters/error_handlers/test_composite_error_handler.py +0 -213
  385. unit_tests/sources/declarative/requesters/error_handlers/test_default_error_handler.py +0 -178
  386. unit_tests/sources/declarative/requesters/error_handlers/test_http_response_filter.py +0 -121
  387. unit_tests/sources/declarative/requesters/error_handlers/test_response_status.py +0 -44
  388. unit_tests/sources/declarative/requesters/paginators/__init__.py +0 -3
  389. unit_tests/sources/declarative/requesters/paginators/test_cursor_pagination_strategy.py +0 -64
  390. unit_tests/sources/declarative/requesters/paginators/test_default_paginator.py +0 -313
  391. unit_tests/sources/declarative/requesters/paginators/test_no_paginator.py +0 -12
  392. unit_tests/sources/declarative/requesters/paginators/test_offset_increment.py +0 -58
  393. unit_tests/sources/declarative/requesters/paginators/test_page_increment.py +0 -70
  394. unit_tests/sources/declarative/requesters/paginators/test_request_option.py +0 -43
  395. unit_tests/sources/declarative/requesters/paginators/test_stop_condition.py +0 -105
  396. unit_tests/sources/declarative/requesters/request_options/__init__.py +0 -3
  397. unit_tests/sources/declarative/requesters/request_options/test_interpolated_request_options_provider.py +0 -101
  398. unit_tests/sources/declarative/requesters/test_http_requester.py +0 -974
  399. unit_tests/sources/declarative/requesters/test_interpolated_request_input_provider.py +0 -32
  400. unit_tests/sources/declarative/retrievers/__init__.py +0 -3
  401. unit_tests/sources/declarative/retrievers/test_simple_retriever.py +0 -542
  402. unit_tests/sources/declarative/schema/__init__.py +0 -6
  403. unit_tests/sources/declarative/schema/source_test/SourceTest.py +0 -8
  404. unit_tests/sources/declarative/schema/source_test/__init__.py +0 -3
  405. unit_tests/sources/declarative/schema/test_default_schema_loader.py +0 -32
  406. unit_tests/sources/declarative/schema/test_inline_schema_loader.py +0 -19
  407. unit_tests/sources/declarative/schema/test_json_file_schema_loader.py +0 -26
  408. unit_tests/sources/declarative/states/__init__.py +0 -3
  409. unit_tests/sources/declarative/stream_slicers/__init__.py +0 -3
  410. unit_tests/sources/declarative/stream_slicers/test_cartesian_product_stream_slicer.py +0 -225
  411. unit_tests/sources/declarative/test_create_partial.py +0 -83
  412. unit_tests/sources/declarative/test_declarative_stream.py +0 -103
  413. unit_tests/sources/declarative/test_manifest_declarative_source.py +0 -1260
  414. unit_tests/sources/declarative/test_types.py +0 -39
  415. unit_tests/sources/declarative/test_yaml_declarative_source.py +0 -148
  416. unit_tests/sources/file_based/__init__.py +0 -0
  417. unit_tests/sources/file_based/availability_strategy/__init__.py +0 -0
  418. unit_tests/sources/file_based/availability_strategy/test_default_file_based_availability_strategy.py +0 -100
  419. unit_tests/sources/file_based/config/__init__.py +0 -0
  420. unit_tests/sources/file_based/config/test_abstract_file_based_spec.py +0 -28
  421. unit_tests/sources/file_based/config/test_csv_format.py +0 -34
  422. unit_tests/sources/file_based/config/test_file_based_stream_config.py +0 -84
  423. unit_tests/sources/file_based/discovery_policy/__init__.py +0 -0
  424. unit_tests/sources/file_based/discovery_policy/test_default_discovery_policy.py +0 -31
  425. unit_tests/sources/file_based/file_types/__init__.py +0 -0
  426. unit_tests/sources/file_based/file_types/test_avro_parser.py +0 -243
  427. unit_tests/sources/file_based/file_types/test_csv_parser.py +0 -546
  428. unit_tests/sources/file_based/file_types/test_jsonl_parser.py +0 -158
  429. unit_tests/sources/file_based/file_types/test_parquet_parser.py +0 -274
  430. unit_tests/sources/file_based/file_types/test_unstructured_parser.py +0 -593
  431. unit_tests/sources/file_based/helpers.py +0 -70
  432. unit_tests/sources/file_based/in_memory_files_source.py +0 -211
  433. unit_tests/sources/file_based/scenarios/__init__.py +0 -0
  434. unit_tests/sources/file_based/scenarios/avro_scenarios.py +0 -744
  435. unit_tests/sources/file_based/scenarios/check_scenarios.py +0 -220
  436. unit_tests/sources/file_based/scenarios/concurrent_incremental_scenarios.py +0 -2844
  437. unit_tests/sources/file_based/scenarios/csv_scenarios.py +0 -3105
  438. unit_tests/sources/file_based/scenarios/file_based_source_builder.py +0 -91
  439. unit_tests/sources/file_based/scenarios/incremental_scenarios.py +0 -1926
  440. unit_tests/sources/file_based/scenarios/jsonl_scenarios.py +0 -930
  441. unit_tests/sources/file_based/scenarios/parquet_scenarios.py +0 -754
  442. unit_tests/sources/file_based/scenarios/scenario_builder.py +0 -234
  443. unit_tests/sources/file_based/scenarios/unstructured_scenarios.py +0 -608
  444. unit_tests/sources/file_based/scenarios/user_input_schema_scenarios.py +0 -746
  445. unit_tests/sources/file_based/scenarios/validation_policy_scenarios.py +0 -726
  446. unit_tests/sources/file_based/stream/__init__.py +0 -0
  447. unit_tests/sources/file_based/stream/concurrent/__init__.py +0 -0
  448. unit_tests/sources/file_based/stream/concurrent/test_adapters.py +0 -362
  449. unit_tests/sources/file_based/stream/concurrent/test_file_based_concurrent_cursor.py +0 -458
  450. unit_tests/sources/file_based/stream/test_default_file_based_cursor.py +0 -310
  451. unit_tests/sources/file_based/stream/test_default_file_based_stream.py +0 -244
  452. unit_tests/sources/file_based/test_file_based_scenarios.py +0 -320
  453. unit_tests/sources/file_based/test_file_based_stream_reader.py +0 -272
  454. unit_tests/sources/file_based/test_scenarios.py +0 -253
  455. unit_tests/sources/file_based/test_schema_helpers.py +0 -346
  456. unit_tests/sources/fixtures/__init__.py +0 -3
  457. unit_tests/sources/fixtures/source_test_fixture.py +0 -153
  458. unit_tests/sources/message/__init__.py +0 -0
  459. unit_tests/sources/message/test_repository.py +0 -153
  460. unit_tests/sources/streams/__init__.py +0 -0
  461. unit_tests/sources/streams/concurrent/__init__.py +0 -3
  462. unit_tests/sources/streams/concurrent/scenarios/__init__.py +0 -3
  463. unit_tests/sources/streams/concurrent/scenarios/incremental_scenarios.py +0 -250
  464. unit_tests/sources/streams/concurrent/scenarios/stream_facade_builder.py +0 -140
  465. unit_tests/sources/streams/concurrent/scenarios/stream_facade_scenarios.py +0 -452
  466. unit_tests/sources/streams/concurrent/scenarios/test_concurrent_scenarios.py +0 -76
  467. unit_tests/sources/streams/concurrent/scenarios/thread_based_concurrent_stream_scenarios.py +0 -418
  468. unit_tests/sources/streams/concurrent/scenarios/thread_based_concurrent_stream_source_builder.py +0 -142
  469. unit_tests/sources/streams/concurrent/scenarios/utils.py +0 -55
  470. unit_tests/sources/streams/concurrent/test_adapters.py +0 -380
  471. unit_tests/sources/streams/concurrent/test_concurrent_read_processor.py +0 -684
  472. unit_tests/sources/streams/concurrent/test_cursor.py +0 -139
  473. unit_tests/sources/streams/concurrent/test_datetime_state_converter.py +0 -369
  474. unit_tests/sources/streams/concurrent/test_default_stream.py +0 -197
  475. unit_tests/sources/streams/concurrent/test_partition_enqueuer.py +0 -90
  476. unit_tests/sources/streams/concurrent/test_partition_reader.py +0 -67
  477. unit_tests/sources/streams/concurrent/test_thread_pool_manager.py +0 -106
  478. unit_tests/sources/streams/http/__init__.py +0 -0
  479. unit_tests/sources/streams/http/auth/__init__.py +0 -0
  480. unit_tests/sources/streams/http/auth/test_auth.py +0 -173
  481. unit_tests/sources/streams/http/requests_native_auth/__init__.py +0 -0
  482. unit_tests/sources/streams/http/requests_native_auth/test_requests_native_auth.py +0 -423
  483. unit_tests/sources/streams/http/test_availability_strategy.py +0 -180
  484. unit_tests/sources/streams/http/test_http.py +0 -635
  485. unit_tests/sources/streams/test_availability_strategy.py +0 -70
  486. unit_tests/sources/streams/test_call_rate.py +0 -300
  487. unit_tests/sources/streams/test_stream_read.py +0 -405
  488. unit_tests/sources/streams/test_streams_core.py +0 -184
  489. unit_tests/sources/test_abstract_source.py +0 -1442
  490. unit_tests/sources/test_concurrent_source.py +0 -112
  491. unit_tests/sources/test_config.py +0 -92
  492. unit_tests/sources/test_connector_state_manager.py +0 -482
  493. unit_tests/sources/test_http_logger.py +0 -252
  494. unit_tests/sources/test_integration_source.py +0 -86
  495. unit_tests/sources/test_source.py +0 -684
  496. unit_tests/sources/test_source_read.py +0 -460
  497. unit_tests/test/__init__.py +0 -0
  498. unit_tests/test/mock_http/__init__.py +0 -0
  499. unit_tests/test/mock_http/test_matcher.py +0 -53
  500. unit_tests/test/mock_http/test_mocker.py +0 -214
  501. unit_tests/test/mock_http/test_request.py +0 -117
  502. unit_tests/test/mock_http/test_response_builder.py +0 -177
  503. unit_tests/test/test_entrypoint_wrapper.py +0 -240
  504. unit_tests/utils/__init__.py +0 -0
  505. unit_tests/utils/test_datetime_format_inferrer.py +0 -60
  506. unit_tests/utils/test_mapping_helpers.py +0 -54
  507. unit_tests/utils/test_message_utils.py +0 -91
  508. unit_tests/utils/test_rate_limiting.py +0 -26
  509. unit_tests/utils/test_schema_inferrer.py +0 -202
  510. unit_tests/utils/test_secret_utils.py +0 -135
  511. unit_tests/utils/test_stream_status_utils.py +0 -61
  512. unit_tests/utils/test_traced_exception.py +0 -107
  513. /airbyte_cdk/sources/{deprecated → declarative/async_job}/__init__.py +0 -0
  514. {source_declarative_manifest → airbyte_cdk/sources/declarative/migrations}/__init__.py +0 -0
  515. {unit_tests/destinations → airbyte_cdk/sql}/__init__.py +0 -0
  516. {unit_tests/singer → airbyte_cdk/sql/_util}/__init__.py +0 -0
  517. {airbyte_cdk-0.72.0.dist-info → airbyte_cdk-6.13.1.dev4106.dist-info}/LICENSE.txt +0 -0
@@ -1,332 +0,0 @@
1
- #
2
- # Copyright (c) 2023 Airbyte, Inc., all rights reserved.
3
- #
4
-
5
- from unittest.mock import patch
6
-
7
- from airbyte_cdk.logger import init_logger
8
- from airbyte_cdk.models import ConfiguredAirbyteCatalog, SyncMode, Type
9
- from airbyte_cdk.sources.declarative.incremental.per_partition_cursor import StreamSlice
10
- from airbyte_cdk.sources.declarative.manifest_declarative_source import ManifestDeclarativeSource
11
- from airbyte_cdk.sources.declarative.retrievers.simple_retriever import SimpleRetriever
12
- from airbyte_cdk.sources.declarative.types import Record
13
-
14
- CURSOR_FIELD = "cursor_field"
15
- SYNC_MODE = SyncMode.incremental
16
-
17
-
18
- class ManifestBuilder:
19
- def __init__(self):
20
- self._incremental_sync = {}
21
- self._partition_router = {}
22
- self._substream_partition_router = {}
23
-
24
- def with_list_partition_router(self, stream_name, cursor_field, partitions):
25
- self._partition_router[stream_name] = {
26
- "type": "ListPartitionRouter",
27
- "cursor_field": cursor_field,
28
- "values": partitions,
29
- }
30
- return self
31
-
32
- def with_substream_partition_router(self, stream_name):
33
- self._substream_partition_router[stream_name] = {
34
- "type": "SubstreamPartitionRouter",
35
- "parent_stream_configs": [
36
- {
37
- "type": "ParentStreamConfig",
38
- "stream": "#/definitions/Rates",
39
- "parent_key": "id",
40
- "partition_field": "parent_id",
41
-
42
- }
43
- ]
44
- }
45
- return self
46
-
47
- def with_incremental_sync(self, stream_name, start_datetime, end_datetime, datetime_format, cursor_field, step, cursor_granularity):
48
- self._incremental_sync[stream_name] = {
49
- "type": "DatetimeBasedCursor",
50
- "start_datetime": start_datetime,
51
- "end_datetime": end_datetime,
52
- "datetime_format": datetime_format,
53
- "cursor_field": cursor_field,
54
- "step": step,
55
- "cursor_granularity": cursor_granularity,
56
- }
57
- return self
58
-
59
- def build(self):
60
- manifest = {
61
- "version": "0.34.2",
62
- "type": "DeclarativeSource",
63
- "check": {"type": "CheckStream", "stream_names": ["Rates"]},
64
- "definitions": {
65
- "AnotherStream": {
66
- "type": "DeclarativeStream",
67
- "name": "AnotherStream",
68
- "primary_key": [],
69
- "schema_loader": {
70
- "type": "InlineSchemaLoader",
71
- "schema": {"$schema": "http://json-schema.org/schema#", "properties": {"id": {"type": "string"}}, "type": "object"},
72
- },
73
- "retriever": {
74
- "type": "SimpleRetriever",
75
- "requester": {
76
- "type": "HttpRequester",
77
- "url_base": "https://api.apilayer.com",
78
- "path": "/exchangerates_data/latest",
79
- "http_method": "GET",
80
- },
81
- "record_selector": {"type": "RecordSelector", "extractor": {"type": "DpathExtractor", "field_path": []}},
82
- },
83
- },
84
- "Rates": {
85
- "type": "DeclarativeStream",
86
- "name": "Rates",
87
- "primary_key": [],
88
- "schema_loader": {
89
- "type": "InlineSchemaLoader",
90
- "schema": {"$schema": "http://json-schema.org/schema#", "properties": {}, "type": "object"},
91
- },
92
- "retriever": {
93
- "type": "SimpleRetriever",
94
- "requester": {
95
- "type": "HttpRequester",
96
- "url_base": "https://api.apilayer.com",
97
- "path": "/exchangerates_data/latest",
98
- "http_method": "GET",
99
- },
100
- "record_selector": {"type": "RecordSelector", "extractor": {"type": "DpathExtractor", "field_path": []}},
101
- },
102
- },
103
- },
104
- "streams": [
105
- {"$ref": "#/definitions/Rates"},
106
- {"$ref": "#/definitions/AnotherStream"}
107
- ],
108
- "spec": {
109
- "connection_specification": {
110
- "$schema": "http://json-schema.org/draft-07/schema#",
111
- "type": "object",
112
- "required": [],
113
- "properties": {},
114
- "additionalProperties": True,
115
- },
116
- "documentation_url": "https://example.org",
117
- "type": "Spec",
118
- },
119
- }
120
- for stream_name, incremental_sync_definition in self._incremental_sync.items():
121
- manifest["definitions"][stream_name]["incremental_sync"] = incremental_sync_definition
122
- for stream_name, partition_router_definition in self._partition_router.items():
123
- manifest["definitions"][stream_name]["retriever"]["partition_router"] = partition_router_definition
124
- for stream_name, partition_router_definition in self._substream_partition_router.items():
125
- manifest["definitions"][stream_name]["retriever"]["partition_router"] = partition_router_definition
126
- return manifest
127
-
128
-
129
- def test_given_state_for_only_some_partition_when_stream_slices_then_create_slices_using_state_or_start_from_start_datetime():
130
- source = ManifestDeclarativeSource(
131
- source_config=ManifestBuilder()
132
- .with_list_partition_router("Rates", "partition_field", ["1", "2"])
133
- .with_incremental_sync(
134
- "Rates",
135
- start_datetime="2022-01-01",
136
- end_datetime="2022-02-28",
137
- datetime_format="%Y-%m-%d",
138
- cursor_field=CURSOR_FIELD,
139
- step="P1M",
140
- cursor_granularity="P1D",
141
- )
142
- .build()
143
- )
144
- stream_instance = source.streams({})[0]
145
- stream_instance.state = {
146
- "states": [
147
- {
148
- "partition": {"partition_field": "1"},
149
- "cursor": {CURSOR_FIELD: "2022-02-01"},
150
- }
151
- ]
152
- }
153
-
154
- slices = stream_instance.stream_slices(
155
- sync_mode=SYNC_MODE,
156
- stream_state={},
157
- )
158
-
159
- assert list(slices) == [
160
- {"partition_field": "1", "start_time": "2022-02-01", "end_time": "2022-02-28"},
161
- {"partition_field": "2", "start_time": "2022-01-01", "end_time": "2022-01-31"},
162
- {"partition_field": "2", "start_time": "2022-02-01", "end_time": "2022-02-28"},
163
- ]
164
-
165
-
166
- def test_given_record_for_partition_when_read_then_update_state():
167
- source = ManifestDeclarativeSource(
168
- source_config=ManifestBuilder()
169
- .with_list_partition_router("Rates", "partition_field", ["1", "2"])
170
- .with_incremental_sync(
171
- "Rates",
172
- start_datetime="2022-01-01",
173
- end_datetime="2022-02-28",
174
- datetime_format="%Y-%m-%d",
175
- cursor_field=CURSOR_FIELD,
176
- step="P1M",
177
- cursor_granularity="P1D",
178
- )
179
- .build()
180
- )
181
- stream_instance = source.streams({})[0]
182
- list(stream_instance.stream_slices(sync_mode=SYNC_MODE))
183
-
184
- stream_slice = StreamSlice(partition={"partition_field": "1"},
185
- cursor_slice={"start_time": "2022-01-01", "end_time": "2022-01-31"})
186
- with patch.object(
187
- SimpleRetriever, "_read_pages",
188
- side_effect=[[Record({"a record key": "a record value", CURSOR_FIELD: "2022-01-15"}, stream_slice)]]
189
- ):
190
- list(
191
- stream_instance.read_records(
192
- sync_mode=SYNC_MODE,
193
- stream_slice=stream_slice,
194
- stream_state={"states": []},
195
- cursor_field=CURSOR_FIELD,
196
- )
197
- )
198
-
199
- assert stream_instance.state == {
200
- "states": [
201
- {
202
- "partition": {"partition_field": "1"},
203
- "cursor": {CURSOR_FIELD: "2022-01-15"},
204
- }
205
- ]
206
- }
207
-
208
-
209
- def test_substream_without_input_state():
210
- test_source = ManifestDeclarativeSource(
211
- source_config=ManifestBuilder()
212
- .with_substream_partition_router("AnotherStream")
213
- .with_incremental_sync(
214
- "Rates",
215
- start_datetime="2022-01-01",
216
- end_datetime="2022-02-28",
217
- datetime_format="%Y-%m-%d",
218
- cursor_field=CURSOR_FIELD,
219
- step="P1M",
220
- cursor_granularity="P1D",
221
- )
222
- .with_incremental_sync(
223
- "AnotherStream",
224
- start_datetime="2022-01-01",
225
- end_datetime="2022-02-28",
226
- datetime_format="%Y-%m-%d",
227
- cursor_field=CURSOR_FIELD,
228
- step="P1M",
229
- cursor_granularity="P1D",
230
- )
231
- .build()
232
- )
233
-
234
- stream_instance = test_source.streams({})[1]
235
-
236
- stream_slice = StreamSlice(partition={"parent_id": "1"},
237
- cursor_slice={"start_time": "2022-01-01", "end_time": "2022-01-31"})
238
-
239
- with patch.object(
240
- SimpleRetriever, "_read_pages", side_effect=[[Record({"id": "1", CURSOR_FIELD: "2022-01-15"}, stream_slice)],
241
- [Record({"id": "2", CURSOR_FIELD: "2022-01-15"}, stream_slice)]]
242
- ):
243
- slices = list(stream_instance.stream_slices(sync_mode=SYNC_MODE))
244
- assert list(slices) == [
245
- StreamSlice(partition={"parent_id": "1", "parent_slice": {}, },
246
- cursor_slice={"start_time": "2022-01-01", "end_time": "2022-01-31"}),
247
- StreamSlice(partition={"parent_id": "1", "parent_slice": {}, },
248
- cursor_slice={"start_time": "2022-02-01", "end_time": "2022-02-28"}),
249
- StreamSlice(partition={"parent_id": "2", "parent_slice": {}, },
250
- cursor_slice={"start_time": "2022-01-01", "end_time": "2022-01-31"}),
251
- StreamSlice(partition={"parent_id": "2", "parent_slice": {}, },
252
- cursor_slice={"start_time": "2022-02-01", "end_time": "2022-02-28"}),
253
- ]
254
-
255
-
256
- def test_substream_with_legacy_input_state():
257
- source = ManifestDeclarativeSource(
258
- source_config=ManifestBuilder()
259
- .with_substream_partition_router("AnotherStream")
260
- .with_incremental_sync(
261
- "Rates",
262
- start_datetime="2022-01-01",
263
- end_datetime="2022-02-28",
264
- datetime_format="%Y-%m-%d",
265
- cursor_field=CURSOR_FIELD,
266
- step="P1M",
267
- cursor_granularity="P1D",
268
- )
269
- .with_incremental_sync(
270
- "AnotherStream",
271
- start_datetime="2022-01-01",
272
- end_datetime="2022-02-28",
273
- datetime_format="%Y-%m-%d",
274
- cursor_field=CURSOR_FIELD,
275
- step="P1M",
276
- cursor_granularity="P1D",
277
- )
278
- .build()
279
- )
280
-
281
- stream_instance = source.streams({})[1]
282
-
283
- input_state = {
284
- "states": [
285
- {
286
- "partition": {"item_id": "an_item_id",
287
- "parent_slice": {"end_time": "1629640663", "start_time": "1626962264"},
288
- },
289
- "cursor": {
290
- "updated_at": "1709058818"
291
- }
292
- }
293
- ]
294
- }
295
- stream_instance.state = input_state
296
-
297
- stream_slice = StreamSlice(partition={"parent_id": "1"},
298
- cursor_slice={"start_time": "2022-01-01", "end_time": "2022-01-31"})
299
-
300
- logger = init_logger("airbyte")
301
- configured_catalog = ConfiguredAirbyteCatalog(
302
- streams=[
303
- {
304
- "stream": {"name": "AnotherStream", "json_schema": {}, "supported_sync_modes": ["incremental"]},
305
- "sync_mode": "incremental",
306
- "destination_sync_mode": "overwrite",
307
- },
308
- ]
309
- )
310
-
311
- with patch.object(
312
- SimpleRetriever, "_read_pages", side_effect=[
313
- [Record({"id": "1", CURSOR_FIELD: "2022-01-15"}, stream_slice)],
314
- [Record({"parent_id": "1", CURSOR_FIELD: "2022-01-15"}, stream_slice)],
315
- [Record({"id": "2", CURSOR_FIELD: "2022-01-15"}, stream_slice)],
316
- [Record({"parent_id": "2", CURSOR_FIELD: "2022-01-15"}, stream_slice)]
317
- ]
318
- ):
319
- messages = list(source.read(logger, {}, configured_catalog, input_state))
320
-
321
- output_state_message = [message for message in messages if message.type == Type.STATE][0]
322
-
323
- expected_state = {"states": [
324
- {
325
- "cursor": {
326
- CURSOR_FIELD: "2022-01-15"
327
- },
328
- "partition": {"parent_id": "1", "parent_slice": {}}
329
- }
330
- ]}
331
-
332
- assert output_state_message.state.stream.stream_state == expected_state
@@ -1,3 +0,0 @@
1
- #
2
- # Copyright (c) 2021 Airbyte, Inc., all rights reserved.
3
- #
@@ -1,80 +0,0 @@
1
- #
2
- # Copyright (c) 2023 Airbyte, Inc., all rights reserved.
3
- #
4
- import base64
5
- import hashlib
6
-
7
- import pytest
8
- from airbyte_cdk.sources.declarative.interpolation.jinja import JinjaInterpolation
9
-
10
- interpolation = JinjaInterpolation()
11
-
12
-
13
- def test_hash_md5_no_salt():
14
- input_string = "abcd"
15
- s = "{{ '%s' | hash('md5') }}" % input_string
16
- filter_hash = interpolation.eval(s, config={})
17
-
18
- # compute expected hash calling hashlib directly
19
- hash_obj = hashlib.md5()
20
- hash_obj.update(str(input_string).encode("utf-8"))
21
- hashlib_computed_hash = hash_obj.hexdigest()
22
-
23
- assert filter_hash == hashlib_computed_hash
24
-
25
-
26
- def test_hash_md5_on_numeric_value():
27
- input_value = 123.456
28
- s = "{{ %f | hash('md5') }}" % input_value
29
- filter_hash = interpolation.eval(s, config={})
30
-
31
- # compute expected hash calling hashlib directly
32
- hash_obj = hashlib.md5()
33
- hash_obj.update(str(input_value).encode("utf-8"))
34
- hashlib_computed_hash = hash_obj.hexdigest()
35
-
36
- assert filter_hash == hashlib_computed_hash
37
-
38
-
39
- def test_hash_md5_with_salt():
40
- input_string = "test_input_string"
41
- input_salt = "test_input_salt"
42
-
43
- s = "{{ '%s' | hash('md5', '%s' ) }}" % (input_string, input_salt)
44
- filter_hash = interpolation.eval(s, config={})
45
-
46
- # compute expected value calling hashlib directly
47
- hash_obj = hashlib.md5()
48
- hash_obj.update(str(input_string + input_salt).encode("utf-8"))
49
- hashlib_computed_hash = hash_obj.hexdigest()
50
-
51
- assert filter_hash == hashlib_computed_hash
52
-
53
-
54
- @pytest.mark.parametrize(
55
- "input_string",
56
- ["test_input_client_id", "some_client_secret_1", "12345", "775.78"],
57
- )
58
- def test_base64encode(input_string: str):
59
- s = "{{ '%s' | base64encode }}" % input_string
60
- filter_base64encode = interpolation.eval(s, config={})
61
-
62
- # compute expected base64encode calling base64 library directly
63
- base64_obj = base64.b64encode(input_string.encode("utf-8")).decode()
64
-
65
- assert filter_base64encode == base64_obj
66
-
67
-
68
- @pytest.mark.parametrize(
69
- "input_string, expected_string",
70
- [
71
- ("aW5wdXRfc3RyaW5n", "input_string"),
72
- ("YWlyYnl0ZQ==", "airbyte"),
73
- ("cGFzc3dvcmQ=", "password"),
74
- ],
75
- )
76
- def test_base64decode(input_string: str, expected_string: str):
77
- s = "{{ '%s' | base64decode }}" % input_string
78
- filter_base64decode = interpolation.eval(s, config={})
79
-
80
- assert filter_base64decode == expected_string
@@ -1,40 +0,0 @@
1
- #
2
- # Copyright (c) 2023 Airbyte, Inc., all rights reserved.
3
- #
4
-
5
- import pytest
6
- from airbyte_cdk.sources.declarative.interpolation.interpolated_boolean import InterpolatedBoolean
7
-
8
- config = {
9
- "parent": {"key_with_true": True},
10
- "string_key": "compare_me",
11
- "zero_value": 0,
12
- "empty_array": [],
13
- "non_empty_array": [1],
14
- "empty_dict": {},
15
- "empty_tuple": (),
16
- }
17
-
18
-
19
- @pytest.mark.parametrize(
20
- "test_name, template, expected_result",
21
- [
22
- ("test_interpolated_true_value", "{{ config['parent']['key_with_true'] }}", True),
23
- ("test_interpolated_true_comparison", "{{ config['string_key'] == \"compare_me\" }}", True),
24
- ("test_interpolated_false_condition", "{{ config['string_key'] == \"witness_me\" }}", False),
25
- ("test_path_has_value_returns_true", "{{ config['string_key'] }}", True),
26
- ("test_zero_is_false", "{{ config['zero_value'] }}", False),
27
- ("test_empty_array_is_false", "{{ config['empty_array'] }}", False),
28
- ("test_empty_dict_is_false", "{{ config['empty_dict'] }}", False),
29
- ("test_empty_tuple_is_false", "{{ config['empty_tuple'] }}", False),
30
- ("test_lowercase_false", '{{ "false" }}', False),
31
- ("test_False", "{{ False }}", False),
32
- ("test_True", "{{ True }}", True),
33
- ("test_value_in_array", "{{ 1 in config['non_empty_array'] }}", True),
34
- ("test_value_not_in_array", "{{ 2 in config['non_empty_array'] }}", False),
35
- ("test_interpolation_using_parameters", "{{ parameters['from_parameters'] == \"come_find_me\" }}", True),
36
- ],
37
- )
38
- def test_interpolated_boolean(test_name, template, expected_result):
39
- interpolated_bool = InterpolatedBoolean(condition=template, parameters={"from_parameters": "come_find_me"})
40
- assert interpolated_bool.eval(config) == expected_result
@@ -1,35 +0,0 @@
1
- #
2
- # Copyright (c) 2023 Airbyte, Inc., all rights reserved.
3
- #
4
-
5
- import pytest
6
- from airbyte_cdk.sources.declarative.interpolation.interpolated_mapping import InterpolatedMapping
7
-
8
-
9
- @pytest.mark.parametrize(
10
- "test_name, key, expected_value",
11
- [
12
- ("test_field_value", "field", "value"),
13
- ("test_number", "number", 100),
14
- ("test_field_to_interpolate_from_config", "field_to_interpolate_from_config", "VALUE_FROM_CONFIG"),
15
- ("test_field_to_interpolate_from_kwargs", "field_to_interpolate_from_kwargs", "VALUE_FROM_KWARGS"),
16
- ("test_field_to_interpolate_from_parameters", "field_to_interpolate_from_parameters", "VALUE_FROM_PARAMETERS"),
17
- ("test_key_is_interpolated", "key", "VALUE"),
18
- ],
19
- )
20
- def test(test_name, key, expected_value):
21
- d = {
22
- "field": "value",
23
- "number": 100,
24
- "field_to_interpolate_from_config": "{{ config['c'] }}",
25
- "field_to_interpolate_from_kwargs": "{{ kwargs['a'] }}",
26
- "field_to_interpolate_from_parameters": "{{ parameters['b'] }}",
27
- "{{ parameters.k }}": "VALUE",
28
- }
29
- config = {"c": "VALUE_FROM_CONFIG"}
30
- kwargs = {"a": "VALUE_FROM_KWARGS"}
31
- mapping = InterpolatedMapping(mapping=d, parameters={"b": "VALUE_FROM_PARAMETERS", "k": "key"})
32
-
33
- interpolated = mapping.eval(config, **{"kwargs": kwargs})
34
-
35
- assert interpolated[key] == expected_value
@@ -1,45 +0,0 @@
1
- #
2
- # Copyright (c) 2023 Airbyte, Inc., all rights reserved.
3
- #
4
-
5
- import dpath.util
6
- import pytest
7
- from airbyte_cdk.sources.declarative.interpolation.interpolated_nested_mapping import InterpolatedNestedMapping
8
-
9
-
10
- @pytest.mark.parametrize(
11
- "test_name, path, expected_value",
12
- [
13
- ("test_field_value", "nested/field", "value"),
14
- ("test_number", "nested/number", 100),
15
- ("test_interpolated_number", "nested/nested_array/1/value", 5),
16
- ("test_interpolated_boolean", "nested/nested_array/2/value", True),
17
- ("test_field_to_interpolate_from_config", "nested/config_value", "VALUE_FROM_CONFIG"),
18
- ("test_field_to_interpolate_from_kwargs", "nested/kwargs_value", "VALUE_FROM_KWARGS"),
19
- ("test_field_to_interpolate_from_parameters", "nested/parameters_value", "VALUE_FROM_PARAMETERS"),
20
- ("test_key_is_interpolated", "nested/nested_array/0/key", "VALUE"),
21
- ],
22
- )
23
- def test(test_name, path, expected_value):
24
- d = {
25
- "nested": {
26
- "field": "value",
27
- "number": 100,
28
- "nested_array": [
29
- {"{{ parameters.k }}": "VALUE"},
30
- {"value": "{{ config['num_value'] | int + 2 }}"},
31
- {"value": "{{ True }}"},
32
- ],
33
- "config_value": "{{ config['c'] }}",
34
- "parameters_value": "{{ parameters['b'] }}",
35
- "kwargs_value": "{{ kwargs['a'] }}",
36
- }
37
- }
38
-
39
- config = {"c": "VALUE_FROM_CONFIG", "num_value": 3}
40
- kwargs = {"a": "VALUE_FROM_KWARGS"}
41
- mapping = InterpolatedNestedMapping(mapping=d, parameters={"b": "VALUE_FROM_PARAMETERS", "k": "key"})
42
-
43
- interpolated = mapping.eval(config, **{"kwargs": kwargs})
44
-
45
- assert dpath.util.get(interpolated, path) == expected_value
@@ -1,25 +0,0 @@
1
- #
2
- # Copyright (c) 2023 Airbyte, Inc., all rights reserved.
3
- #
4
-
5
- import pytest
6
- from airbyte_cdk.sources.declarative.interpolation.interpolated_string import InterpolatedString
7
-
8
- config = {"field": "value"}
9
- parameters = {"hello": "world"}
10
- kwargs = {"c": "airbyte"}
11
-
12
-
13
- @pytest.mark.parametrize(
14
- "test_name, input_string, expected_value",
15
- [
16
- ("test_static_value", "HELLO WORLD", "HELLO WORLD"),
17
- ("test_eval_from_parameters", "{{ parameters['hello'] }}", "world"),
18
- ("test_eval_from_config", "{{ config['field'] }}", "value"),
19
- ("test_eval_from_kwargs", "{{ kwargs['c'] }}", "airbyte"),
20
- ("test_eval_from_kwargs", "{{ kwargs['c'] }}", "airbyte"),
21
- ],
22
- )
23
- def test_interpolated_string(test_name, input_string, expected_value):
24
- s = InterpolatedString.create(input_string, parameters=parameters)
25
- assert s.eval(config, **{"kwargs": kwargs}) == expected_value