airbyte-cdk 0.72.1__py3-none-any.whl → 6.13.1.dev4106__py3-none-any.whl
Sign up to get free protection for your applications and to get access to all the features.
- airbyte_cdk/__init__.py +355 -6
- airbyte_cdk/cli/__init__.py +1 -0
- airbyte_cdk/cli/source_declarative_manifest/__init__.py +5 -0
- airbyte_cdk/cli/source_declarative_manifest/_run.py +230 -0
- airbyte_cdk/cli/source_declarative_manifest/spec.json +17 -0
- airbyte_cdk/config_observation.py +29 -10
- airbyte_cdk/connector.py +24 -24
- airbyte_cdk/connector_builder/README.md +53 -0
- airbyte_cdk/connector_builder/connector_builder_handler.py +37 -11
- airbyte_cdk/connector_builder/main.py +45 -13
- airbyte_cdk/connector_builder/message_grouper.py +189 -50
- airbyte_cdk/connector_builder/models.py +3 -2
- airbyte_cdk/destinations/__init__.py +4 -3
- airbyte_cdk/destinations/destination.py +54 -20
- airbyte_cdk/destinations/vector_db_based/README.md +37 -0
- airbyte_cdk/destinations/vector_db_based/config.py +40 -17
- airbyte_cdk/destinations/vector_db_based/document_processor.py +56 -17
- airbyte_cdk/destinations/vector_db_based/embedder.py +57 -15
- airbyte_cdk/destinations/vector_db_based/test_utils.py +14 -4
- airbyte_cdk/destinations/vector_db_based/utils.py +8 -2
- airbyte_cdk/destinations/vector_db_based/writer.py +24 -5
- airbyte_cdk/entrypoint.py +153 -44
- airbyte_cdk/exception_handler.py +21 -3
- airbyte_cdk/logger.py +30 -44
- airbyte_cdk/models/__init__.py +13 -2
- airbyte_cdk/models/airbyte_protocol.py +86 -1
- airbyte_cdk/models/airbyte_protocol_serializers.py +44 -0
- airbyte_cdk/models/file_transfer_record_message.py +13 -0
- airbyte_cdk/models/well_known_types.py +1 -1
- airbyte_cdk/sources/__init__.py +5 -1
- airbyte_cdk/sources/abstract_source.py +125 -79
- airbyte_cdk/sources/concurrent_source/__init__.py +7 -2
- airbyte_cdk/sources/concurrent_source/concurrent_read_processor.py +102 -36
- airbyte_cdk/sources/concurrent_source/concurrent_source.py +29 -36
- airbyte_cdk/sources/concurrent_source/concurrent_source_adapter.py +94 -10
- airbyte_cdk/sources/concurrent_source/stream_thread_exception.py +25 -0
- airbyte_cdk/sources/concurrent_source/thread_pool_manager.py +20 -14
- airbyte_cdk/sources/config.py +3 -2
- airbyte_cdk/sources/connector_state_manager.py +49 -83
- airbyte_cdk/sources/declarative/async_job/job.py +52 -0
- airbyte_cdk/sources/declarative/async_job/job_orchestrator.py +497 -0
- airbyte_cdk/sources/declarative/async_job/job_tracker.py +75 -0
- airbyte_cdk/sources/declarative/async_job/repository.py +35 -0
- airbyte_cdk/sources/declarative/async_job/status.py +24 -0
- airbyte_cdk/sources/declarative/async_job/timer.py +39 -0
- airbyte_cdk/sources/declarative/auth/__init__.py +2 -3
- airbyte_cdk/sources/declarative/auth/declarative_authenticator.py +3 -1
- airbyte_cdk/sources/declarative/auth/jwt.py +191 -0
- airbyte_cdk/sources/declarative/auth/oauth.py +60 -20
- airbyte_cdk/sources/declarative/auth/selective_authenticator.py +10 -2
- airbyte_cdk/sources/declarative/auth/token.py +28 -10
- airbyte_cdk/sources/declarative/auth/token_provider.py +9 -8
- airbyte_cdk/sources/declarative/checks/check_stream.py +16 -8
- airbyte_cdk/sources/declarative/checks/connection_checker.py +4 -2
- airbyte_cdk/sources/declarative/concurrency_level/__init__.py +7 -0
- airbyte_cdk/sources/declarative/concurrency_level/concurrency_level.py +50 -0
- airbyte_cdk/sources/declarative/concurrent_declarative_source.py +421 -0
- airbyte_cdk/sources/declarative/datetime/datetime_parser.py +4 -0
- airbyte_cdk/sources/declarative/datetime/min_max_datetime.py +26 -6
- airbyte_cdk/sources/declarative/declarative_component_schema.yaml +1185 -85
- airbyte_cdk/sources/declarative/declarative_source.py +5 -2
- airbyte_cdk/sources/declarative/declarative_stream.py +95 -9
- airbyte_cdk/sources/declarative/decoders/__init__.py +23 -2
- airbyte_cdk/sources/declarative/decoders/composite_raw_decoder.py +97 -0
- airbyte_cdk/sources/declarative/decoders/decoder.py +11 -4
- airbyte_cdk/sources/declarative/decoders/json_decoder.py +92 -5
- airbyte_cdk/sources/declarative/decoders/noop_decoder.py +21 -0
- airbyte_cdk/sources/declarative/decoders/pagination_decoder_decorator.py +39 -0
- airbyte_cdk/sources/declarative/decoders/xml_decoder.py +98 -0
- airbyte_cdk/sources/declarative/extractors/__init__.py +12 -1
- airbyte_cdk/sources/declarative/extractors/dpath_extractor.py +29 -24
- airbyte_cdk/sources/declarative/extractors/http_selector.py +4 -5
- airbyte_cdk/sources/declarative/extractors/record_extractor.py +2 -3
- airbyte_cdk/sources/declarative/extractors/record_filter.py +65 -8
- airbyte_cdk/sources/declarative/extractors/record_selector.py +85 -26
- airbyte_cdk/sources/declarative/extractors/response_to_file_extractor.py +177 -0
- airbyte_cdk/sources/declarative/extractors/type_transformer.py +55 -0
- airbyte_cdk/sources/declarative/incremental/__init__.py +25 -3
- airbyte_cdk/sources/declarative/incremental/datetime_based_cursor.py +156 -48
- airbyte_cdk/sources/declarative/incremental/declarative_cursor.py +13 -0
- airbyte_cdk/sources/declarative/incremental/global_substream_cursor.py +350 -0
- airbyte_cdk/sources/declarative/incremental/per_partition_cursor.py +159 -74
- airbyte_cdk/sources/declarative/incremental/per_partition_with_global.py +200 -0
- airbyte_cdk/sources/declarative/incremental/resumable_full_refresh_cursor.py +122 -0
- airbyte_cdk/sources/declarative/interpolation/filters.py +27 -1
- airbyte_cdk/sources/declarative/interpolation/interpolated_boolean.py +23 -5
- airbyte_cdk/sources/declarative/interpolation/interpolated_mapping.py +12 -8
- airbyte_cdk/sources/declarative/interpolation/interpolated_nested_mapping.py +13 -6
- airbyte_cdk/sources/declarative/interpolation/interpolated_string.py +21 -6
- airbyte_cdk/sources/declarative/interpolation/interpolation.py +9 -3
- airbyte_cdk/sources/declarative/interpolation/jinja.py +72 -37
- airbyte_cdk/sources/declarative/interpolation/macros.py +72 -17
- airbyte_cdk/sources/declarative/manifest_declarative_source.py +193 -52
- airbyte_cdk/sources/declarative/migrations/legacy_to_per_partition_state_migration.py +98 -0
- airbyte_cdk/sources/declarative/migrations/state_migration.py +24 -0
- airbyte_cdk/sources/declarative/models/__init__.py +1 -1
- airbyte_cdk/sources/declarative/models/declarative_component_schema.py +1319 -603
- airbyte_cdk/sources/declarative/parsers/custom_exceptions.py +2 -2
- airbyte_cdk/sources/declarative/parsers/manifest_component_transformer.py +26 -4
- airbyte_cdk/sources/declarative/parsers/manifest_reference_resolver.py +26 -15
- airbyte_cdk/sources/declarative/parsers/model_to_component_factory.py +1695 -225
- airbyte_cdk/sources/declarative/partition_routers/__init__.py +24 -4
- airbyte_cdk/sources/declarative/partition_routers/async_job_partition_router.py +65 -0
- airbyte_cdk/sources/declarative/partition_routers/cartesian_product_stream_slicer.py +176 -0
- airbyte_cdk/sources/declarative/partition_routers/list_partition_router.py +39 -9
- airbyte_cdk/sources/declarative/partition_routers/partition_router.py +62 -0
- airbyte_cdk/sources/declarative/partition_routers/single_partition_router.py +15 -3
- airbyte_cdk/sources/declarative/partition_routers/substream_partition_router.py +222 -39
- airbyte_cdk/sources/declarative/requesters/error_handlers/__init__.py +19 -5
- airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/__init__.py +3 -1
- airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/constant_backoff_strategy.py +19 -7
- airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/exponential_backoff_strategy.py +19 -7
- airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/header_helper.py +4 -2
- airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/wait_time_from_header_backoff_strategy.py +41 -9
- airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/wait_until_time_from_header_backoff_strategy.py +29 -14
- airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategy.py +5 -13
- airbyte_cdk/sources/declarative/requesters/error_handlers/composite_error_handler.py +32 -16
- airbyte_cdk/sources/declarative/requesters/error_handlers/default_error_handler.py +46 -56
- airbyte_cdk/sources/declarative/requesters/error_handlers/default_http_response_filter.py +40 -0
- airbyte_cdk/sources/declarative/requesters/error_handlers/error_handler.py +6 -32
- airbyte_cdk/sources/declarative/requesters/error_handlers/http_response_filter.py +119 -41
- airbyte_cdk/sources/declarative/requesters/http_job_repository.py +228 -0
- airbyte_cdk/sources/declarative/requesters/http_requester.py +98 -344
- airbyte_cdk/sources/declarative/requesters/paginators/__init__.py +14 -3
- airbyte_cdk/sources/declarative/requesters/paginators/default_paginator.py +105 -46
- airbyte_cdk/sources/declarative/requesters/paginators/no_pagination.py +14 -8
- airbyte_cdk/sources/declarative/requesters/paginators/paginator.py +19 -8
- airbyte_cdk/sources/declarative/requesters/paginators/strategies/__init__.py +9 -3
- airbyte_cdk/sources/declarative/requesters/paginators/strategies/cursor_pagination_strategy.py +53 -21
- airbyte_cdk/sources/declarative/requesters/paginators/strategies/offset_increment.py +42 -19
- airbyte_cdk/sources/declarative/requesters/paginators/strategies/page_increment.py +25 -12
- airbyte_cdk/sources/declarative/requesters/paginators/strategies/pagination_strategy.py +13 -10
- airbyte_cdk/sources/declarative/requesters/paginators/strategies/stop_condition.py +26 -13
- airbyte_cdk/sources/declarative/requesters/request_options/__init__.py +15 -2
- airbyte_cdk/sources/declarative/requesters/request_options/datetime_based_request_options_provider.py +91 -0
- airbyte_cdk/sources/declarative/requesters/request_options/default_request_options_provider.py +60 -0
- airbyte_cdk/sources/declarative/requesters/request_options/interpolated_nested_request_input_provider.py +31 -14
- airbyte_cdk/sources/declarative/requesters/request_options/interpolated_request_input_provider.py +27 -15
- airbyte_cdk/sources/declarative/requesters/request_options/interpolated_request_options_provider.py +63 -10
- airbyte_cdk/sources/declarative/requesters/request_options/request_options_provider.py +1 -1
- airbyte_cdk/sources/declarative/requesters/requester.py +9 -17
- airbyte_cdk/sources/declarative/resolvers/__init__.py +41 -0
- airbyte_cdk/sources/declarative/resolvers/components_resolver.py +55 -0
- airbyte_cdk/sources/declarative/resolvers/config_components_resolver.py +136 -0
- airbyte_cdk/sources/declarative/resolvers/http_components_resolver.py +112 -0
- airbyte_cdk/sources/declarative/retrievers/__init__.py +6 -2
- airbyte_cdk/sources/declarative/retrievers/async_retriever.py +100 -0
- airbyte_cdk/sources/declarative/retrievers/retriever.py +1 -3
- airbyte_cdk/sources/declarative/retrievers/simple_retriever.py +228 -72
- airbyte_cdk/sources/declarative/schema/__init__.py +14 -1
- airbyte_cdk/sources/declarative/schema/default_schema_loader.py +5 -3
- airbyte_cdk/sources/declarative/schema/dynamic_schema_loader.py +236 -0
- airbyte_cdk/sources/declarative/schema/json_file_schema_loader.py +8 -8
- airbyte_cdk/sources/declarative/spec/spec.py +12 -5
- airbyte_cdk/sources/declarative/stream_slicers/__init__.py +1 -2
- airbyte_cdk/sources/declarative/stream_slicers/declarative_partition_generator.py +88 -0
- airbyte_cdk/sources/declarative/stream_slicers/stream_slicer.py +9 -14
- airbyte_cdk/sources/declarative/transformations/add_fields.py +19 -11
- airbyte_cdk/sources/declarative/transformations/flatten_fields.py +52 -0
- airbyte_cdk/sources/declarative/transformations/keys_replace_transformation.py +61 -0
- airbyte_cdk/sources/declarative/transformations/keys_to_lower_transformation.py +22 -0
- airbyte_cdk/sources/declarative/transformations/keys_to_snake_transformation.py +68 -0
- airbyte_cdk/sources/declarative/transformations/remove_fields.py +13 -10
- airbyte_cdk/sources/declarative/transformations/transformation.py +5 -5
- airbyte_cdk/sources/declarative/types.py +19 -110
- airbyte_cdk/sources/declarative/yaml_declarative_source.py +31 -10
- airbyte_cdk/sources/embedded/base_integration.py +16 -5
- airbyte_cdk/sources/embedded/catalog.py +16 -4
- airbyte_cdk/sources/embedded/runner.py +19 -3
- airbyte_cdk/sources/embedded/tools.py +5 -2
- airbyte_cdk/sources/file_based/README.md +152 -0
- airbyte_cdk/sources/file_based/__init__.py +24 -0
- airbyte_cdk/sources/file_based/availability_strategy/__init__.py +9 -2
- airbyte_cdk/sources/file_based/availability_strategy/abstract_file_based_availability_strategy.py +22 -6
- airbyte_cdk/sources/file_based/availability_strategy/default_file_based_availability_strategy.py +46 -10
- airbyte_cdk/sources/file_based/config/abstract_file_based_spec.py +58 -10
- airbyte_cdk/sources/file_based/config/avro_format.py +2 -1
- airbyte_cdk/sources/file_based/config/csv_format.py +29 -10
- airbyte_cdk/sources/file_based/config/excel_format.py +18 -0
- airbyte_cdk/sources/file_based/config/file_based_stream_config.py +16 -4
- airbyte_cdk/sources/file_based/config/jsonl_format.py +2 -1
- airbyte_cdk/sources/file_based/config/parquet_format.py +2 -1
- airbyte_cdk/sources/file_based/config/unstructured_format.py +13 -5
- airbyte_cdk/sources/file_based/discovery_policy/__init__.py +6 -2
- airbyte_cdk/sources/file_based/discovery_policy/abstract_discovery_policy.py +2 -4
- airbyte_cdk/sources/file_based/discovery_policy/default_discovery_policy.py +7 -2
- airbyte_cdk/sources/file_based/exceptions.py +52 -15
- airbyte_cdk/sources/file_based/file_based_source.py +163 -33
- airbyte_cdk/sources/file_based/file_based_stream_reader.py +83 -5
- airbyte_cdk/sources/file_based/file_types/__init__.py +14 -1
- airbyte_cdk/sources/file_based/file_types/avro_parser.py +75 -24
- airbyte_cdk/sources/file_based/file_types/csv_parser.py +116 -34
- airbyte_cdk/sources/file_based/file_types/excel_parser.py +196 -0
- airbyte_cdk/sources/file_based/file_types/file_transfer.py +37 -0
- airbyte_cdk/sources/file_based/file_types/file_type_parser.py +4 -1
- airbyte_cdk/sources/file_based/file_types/jsonl_parser.py +24 -8
- airbyte_cdk/sources/file_based/file_types/parquet_parser.py +60 -18
- airbyte_cdk/sources/file_based/file_types/unstructured_parser.py +145 -41
- airbyte_cdk/sources/file_based/remote_file.py +1 -1
- airbyte_cdk/sources/file_based/schema_helpers.py +38 -10
- airbyte_cdk/sources/file_based/schema_validation_policies/__init__.py +3 -1
- airbyte_cdk/sources/file_based/schema_validation_policies/abstract_schema_validation_policy.py +3 -1
- airbyte_cdk/sources/file_based/schema_validation_policies/default_schema_validation_policies.py +16 -5
- airbyte_cdk/sources/file_based/stream/abstract_file_based_stream.py +50 -13
- airbyte_cdk/sources/file_based/stream/concurrent/adapters.py +67 -27
- airbyte_cdk/sources/file_based/stream/concurrent/cursor/__init__.py +5 -1
- airbyte_cdk/sources/file_based/stream/concurrent/cursor/abstract_concurrent_file_based_cursor.py +14 -23
- airbyte_cdk/sources/file_based/stream/concurrent/cursor/file_based_concurrent_cursor.py +54 -18
- airbyte_cdk/sources/file_based/stream/concurrent/cursor/file_based_final_state_cursor.py +21 -9
- airbyte_cdk/sources/file_based/stream/cursor/abstract_file_based_cursor.py +3 -1
- airbyte_cdk/sources/file_based/stream/cursor/default_file_based_cursor.py +27 -10
- airbyte_cdk/sources/file_based/stream/default_file_based_stream.py +175 -45
- airbyte_cdk/sources/http_logger.py +8 -3
- airbyte_cdk/sources/message/__init__.py +7 -1
- airbyte_cdk/sources/message/repository.py +18 -4
- airbyte_cdk/sources/source.py +42 -38
- airbyte_cdk/sources/streams/__init__.py +2 -2
- airbyte_cdk/sources/streams/availability_strategy.py +54 -3
- airbyte_cdk/sources/streams/call_rate.py +64 -21
- airbyte_cdk/sources/streams/checkpoint/__init__.py +26 -0
- airbyte_cdk/sources/streams/checkpoint/checkpoint_reader.py +335 -0
- airbyte_cdk/sources/{declarative/incremental → streams/checkpoint}/cursor.py +17 -14
- airbyte_cdk/sources/streams/checkpoint/per_partition_key_serializer.py +22 -0
- airbyte_cdk/sources/streams/checkpoint/resumable_full_refresh_cursor.py +51 -0
- airbyte_cdk/sources/streams/checkpoint/substream_resumable_full_refresh_cursor.py +110 -0
- airbyte_cdk/sources/streams/concurrent/README.md +7 -0
- airbyte_cdk/sources/streams/concurrent/abstract_stream.py +7 -2
- airbyte_cdk/sources/streams/concurrent/adapters.py +84 -75
- airbyte_cdk/sources/streams/concurrent/availability_strategy.py +30 -2
- airbyte_cdk/sources/streams/concurrent/cursor.py +298 -42
- airbyte_cdk/sources/streams/concurrent/default_stream.py +12 -3
- airbyte_cdk/sources/streams/concurrent/exceptions.py +3 -0
- airbyte_cdk/sources/streams/concurrent/helpers.py +14 -3
- airbyte_cdk/sources/streams/concurrent/partition_enqueuer.py +12 -3
- airbyte_cdk/sources/streams/concurrent/partition_reader.py +10 -3
- airbyte_cdk/sources/streams/concurrent/partitions/partition.py +1 -16
- airbyte_cdk/sources/streams/concurrent/partitions/stream_slicer.py +21 -0
- airbyte_cdk/sources/streams/concurrent/partitions/types.py +15 -5
- airbyte_cdk/sources/streams/concurrent/state_converters/abstract_stream_state_converter.py +109 -17
- airbyte_cdk/sources/streams/concurrent/state_converters/datetime_stream_state_converter.py +90 -72
- airbyte_cdk/sources/streams/core.py +412 -87
- airbyte_cdk/sources/streams/http/__init__.py +2 -1
- airbyte_cdk/sources/streams/http/availability_strategy.py +12 -101
- airbyte_cdk/sources/streams/http/error_handlers/__init__.py +22 -0
- airbyte_cdk/sources/streams/http/error_handlers/backoff_strategy.py +28 -0
- airbyte_cdk/sources/streams/http/error_handlers/default_backoff_strategy.py +17 -0
- airbyte_cdk/sources/streams/http/error_handlers/default_error_mapping.py +86 -0
- airbyte_cdk/sources/streams/http/error_handlers/error_handler.py +42 -0
- airbyte_cdk/sources/streams/http/error_handlers/error_message_parser.py +19 -0
- airbyte_cdk/sources/streams/http/error_handlers/http_status_error_handler.py +110 -0
- airbyte_cdk/sources/streams/http/error_handlers/json_error_message_parser.py +52 -0
- airbyte_cdk/sources/streams/http/error_handlers/response_models.py +65 -0
- airbyte_cdk/sources/streams/http/exceptions.py +27 -7
- airbyte_cdk/sources/streams/http/http.py +369 -246
- airbyte_cdk/sources/streams/http/http_client.py +531 -0
- airbyte_cdk/sources/streams/http/rate_limiting.py +76 -12
- airbyte_cdk/sources/streams/http/requests_native_auth/abstract_oauth.py +28 -9
- airbyte_cdk/sources/streams/http/requests_native_auth/abstract_token.py +2 -1
- airbyte_cdk/sources/streams/http/requests_native_auth/oauth.py +90 -35
- airbyte_cdk/sources/streams/http/requests_native_auth/token.py +13 -3
- airbyte_cdk/sources/types.py +154 -0
- airbyte_cdk/sources/utils/record_helper.py +36 -21
- airbyte_cdk/sources/utils/schema_helpers.py +13 -6
- airbyte_cdk/sources/utils/slice_logger.py +4 -1
- airbyte_cdk/sources/utils/transform.py +54 -20
- airbyte_cdk/sql/_util/hashing.py +34 -0
- airbyte_cdk/sql/_util/name_normalizers.py +92 -0
- airbyte_cdk/sql/constants.py +32 -0
- airbyte_cdk/sql/exceptions.py +235 -0
- airbyte_cdk/sql/secrets.py +123 -0
- airbyte_cdk/sql/shared/__init__.py +15 -0
- airbyte_cdk/sql/shared/catalog_providers.py +145 -0
- airbyte_cdk/sql/shared/sql_processor.py +786 -0
- airbyte_cdk/sql/types.py +160 -0
- airbyte_cdk/test/catalog_builder.py +70 -18
- airbyte_cdk/test/entrypoint_wrapper.py +117 -42
- airbyte_cdk/test/mock_http/__init__.py +1 -1
- airbyte_cdk/test/mock_http/matcher.py +6 -0
- airbyte_cdk/test/mock_http/mocker.py +57 -10
- airbyte_cdk/test/mock_http/request.py +19 -3
- airbyte_cdk/test/mock_http/response.py +3 -1
- airbyte_cdk/test/mock_http/response_builder.py +32 -16
- airbyte_cdk/test/state_builder.py +18 -10
- airbyte_cdk/test/utils/__init__.py +1 -0
- airbyte_cdk/test/utils/data.py +24 -0
- airbyte_cdk/test/utils/http_mocking.py +16 -0
- airbyte_cdk/test/utils/manifest_only_fixtures.py +60 -0
- airbyte_cdk/test/utils/reading.py +26 -0
- airbyte_cdk/utils/__init__.py +2 -1
- airbyte_cdk/utils/airbyte_secrets_utils.py +5 -3
- airbyte_cdk/utils/analytics_message.py +10 -2
- airbyte_cdk/utils/datetime_format_inferrer.py +4 -1
- airbyte_cdk/utils/event_timing.py +10 -10
- airbyte_cdk/utils/mapping_helpers.py +3 -1
- airbyte_cdk/utils/message_utils.py +20 -11
- airbyte_cdk/utils/print_buffer.py +75 -0
- airbyte_cdk/utils/schema_inferrer.py +198 -28
- airbyte_cdk/utils/slice_hasher.py +30 -0
- airbyte_cdk/utils/spec_schema_transformations.py +6 -3
- airbyte_cdk/utils/stream_status_utils.py +8 -1
- airbyte_cdk/utils/traced_exception.py +61 -21
- airbyte_cdk-6.13.1.dev4106.dist-info/METADATA +109 -0
- airbyte_cdk-6.13.1.dev4106.dist-info/RECORD +349 -0
- {airbyte_cdk-0.72.1.dist-info → airbyte_cdk-6.13.1.dev4106.dist-info}/WHEEL +1 -2
- airbyte_cdk-6.13.1.dev4106.dist-info/entry_points.txt +3 -0
- airbyte_cdk/sources/declarative/create_partial.py +0 -92
- airbyte_cdk/sources/declarative/parsers/class_types_registry.py +0 -102
- airbyte_cdk/sources/declarative/parsers/default_implementation_registry.py +0 -64
- airbyte_cdk/sources/declarative/requesters/error_handlers/response_action.py +0 -16
- airbyte_cdk/sources/declarative/requesters/error_handlers/response_status.py +0 -68
- airbyte_cdk/sources/declarative/stream_slicers/cartesian_product_stream_slicer.py +0 -114
- airbyte_cdk/sources/deprecated/base_source.py +0 -94
- airbyte_cdk/sources/deprecated/client.py +0 -99
- airbyte_cdk/sources/singer/__init__.py +0 -8
- airbyte_cdk/sources/singer/singer_helpers.py +0 -304
- airbyte_cdk/sources/singer/source.py +0 -186
- airbyte_cdk/sources/streams/concurrent/partitions/record.py +0 -23
- airbyte_cdk/sources/streams/http/auth/__init__.py +0 -17
- airbyte_cdk/sources/streams/http/auth/core.py +0 -29
- airbyte_cdk/sources/streams/http/auth/oauth.py +0 -113
- airbyte_cdk/sources/streams/http/auth/token.py +0 -47
- airbyte_cdk/sources/streams/utils/stream_helper.py +0 -40
- airbyte_cdk/sources/utils/catalog_helpers.py +0 -22
- airbyte_cdk/sources/utils/schema_models.py +0 -84
- airbyte_cdk-0.72.1.dist-info/METADATA +0 -243
- airbyte_cdk-0.72.1.dist-info/RECORD +0 -466
- airbyte_cdk-0.72.1.dist-info/top_level.txt +0 -3
- source_declarative_manifest/main.py +0 -29
- unit_tests/connector_builder/__init__.py +0 -3
- unit_tests/connector_builder/test_connector_builder_handler.py +0 -871
- unit_tests/connector_builder/test_message_grouper.py +0 -713
- unit_tests/connector_builder/utils.py +0 -27
- unit_tests/destinations/test_destination.py +0 -243
- unit_tests/singer/test_singer_helpers.py +0 -56
- unit_tests/singer/test_singer_source.py +0 -112
- unit_tests/sources/__init__.py +0 -0
- unit_tests/sources/concurrent_source/__init__.py +0 -3
- unit_tests/sources/concurrent_source/test_concurrent_source_adapter.py +0 -106
- unit_tests/sources/declarative/__init__.py +0 -3
- unit_tests/sources/declarative/auth/__init__.py +0 -3
- unit_tests/sources/declarative/auth/test_oauth.py +0 -331
- unit_tests/sources/declarative/auth/test_selective_authenticator.py +0 -39
- unit_tests/sources/declarative/auth/test_session_token_auth.py +0 -182
- unit_tests/sources/declarative/auth/test_token_auth.py +0 -200
- unit_tests/sources/declarative/auth/test_token_provider.py +0 -73
- unit_tests/sources/declarative/checks/__init__.py +0 -3
- unit_tests/sources/declarative/checks/test_check_stream.py +0 -146
- unit_tests/sources/declarative/decoders/__init__.py +0 -0
- unit_tests/sources/declarative/decoders/test_json_decoder.py +0 -16
- unit_tests/sources/declarative/external_component.py +0 -13
- unit_tests/sources/declarative/extractors/__init__.py +0 -3
- unit_tests/sources/declarative/extractors/test_dpath_extractor.py +0 -55
- unit_tests/sources/declarative/extractors/test_record_filter.py +0 -55
- unit_tests/sources/declarative/extractors/test_record_selector.py +0 -179
- unit_tests/sources/declarative/incremental/__init__.py +0 -0
- unit_tests/sources/declarative/incremental/test_datetime_based_cursor.py +0 -860
- unit_tests/sources/declarative/incremental/test_per_partition_cursor.py +0 -406
- unit_tests/sources/declarative/incremental/test_per_partition_cursor_integration.py +0 -332
- unit_tests/sources/declarative/interpolation/__init__.py +0 -3
- unit_tests/sources/declarative/interpolation/test_filters.py +0 -80
- unit_tests/sources/declarative/interpolation/test_interpolated_boolean.py +0 -40
- unit_tests/sources/declarative/interpolation/test_interpolated_mapping.py +0 -35
- unit_tests/sources/declarative/interpolation/test_interpolated_nested_mapping.py +0 -45
- unit_tests/sources/declarative/interpolation/test_interpolated_string.py +0 -25
- unit_tests/sources/declarative/interpolation/test_jinja.py +0 -240
- unit_tests/sources/declarative/interpolation/test_macros.py +0 -73
- unit_tests/sources/declarative/parsers/__init__.py +0 -3
- unit_tests/sources/declarative/parsers/test_manifest_component_transformer.py +0 -406
- unit_tests/sources/declarative/parsers/test_manifest_reference_resolver.py +0 -139
- unit_tests/sources/declarative/parsers/test_model_to_component_factory.py +0 -1847
- unit_tests/sources/declarative/parsers/testing_components.py +0 -36
- unit_tests/sources/declarative/partition_routers/__init__.py +0 -3
- unit_tests/sources/declarative/partition_routers/test_list_partition_router.py +0 -155
- unit_tests/sources/declarative/partition_routers/test_single_partition_router.py +0 -14
- unit_tests/sources/declarative/partition_routers/test_substream_partition_router.py +0 -404
- unit_tests/sources/declarative/requesters/__init__.py +0 -3
- unit_tests/sources/declarative/requesters/error_handlers/__init__.py +0 -3
- unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/__init__.py +0 -3
- unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/test_constant_backoff.py +0 -34
- unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/test_exponential_backoff.py +0 -36
- unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/test_header_helper.py +0 -38
- unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/test_wait_time_from_header.py +0 -35
- unit_tests/sources/declarative/requesters/error_handlers/backoff_strategies/test_wait_until_time_from_header.py +0 -64
- unit_tests/sources/declarative/requesters/error_handlers/test_composite_error_handler.py +0 -213
- unit_tests/sources/declarative/requesters/error_handlers/test_default_error_handler.py +0 -178
- unit_tests/sources/declarative/requesters/error_handlers/test_http_response_filter.py +0 -121
- unit_tests/sources/declarative/requesters/error_handlers/test_response_status.py +0 -44
- unit_tests/sources/declarative/requesters/paginators/__init__.py +0 -3
- unit_tests/sources/declarative/requesters/paginators/test_cursor_pagination_strategy.py +0 -64
- unit_tests/sources/declarative/requesters/paginators/test_default_paginator.py +0 -313
- unit_tests/sources/declarative/requesters/paginators/test_no_paginator.py +0 -12
- unit_tests/sources/declarative/requesters/paginators/test_offset_increment.py +0 -58
- unit_tests/sources/declarative/requesters/paginators/test_page_increment.py +0 -70
- unit_tests/sources/declarative/requesters/paginators/test_request_option.py +0 -43
- unit_tests/sources/declarative/requesters/paginators/test_stop_condition.py +0 -105
- unit_tests/sources/declarative/requesters/request_options/__init__.py +0 -3
- unit_tests/sources/declarative/requesters/request_options/test_interpolated_request_options_provider.py +0 -101
- unit_tests/sources/declarative/requesters/test_http_requester.py +0 -974
- unit_tests/sources/declarative/requesters/test_interpolated_request_input_provider.py +0 -32
- unit_tests/sources/declarative/retrievers/__init__.py +0 -3
- unit_tests/sources/declarative/retrievers/test_simple_retriever.py +0 -542
- unit_tests/sources/declarative/schema/__init__.py +0 -6
- unit_tests/sources/declarative/schema/source_test/SourceTest.py +0 -8
- unit_tests/sources/declarative/schema/source_test/__init__.py +0 -3
- unit_tests/sources/declarative/schema/test_default_schema_loader.py +0 -32
- unit_tests/sources/declarative/schema/test_inline_schema_loader.py +0 -19
- unit_tests/sources/declarative/schema/test_json_file_schema_loader.py +0 -26
- unit_tests/sources/declarative/states/__init__.py +0 -3
- unit_tests/sources/declarative/stream_slicers/__init__.py +0 -3
- unit_tests/sources/declarative/stream_slicers/test_cartesian_product_stream_slicer.py +0 -225
- unit_tests/sources/declarative/test_create_partial.py +0 -83
- unit_tests/sources/declarative/test_declarative_stream.py +0 -103
- unit_tests/sources/declarative/test_manifest_declarative_source.py +0 -1260
- unit_tests/sources/declarative/test_types.py +0 -39
- unit_tests/sources/declarative/test_yaml_declarative_source.py +0 -148
- unit_tests/sources/file_based/__init__.py +0 -0
- unit_tests/sources/file_based/availability_strategy/__init__.py +0 -0
- unit_tests/sources/file_based/availability_strategy/test_default_file_based_availability_strategy.py +0 -100
- unit_tests/sources/file_based/config/__init__.py +0 -0
- unit_tests/sources/file_based/config/test_abstract_file_based_spec.py +0 -28
- unit_tests/sources/file_based/config/test_csv_format.py +0 -34
- unit_tests/sources/file_based/config/test_file_based_stream_config.py +0 -84
- unit_tests/sources/file_based/discovery_policy/__init__.py +0 -0
- unit_tests/sources/file_based/discovery_policy/test_default_discovery_policy.py +0 -31
- unit_tests/sources/file_based/file_types/__init__.py +0 -0
- unit_tests/sources/file_based/file_types/test_avro_parser.py +0 -243
- unit_tests/sources/file_based/file_types/test_csv_parser.py +0 -546
- unit_tests/sources/file_based/file_types/test_jsonl_parser.py +0 -158
- unit_tests/sources/file_based/file_types/test_parquet_parser.py +0 -274
- unit_tests/sources/file_based/file_types/test_unstructured_parser.py +0 -593
- unit_tests/sources/file_based/helpers.py +0 -70
- unit_tests/sources/file_based/in_memory_files_source.py +0 -211
- unit_tests/sources/file_based/scenarios/__init__.py +0 -0
- unit_tests/sources/file_based/scenarios/avro_scenarios.py +0 -744
- unit_tests/sources/file_based/scenarios/check_scenarios.py +0 -220
- unit_tests/sources/file_based/scenarios/concurrent_incremental_scenarios.py +0 -2844
- unit_tests/sources/file_based/scenarios/csv_scenarios.py +0 -3105
- unit_tests/sources/file_based/scenarios/file_based_source_builder.py +0 -91
- unit_tests/sources/file_based/scenarios/incremental_scenarios.py +0 -1926
- unit_tests/sources/file_based/scenarios/jsonl_scenarios.py +0 -930
- unit_tests/sources/file_based/scenarios/parquet_scenarios.py +0 -754
- unit_tests/sources/file_based/scenarios/scenario_builder.py +0 -234
- unit_tests/sources/file_based/scenarios/unstructured_scenarios.py +0 -608
- unit_tests/sources/file_based/scenarios/user_input_schema_scenarios.py +0 -746
- unit_tests/sources/file_based/scenarios/validation_policy_scenarios.py +0 -726
- unit_tests/sources/file_based/stream/__init__.py +0 -0
- unit_tests/sources/file_based/stream/concurrent/__init__.py +0 -0
- unit_tests/sources/file_based/stream/concurrent/test_adapters.py +0 -362
- unit_tests/sources/file_based/stream/concurrent/test_file_based_concurrent_cursor.py +0 -458
- unit_tests/sources/file_based/stream/test_default_file_based_cursor.py +0 -310
- unit_tests/sources/file_based/stream/test_default_file_based_stream.py +0 -244
- unit_tests/sources/file_based/test_file_based_scenarios.py +0 -320
- unit_tests/sources/file_based/test_file_based_stream_reader.py +0 -272
- unit_tests/sources/file_based/test_scenarios.py +0 -253
- unit_tests/sources/file_based/test_schema_helpers.py +0 -346
- unit_tests/sources/fixtures/__init__.py +0 -3
- unit_tests/sources/fixtures/source_test_fixture.py +0 -153
- unit_tests/sources/message/__init__.py +0 -0
- unit_tests/sources/message/test_repository.py +0 -153
- unit_tests/sources/streams/__init__.py +0 -0
- unit_tests/sources/streams/concurrent/__init__.py +0 -3
- unit_tests/sources/streams/concurrent/scenarios/__init__.py +0 -3
- unit_tests/sources/streams/concurrent/scenarios/incremental_scenarios.py +0 -250
- unit_tests/sources/streams/concurrent/scenarios/stream_facade_builder.py +0 -140
- unit_tests/sources/streams/concurrent/scenarios/stream_facade_scenarios.py +0 -452
- unit_tests/sources/streams/concurrent/scenarios/test_concurrent_scenarios.py +0 -76
- unit_tests/sources/streams/concurrent/scenarios/thread_based_concurrent_stream_scenarios.py +0 -418
- unit_tests/sources/streams/concurrent/scenarios/thread_based_concurrent_stream_source_builder.py +0 -142
- unit_tests/sources/streams/concurrent/scenarios/utils.py +0 -55
- unit_tests/sources/streams/concurrent/test_adapters.py +0 -380
- unit_tests/sources/streams/concurrent/test_concurrent_read_processor.py +0 -684
- unit_tests/sources/streams/concurrent/test_cursor.py +0 -139
- unit_tests/sources/streams/concurrent/test_datetime_state_converter.py +0 -369
- unit_tests/sources/streams/concurrent/test_default_stream.py +0 -197
- unit_tests/sources/streams/concurrent/test_partition_enqueuer.py +0 -90
- unit_tests/sources/streams/concurrent/test_partition_reader.py +0 -67
- unit_tests/sources/streams/concurrent/test_thread_pool_manager.py +0 -106
- unit_tests/sources/streams/http/__init__.py +0 -0
- unit_tests/sources/streams/http/auth/__init__.py +0 -0
- unit_tests/sources/streams/http/auth/test_auth.py +0 -173
- unit_tests/sources/streams/http/requests_native_auth/__init__.py +0 -0
- unit_tests/sources/streams/http/requests_native_auth/test_requests_native_auth.py +0 -423
- unit_tests/sources/streams/http/test_availability_strategy.py +0 -180
- unit_tests/sources/streams/http/test_http.py +0 -635
- unit_tests/sources/streams/test_availability_strategy.py +0 -70
- unit_tests/sources/streams/test_call_rate.py +0 -300
- unit_tests/sources/streams/test_stream_read.py +0 -405
- unit_tests/sources/streams/test_streams_core.py +0 -184
- unit_tests/sources/test_abstract_source.py +0 -1442
- unit_tests/sources/test_concurrent_source.py +0 -112
- unit_tests/sources/test_config.py +0 -92
- unit_tests/sources/test_connector_state_manager.py +0 -482
- unit_tests/sources/test_http_logger.py +0 -252
- unit_tests/sources/test_integration_source.py +0 -86
- unit_tests/sources/test_source.py +0 -684
- unit_tests/sources/test_source_read.py +0 -460
- unit_tests/test/__init__.py +0 -0
- unit_tests/test/mock_http/__init__.py +0 -0
- unit_tests/test/mock_http/test_matcher.py +0 -53
- unit_tests/test/mock_http/test_mocker.py +0 -214
- unit_tests/test/mock_http/test_request.py +0 -117
- unit_tests/test/mock_http/test_response_builder.py +0 -177
- unit_tests/test/test_entrypoint_wrapper.py +0 -240
- unit_tests/utils/__init__.py +0 -0
- unit_tests/utils/test_datetime_format_inferrer.py +0 -60
- unit_tests/utils/test_mapping_helpers.py +0 -54
- unit_tests/utils/test_message_utils.py +0 -91
- unit_tests/utils/test_rate_limiting.py +0 -26
- unit_tests/utils/test_schema_inferrer.py +0 -202
- unit_tests/utils/test_secret_utils.py +0 -135
- unit_tests/utils/test_stream_status_utils.py +0 -61
- unit_tests/utils/test_traced_exception.py +0 -107
- airbyte_cdk/sources/{deprecated → declarative/async_job}/__init__.py +0 -0
- {source_declarative_manifest → airbyte_cdk/sources/declarative/migrations}/__init__.py +0 -0
- {unit_tests/destinations → airbyte_cdk/sql}/__init__.py +0 -0
- {unit_tests/singer → airbyte_cdk/sql/_util}/__init__.py +0 -0
- {airbyte_cdk-0.72.1.dist-info → airbyte_cdk-6.13.1.dev4106.dist-info}/LICENSE.txt +0 -0
@@ -1,47 +0,0 @@
|
|
1
|
-
#
|
2
|
-
# Copyright (c) 2023 Airbyte, Inc., all rights reserved.
|
3
|
-
#
|
4
|
-
|
5
|
-
|
6
|
-
import base64
|
7
|
-
from itertools import cycle
|
8
|
-
from typing import Any, List, Mapping
|
9
|
-
|
10
|
-
from deprecated import deprecated
|
11
|
-
|
12
|
-
from .core import HttpAuthenticator
|
13
|
-
|
14
|
-
|
15
|
-
@deprecated(version="0.1.20", reason="Use airbyte_cdk.sources.streams.http.requests_native_auth.TokenAuthenticator instead")
class TokenAuthenticator(HttpAuthenticator):
    """Deprecated authenticator that sends a single fixed token in one request header."""

    def __init__(self, token: str, auth_method: str = "Bearer", auth_header: str = "Authorization"):
        # The token is kept on a private attribute; method and header name stay public.
        self._token = token
        self.auth_header = auth_header
        self.auth_method = auth_method

    def get_auth_header(self) -> Mapping[str, Any]:
        """Return a one-entry mapping of the header name to "<auth_method> <token>"."""
        header_value = f"{self.auth_method} {self._token}"
        return {self.auth_header: header_value}
|
24
|
-
|
25
|
-
|
26
|
-
@deprecated(version="0.1.20", reason="Use airbyte_cdk.sources.streams.http.requests_native_auth.MultipleTokenAuthenticator instead")
class MultipleTokenAuthenticator(HttpAuthenticator):
    """Deprecated authenticator that cycles through a list of tokens, using the next one on every call."""

    def __init__(self, tokens: List[str], auth_method: str = "Bearer", auth_header: str = "Authorization"):
        self._tokens = tokens
        # Endless iterator over the tokens; each header request advances it by one.
        self._tokens_iter = cycle(tokens)
        self.auth_header = auth_header
        self.auth_method = auth_method

    def get_auth_header(self) -> Mapping[str, Any]:
        """Return a one-entry mapping of the header name to "<auth_method> <next token>"."""
        current_token = next(self._tokens_iter)
        return {self.auth_header: f"{self.auth_method} {current_token}"}
|
36
|
-
|
37
|
-
|
38
|
-
class BasicHttpAuthenticator(TokenAuthenticator):
    """
    Authenticator for the basic authentication scheme defined by RFC 7617: the credentials are sent as a
    "username:password" pair encoded with base64.
    https://developer.mozilla.org/en-US/docs/Web/HTTP/Authentication#basic_authentication_scheme
    """

    def __init__(self, username: str, password: str, auth_method: str = "Basic", auth_header: str = "Authorization"):
        raw_credentials = f"{username}:{password}"
        # b64encode works on bytes, so encode first and decode the result back to text.
        token = base64.b64encode(raw_credentials.encode("utf8")).decode("utf8")
        super().__init__(token, auth_method, auth_header)
|
@@ -1,40 +0,0 @@
|
|
1
|
-
#
|
2
|
-
# Copyright (c) 2023 Airbyte, Inc., all rights reserved.
|
3
|
-
#
|
4
|
-
|
5
|
-
from typing import Any, Mapping, Optional
|
6
|
-
|
7
|
-
from airbyte_cdk.models import SyncMode
|
8
|
-
from airbyte_cdk.sources.streams.core import Stream, StreamData
|
9
|
-
|
10
|
-
|
11
|
-
def get_first_stream_slice(stream: Stream) -> Optional[Mapping[str, Any]]:
    """
    Gets the first stream_slice from a given stream's stream_slices.

    :param stream: stream whose stream_slices() is called with its own cursor_field in full-refresh mode
    :raises StopIteration: if there is no first slice to return (the stream_slices generator is empty)
    :return: first stream slice from 'stream_slices' generator (`None` is a valid stream slice)
    """
    # stream_slices() may return a plain iterable (such as a list or tuple) rather than an iterator,
    # so wrap it with iter() before asking for the first element.
    slices = iter(
        stream.stream_slices(
            cursor_field=stream.cursor_field,
            sync_mode=SyncMode.full_refresh,
        )
    )
    return next(slices)
|
27
|
-
|
28
|
-
|
29
|
-
def get_first_record_for_slice(stream: Stream, stream_slice: Optional[Mapping[str, Any]]) -> StreamData:
    """
    Reads a single stream_slice of a stream in full-refresh mode and returns its first record.

    :param stream: stream to read from
    :param stream_slice: slice passed through to read_records
    :raises StopIteration: if the slice yields no record at all (the read_records generator is empty)
    :return: StreamData containing the first record in the slice
    """
    records = stream.read_records(sync_mode=SyncMode.full_refresh, stream_slice=stream_slice)
    # read_records() may hand back a list or tuple instead of an iterator, hence the iter() call.
    return next(iter(records))
|
@@ -1,22 +0,0 @@
|
|
1
|
-
#
|
2
|
-
# Copyright (c) 2023 Airbyte, Inc., all rights reserved.
|
3
|
-
#
|
4
|
-
|
5
|
-
|
6
|
-
from airbyte_cdk.models import AirbyteCatalog, SyncMode
|
7
|
-
|
8
|
-
|
9
|
-
class CatalogHelper:
    """Helper functions for transforming an AirbyteCatalog."""

    @staticmethod
    def coerce_catalog_as_full_refresh(catalog: AirbyteCatalog) -> AirbyteCatalog:
        """
        Returns a copy of the catalog in which the sync mode of every stream is full refresh.

        The input catalog is left untouched: the changes are applied to a deep copy.

        :param catalog: catalog to convert
        :return: new catalog whose streams support only full refresh, with unset and null fields dropped
        """
        # A shallow copy would share the stream objects with the input, so editing them would
        # silently modify the caller's catalog as well.
        coerced_catalog = catalog.copy(deep=True)
        for stream in coerced_catalog.streams:
            stream.source_defined_cursor = False
            stream.supported_sync_modes = [SyncMode.full_refresh]
            stream.default_cursor_field = None

        # remove nulls
        return AirbyteCatalog.parse_raw(coerced_catalog.json(exclude_unset=True, exclude_none=True))
|
@@ -1,84 +0,0 @@
|
|
1
|
-
#
|
2
|
-
# Copyright (c) 2023 Airbyte, Inc., all rights reserved.
|
3
|
-
#
|
4
|
-
|
5
|
-
from typing import Any, Dict, Optional, Type
|
6
|
-
|
7
|
-
from airbyte_cdk.sources.utils.schema_helpers import expand_refs
|
8
|
-
from pydantic import BaseModel, Extra
|
9
|
-
from pydantic.main import ModelMetaclass
|
10
|
-
from pydantic.typing import resolve_annotations
|
11
|
-
|
12
|
-
|
13
|
-
class AllOptional(ModelMetaclass):
    """
    Pydantic metaclass that marks every field of a model as Optional.

    Declaring a model with this metaclass:
    '''
    class MyModel(BaseModel, metaclass=AllOptional):
        a: str
        b: str
    '''
    is equivalent to writing:
    '''
    class MyModel(BaseModel):
        a: Optional[str]
        b: Optional[str]
    '''
    which keeps model definitions short and avoids wrapping each field by hand.
    """

    def __new__(mcs, name, bases, namespaces, **kwargs):
        """
        Gather the annotations of the class and of its bases, then wrap each field in typing.Optional.
        """
        own_annotations = namespaces.get("__annotations__", {})
        merged = dict(resolve_annotations(own_annotations, namespaces.get("__module__", None)))
        for base in bases:
            # Annotations declared on a base replace same-named entries collected so far.
            merged.update(getattr(base, "__annotations__", {}))
        # Names starting with a double underscore are passed through unchanged.
        namespaces["__annotations__"] = {
            field: (annotation if field.startswith("__") else Optional[annotation])
            for field, annotation in merged.items()
        }
        return super().__new__(mcs, name, bases, namespaces, **kwargs)
|
43
|
-
|
44
|
-
|
45
|
-
class BaseSchemaModel(BaseModel):
    """
    Common base class for schema models that post-processes the generated JSON schema.
    It can be combined with the AllOptional metaclass.
    """

    class Config:
        extra = Extra.allow

        @classmethod
        def schema_extra(cls, schema: Dict[str, Any], model: Type[BaseModel]) -> None:
            """Edit the generated jsonschema in place: drop "title", "description" and "required".

            Pydantic doesn't treat Union[None, Any] correctly when generating jsonschema, so a field
            cannot be declared nullable (i.e. able to hold either null or a non-null value) that way.
            The nullable form is therefore written into the schema manually here.

            :param schema: generated jsonschema
            :param model: model class; its fields' allow_none flags decide which properties become nullable
            """
            for key in ("title", "description", "required"):
                schema.pop(key, None)
            for name, prop in schema.get("properties", {}).items():
                for key in ("title", "description"):
                    prop.pop(key, None)
                if not model.__fields__[name].allow_none:
                    continue
                if "type" in prop:
                    prop["type"] = ["null", prop["type"]]
                elif "$ref" in prop:
                    # A reference cannot carry a type list, so express nullability with oneOf.
                    prop["oneOf"] = [{"type": "null"}, {"$ref": prop.pop("$ref")}]

    @classmethod
    def schema(cls, *args, **kwargs) -> Dict[str, Any]:
        """Override of the schema classmethod that runs expand_refs on the result before returning it."""
        generated = super().schema(*args, **kwargs)
        expand_refs(generated)
        return generated
|
@@ -1,243 +0,0 @@
|
|
1
|
-
Metadata-Version: 2.1
|
2
|
-
Name: airbyte-cdk
|
3
|
-
Version: 0.72.1
|
4
|
-
Summary: A framework for writing Airbyte Connectors.
|
5
|
-
Home-page: https://github.com/airbytehq/airbyte
|
6
|
-
Author: Airbyte
|
7
|
-
Author-email: contact@airbyte.io
|
8
|
-
License: MIT
|
9
|
-
Project-URL: Documentation, https://docs.airbyte.io/
|
10
|
-
Project-URL: Source, https://github.com/airbytehq/airbyte
|
11
|
-
Project-URL: Tracker, https://github.com/airbytehq/airbyte/issues
|
12
|
-
Keywords: airbyte connector-development-kit cdk
|
13
|
-
Classifier: Development Status :: 3 - Alpha
|
14
|
-
Classifier: Intended Audience :: Developers
|
15
|
-
Classifier: Topic :: Scientific/Engineering
|
16
|
-
Classifier: Topic :: Software Development :: Libraries :: Python Modules
|
17
|
-
Classifier: License :: OSI Approved :: MIT License
|
18
|
-
Classifier: Programming Language :: Python :: 3.8
|
19
|
-
Requires-Python: >=3.8
|
20
|
-
Description-Content-Type: text/markdown
|
21
|
-
License-File: LICENSE.txt
|
22
|
-
Requires-Dist: airbyte-protocol-models ==0.5.1
|
23
|
-
Requires-Dist: backoff
|
24
|
-
Requires-Dist: dpath ~=2.0.1
|
25
|
-
Requires-Dist: isodate ~=0.6.1
|
26
|
-
Requires-Dist: jsonschema ~=3.2.0
|
27
|
-
Requires-Dist: jsonref ~=0.2
|
28
|
-
Requires-Dist: pendulum <3.0.0
|
29
|
-
Requires-Dist: genson ==1.2.2
|
30
|
-
Requires-Dist: pydantic <2.0.0,>=1.10.8
|
31
|
-
Requires-Dist: pyrate-limiter ~=3.1.0
|
32
|
-
Requires-Dist: python-dateutil
|
33
|
-
Requires-Dist: PyYAML >=6.0.1
|
34
|
-
Requires-Dist: requests
|
35
|
-
Requires-Dist: requests-cache
|
36
|
-
Requires-Dist: Deprecated ~=1.2
|
37
|
-
Requires-Dist: Jinja2 ~=3.1.2
|
38
|
-
Requires-Dist: cachetools
|
39
|
-
Requires-Dist: wcmatch ==8.4
|
40
|
-
Provides-Extra: dev
|
41
|
-
Requires-Dist: avro ~=1.11.2 ; extra == 'dev'
|
42
|
-
Requires-Dist: fastavro ~=1.8.0 ; extra == 'dev'
|
43
|
-
Requires-Dist: freezegun ; extra == 'dev'
|
44
|
-
Requires-Dist: mypy ; extra == 'dev'
|
45
|
-
Requires-Dist: pytest ; extra == 'dev'
|
46
|
-
Requires-Dist: pytest-cov ; extra == 'dev'
|
47
|
-
Requires-Dist: pytest-mock ; extra == 'dev'
|
48
|
-
Requires-Dist: requests-mock ; extra == 'dev'
|
49
|
-
Requires-Dist: pytest-httpserver ; extra == 'dev'
|
50
|
-
Requires-Dist: pandas ==2.0.3 ; extra == 'dev'
|
51
|
-
Requires-Dist: pyarrow ~=15.0.0 ; extra == 'dev'
|
52
|
-
Requires-Dist: langchain ==0.0.271 ; extra == 'dev'
|
53
|
-
Requires-Dist: openai[embeddings] ==0.27.9 ; extra == 'dev'
|
54
|
-
Requires-Dist: cohere ==4.21 ; extra == 'dev'
|
55
|
-
Requires-Dist: tiktoken ==0.4.0 ; extra == 'dev'
|
56
|
-
Requires-Dist: unstructured ==0.10.27 ; extra == 'dev'
|
57
|
-
Requires-Dist: unstructured[docx,pptx] ==0.10.27 ; extra == 'dev'
|
58
|
-
Requires-Dist: pdf2image ==1.16.3 ; extra == 'dev'
|
59
|
-
Requires-Dist: pdfminer.six ==20221105 ; extra == 'dev'
|
60
|
-
Requires-Dist: unstructured.pytesseract >=0.3.12 ; extra == 'dev'
|
61
|
-
Requires-Dist: pytesseract ==0.3.10 ; extra == 'dev'
|
62
|
-
Requires-Dist: markdown ; extra == 'dev'
|
63
|
-
Provides-Extra: file-based
|
64
|
-
Requires-Dist: avro ~=1.11.2 ; extra == 'file-based'
|
65
|
-
Requires-Dist: fastavro ~=1.8.0 ; extra == 'file-based'
|
66
|
-
Requires-Dist: pyarrow ~=15.0.0 ; extra == 'file-based'
|
67
|
-
Requires-Dist: unstructured ==0.10.27 ; extra == 'file-based'
|
68
|
-
Requires-Dist: unstructured[docx,pptx] ==0.10.27 ; extra == 'file-based'
|
69
|
-
Requires-Dist: pdf2image ==1.16.3 ; extra == 'file-based'
|
70
|
-
Requires-Dist: pdfminer.six ==20221105 ; extra == 'file-based'
|
71
|
-
Requires-Dist: unstructured.pytesseract >=0.3.12 ; extra == 'file-based'
|
72
|
-
Requires-Dist: pytesseract ==0.3.10 ; extra == 'file-based'
|
73
|
-
Requires-Dist: markdown ; extra == 'file-based'
|
74
|
-
Provides-Extra: sphinx-docs
|
75
|
-
Requires-Dist: Sphinx ~=4.2 ; extra == 'sphinx-docs'
|
76
|
-
Requires-Dist: sphinx-rtd-theme ~=1.0 ; extra == 'sphinx-docs'
|
77
|
-
Provides-Extra: vector-db-based
|
78
|
-
Requires-Dist: langchain ==0.0.271 ; extra == 'vector-db-based'
|
79
|
-
Requires-Dist: openai[embeddings] ==0.27.9 ; extra == 'vector-db-based'
|
80
|
-
Requires-Dist: cohere ==4.21 ; extra == 'vector-db-based'
|
81
|
-
Requires-Dist: tiktoken ==0.4.0 ; extra == 'vector-db-based'
|
82
|
-
|
83
|
-
# Connector Development Kit \(Python\)
|
84
|
-
|
85
|
-
The Airbyte Python CDK is a framework for rapidly developing production-grade Airbyte connectors. The CDK currently offers helpers specific for creating Airbyte source connectors for:
|
86
|
-
|
87
|
-
- HTTP APIs \(REST APIs, GraphQL, etc..\)
|
88
|
-
- Generic Python sources \(anything not covered by the above\)
|
89
|
-
|
90
|
-
The CDK provides an improved developer experience by providing basic implementation structure and abstracting away low-level glue boilerplate.
|
91
|
-
|
92
|
-
This document is a general introduction to the CDK. Readers should have basic familiarity with the [Airbyte Specification](https://docs.airbyte.com/understanding-airbyte/airbyte-protocol/) before proceeding.
|
93
|
-
|
94
|
-
## Getting Started
|
95
|
-
|
96
|
-
Generate an empty connector using the code generator. First clone the Airbyte repository then from the repository root run
|
97
|
-
|
98
|
-
```bash
|
99
|
-
cd airbyte-integrations/connector-templates/generator
|
100
|
-
./generate.sh
|
101
|
-
```
|
102
|
-
|
103
|
-
then follow the interactive prompt. Next, find all `TODO`s in the generated project directory -- they're accompanied by lots of comments explaining what you'll need to do in order to implement your connector. Upon completing all TODOs properly, you should have a functioning connector.
|
104
|
-
|
105
|
-
Additionally, you can follow [this tutorial](https://docs.airbyte.com/connector-development/cdk-python/) for a complete walkthrough of creating an HTTP connector using the Airbyte CDK.
|
106
|
-
|
107
|
-
### Concepts & Documentation
|
108
|
-
|
109
|
-
See the [concepts docs](docs/concepts/) for a tour through what the API offers.
|
110
|
-
|
111
|
-
### Example Connectors
|
112
|
-
|
113
|
-
**HTTP Connectors**:
|
114
|
-
|
115
|
-
- [Stripe](https://github.com/airbytehq/airbyte/blob/master/airbyte-integrations/connectors/source-stripe/source_stripe/source.py)
|
116
|
-
- [Slack](https://github.com/airbytehq/airbyte/blob/master/airbyte-integrations/connectors/source-slack/source_slack/source.py)
|
117
|
-
|
118
|
-
**Simple Python connectors using the barebones `Source` abstraction**:
|
119
|
-
|
120
|
-
- [Google Sheets](https://github.com/airbytehq/airbyte/blob/master/airbyte-integrations/connectors/source-google-sheets/google_sheets_source/google_sheets_source.py)
|
121
|
-
- [Mailchimp](https://github.com/airbytehq/airbyte/blob/master/airbyte-integrations/connectors/source-mailchimp/source_mailchimp/source.py)
|
122
|
-
|
123
|
-
## Contributing
|
124
|
-
|
125
|
-
### First time setup
|
126
|
-
|
127
|
-
We assume `python` points to Python 3.9 or higher.
|
128
|
-
|
129
|
-
Setup a virtual env:
|
130
|
-
|
131
|
-
```bash
|
132
|
-
python -m venv .venv
|
133
|
-
source .venv/bin/activate
|
134
|
-
pip install -e ".[dev]" # [dev] installs development-only dependencies
|
135
|
-
```
|
136
|
-
|
137
|
-
#### Iteration
|
138
|
-
|
139
|
-
- Iterate on the code locally
|
140
|
-
- Run tests via `python -m pytest -s unit_tests`
|
141
|
-
- Perform static type checks using `mypy airbyte_cdk`. `MyPy` configuration is in `mypy.ini`.
|
142
|
-
- Run `mypy <files to check>` to only check specific files. This is useful as the CDK still contains code that is not compliant.
|
143
|
-
- The `type_check_and_test.sh` script bundles both type checking and testing in one convenient command. Feel free to use it!
|
144
|
-
|
145
|
-
##### Autogenerated files
|
146
|
-
|
147
|
-
If the iteration you are working on includes changes to the models, you might want to regenerate them. In order to do that, you can run:
|
148
|
-
|
149
|
-
```bash
|
150
|
-
cd airbyte-cdk/python
|
151
|
-
./gradlew build
|
152
|
-
```
|
153
|
-
|
154
|
-
This will generate the files based on the schemas, add the license information and format the code. If you want to only do the former and rely on
|
155
|
-
pre-commit to do the others, you can run the appropriate generation command i.e. `./gradlew generateComponentManifestClassFiles`.
|
156
|
-
|
157
|
-
#### Testing
|
158
|
-
|
159
|
-
All tests are located in the `unit_tests` directory. Run `python -m pytest --cov=airbyte_cdk unit_tests/` to run them. This also presents a test coverage report.
|
160
|
-
|
161
|
-
#### Building and testing a connector with your local CDK
|
162
|
-
|
163
|
-
When developing a new feature in the CDK, you may find it helpful to run a connector that uses that new feature. You can test this in one of two ways:
|
164
|
-
|
165
|
-
- Running a connector locally
|
166
|
-
- Building and running a source via Docker
|
167
|
-
|
168
|
-
##### Installing your local CDK into a local Python connector
|
169
|
-
|
170
|
-
In order to get a local Python connector running your local CDK, do the following.
|
171
|
-
|
172
|
-
First, make sure you have your connector's virtual environment active:
|
173
|
-
|
174
|
-
```bash
|
175
|
-
# from the `airbyte/airbyte-integrations/connectors/<connector-directory>` directory
|
176
|
-
source .venv/bin/activate
|
177
|
-
|
178
|
-
# if you haven't installed dependencies for your connector already
|
179
|
-
pip install -e .
|
180
|
-
```
|
181
|
-
|
182
|
-
Then, navigate to the CDK and install it in editable mode:
|
183
|
-
|
184
|
-
```bash
|
185
|
-
cd ../../../airbyte-cdk/python
|
186
|
-
pip install -e .
|
187
|
-
```
|
188
|
-
|
189
|
-
You should see that `pip` has uninstalled the version of `airbyte-cdk` defined by your connector's `setup.py` and installed your local CDK. Any changes you make will be immediately reflected in your editor, so long as your editor's interpreter is set to your connector's virtual environment.
|
190
|
-
|
191
|
-
##### Building a Python connector in Docker with your local CDK installed
|
192
|
-
|
193
|
-
_Pre-requisite: Install the [`airbyte-ci` CLI](https://github.com/airbytehq/airbyte/blob/master/airbyte-ci/connectors/pipelines/README.md)_
|
194
|
-
|
195
|
-
You can build your connector image with the local CDK using
|
196
|
-
|
197
|
-
```bash
|
198
|
-
# from the airbytehq/airbyte base directory
|
199
|
-
airbyte-ci connectors --use-local-cdk --name=<CONNECTOR> build
|
200
|
-
```
|
201
|
-
|
202
|
-
Note that the local CDK is injected at build time, so if you make changes, you will have to run the build command again to see them reflected.
|
203
|
-
|
204
|
-
##### Running Connector Acceptance Tests for a single connector in Docker with your local CDK installed
|
205
|
-
|
206
|
-
_Pre-requisite: Install the [`airbyte-ci` CLI](https://github.com/airbytehq/airbyte/blob/master/airbyte-ci/connectors/pipelines/README.md)_
|
207
|
-
|
208
|
-
To run acceptance tests for a single connector using the local CDK, from the connector directory, run
|
209
|
-
|
210
|
-
```bash
|
211
|
-
airbyte-ci connectors --use-local-cdk --name=<CONNECTOR> test
|
212
|
-
```
|
213
|
-
|
214
|
-
#### When you don't have access to the API
|
215
|
-
|
216
|
-
There may be times when you do not have access to the API (because you lack the credentials, network access, etc.). You will probably still want to do end-to-end testing at least once. In order to do so, you can emulate the server you would be reaching using a server stubbing tool.
|
217
|
-
|
218
|
-
For example, using [mockserver](https://www.mock-server.com/), you can set up an expectation file like this:
|
219
|
-
|
220
|
-
```json
|
221
|
-
{
|
222
|
-
"httpRequest": {
|
223
|
-
"method": "GET",
|
224
|
-
"path": "/data"
|
225
|
-
},
|
226
|
-
"httpResponse": {
|
227
|
-
"body": "{\"data\": [{\"record_key\": 1}, {\"record_key\": 2}]}"
|
228
|
-
}
|
229
|
-
}
|
230
|
-
```
|
231
|
-
|
232
|
-
Assuming this file has been created at `secrets/mock_server_config/expectations.json`, running the following command will make any request on path `/data` return the response defined in the expectation file:
|
233
|
-
|
234
|
-
```bash
|
235
|
-
docker run -d --rm -v $(pwd)/secrets/mock_server_config:/config -p 8113:8113 --env MOCKSERVER_LOG_LEVEL=TRACE --env MOCKSERVER_SERVER_PORT=8113 --env MOCKSERVER_WATCH_INITIALIZATION_JSON=true --env MOCKSERVER_PERSISTED_EXPECTATIONS_PATH=/config/expectations.json --env MOCKSERVER_INITIALIZATION_JSON_PATH=/config/expectations.json mockserver/mockserver:5.15.0
|
236
|
-
```
|
237
|
-
|
238
|
-
HTTP requests to `localhost:8113/data` should now return the body defined in the expectations file. To test this, the implementer either has to change the code which defines the base URL for Python source or update the `url_base` from low-code. With the Connector Builder running in docker, you will have to use domain `host.docker.internal` instead of `localhost` as the requests are executed within docker.
|
239
|
-
|
240
|
-
#### Publishing a new version to PyPi
|
241
|
-
|
242
|
-
1. Open a PR
|
243
|
-
2. Once it is approved and **merged**, an Airbyte member must run the `Publish CDK Manually` workflow from master using `release-type=major|minor|patch` and setting the changelog message.
|