airbyte-cdk 6.7.0rc3__py3-none-any.whl → 6.7.1.dev0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (124) hide show
  1. airbyte_cdk/cli/source_declarative_manifest/_run.py +2 -1
  2. airbyte_cdk/config_observation.py +2 -1
  3. airbyte_cdk/connector.py +1 -0
  4. airbyte_cdk/connector_builder/connector_builder_handler.py +1 -1
  5. airbyte_cdk/connector_builder/main.py +2 -1
  6. airbyte_cdk/destinations/destination.py +2 -1
  7. airbyte_cdk/destinations/vector_db_based/config.py +2 -1
  8. airbyte_cdk/destinations/vector_db_based/document_processor.py +4 -3
  9. airbyte_cdk/destinations/vector_db_based/embedder.py +5 -4
  10. airbyte_cdk/entrypoint.py +3 -2
  11. airbyte_cdk/logger.py +2 -1
  12. airbyte_cdk/models/__init__.py +2 -0
  13. airbyte_cdk/models/airbyte_protocol.py +2 -1
  14. airbyte_cdk/sources/concurrent_source/concurrent_read_processor.py +3 -3
  15. airbyte_cdk/sources/concurrent_source/concurrent_source.py +1 -1
  16. airbyte_cdk/sources/config.py +2 -1
  17. airbyte_cdk/sources/declarative/auth/jwt.py +1 -0
  18. airbyte_cdk/sources/declarative/auth/oauth.py +1 -0
  19. airbyte_cdk/sources/declarative/auth/selective_authenticator.py +1 -0
  20. airbyte_cdk/sources/declarative/auth/token.py +2 -1
  21. airbyte_cdk/sources/declarative/auth/token_provider.py +3 -2
  22. airbyte_cdk/sources/declarative/concurrent_declarative_source.py +78 -52
  23. airbyte_cdk/sources/declarative/declarative_component_schema.yaml +167 -0
  24. airbyte_cdk/sources/declarative/decoders/json_decoder.py +3 -2
  25. airbyte_cdk/sources/declarative/decoders/noop_decoder.py +1 -0
  26. airbyte_cdk/sources/declarative/decoders/pagination_decoder_decorator.py +1 -0
  27. airbyte_cdk/sources/declarative/decoders/xml_decoder.py +1 -0
  28. airbyte_cdk/sources/declarative/extractors/dpath_extractor.py +1 -0
  29. airbyte_cdk/sources/declarative/extractors/http_selector.py +1 -0
  30. airbyte_cdk/sources/declarative/extractors/record_filter.py +6 -48
  31. airbyte_cdk/sources/declarative/extractors/record_selector.py +32 -4
  32. airbyte_cdk/sources/declarative/extractors/response_to_file_extractor.py +2 -1
  33. airbyte_cdk/sources/declarative/incremental/datetime_based_cursor.py +2 -1
  34. airbyte_cdk/sources/declarative/incremental/global_substream_cursor.py +5 -2
  35. airbyte_cdk/sources/declarative/incremental/per_partition_cursor.py +5 -2
  36. airbyte_cdk/sources/declarative/incremental/per_partition_with_global.py +1 -3
  37. airbyte_cdk/sources/declarative/interpolation/jinja.py +5 -4
  38. airbyte_cdk/sources/declarative/manifest_declarative_source.py +4 -3
  39. airbyte_cdk/sources/declarative/migrations/legacy_to_per_partition_state_migration.py +1 -1
  40. airbyte_cdk/sources/declarative/models/declarative_component_schema.py +122 -0
  41. airbyte_cdk/sources/declarative/parsers/model_to_component_factory.py +30 -17
  42. airbyte_cdk/sources/declarative/partition_routers/substream_partition_router.py +1 -0
  43. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/constant_backoff_strategy.py +1 -0
  44. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/exponential_backoff_strategy.py +1 -0
  45. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/wait_time_from_header_backoff_strategy.py +1 -0
  46. airbyte_cdk/sources/declarative/requesters/error_handlers/backoff_strategies/wait_until_time_from_header_backoff_strategy.py +1 -0
  47. airbyte_cdk/sources/declarative/requesters/error_handlers/composite_error_handler.py +1 -0
  48. airbyte_cdk/sources/declarative/requesters/error_handlers/default_error_handler.py +1 -0
  49. airbyte_cdk/sources/declarative/requesters/error_handlers/default_http_response_filter.py +1 -0
  50. airbyte_cdk/sources/declarative/requesters/error_handlers/http_response_filter.py +1 -0
  51. airbyte_cdk/sources/declarative/requesters/http_job_repository.py +2 -1
  52. airbyte_cdk/sources/declarative/requesters/http_requester.py +1 -0
  53. airbyte_cdk/sources/declarative/requesters/paginators/default_paginator.py +1 -0
  54. airbyte_cdk/sources/declarative/requesters/paginators/no_pagination.py +1 -0
  55. airbyte_cdk/sources/declarative/requesters/paginators/paginator.py +1 -0
  56. airbyte_cdk/sources/declarative/requesters/paginators/strategies/cursor_pagination_strategy.py +1 -0
  57. airbyte_cdk/sources/declarative/requesters/paginators/strategies/offset_increment.py +1 -0
  58. airbyte_cdk/sources/declarative/requesters/paginators/strategies/page_increment.py +1 -0
  59. airbyte_cdk/sources/declarative/requesters/paginators/strategies/pagination_strategy.py +1 -0
  60. airbyte_cdk/sources/declarative/requesters/paginators/strategies/stop_condition.py +9 -3
  61. airbyte_cdk/sources/declarative/requesters/request_options/interpolated_request_options_provider.py +2 -1
  62. airbyte_cdk/sources/declarative/requesters/requester.py +1 -0
  63. airbyte_cdk/sources/declarative/retrievers/async_retriever.py +2 -1
  64. airbyte_cdk/sources/declarative/retrievers/simple_retriever.py +12 -4
  65. airbyte_cdk/sources/declarative/stream_slicers/declarative_partition_generator.py +7 -4
  66. airbyte_cdk/sources/declarative/transformations/add_fields.py +1 -0
  67. airbyte_cdk/sources/declarative/transformations/remove_fields.py +1 -0
  68. airbyte_cdk/sources/declarative/yaml_declarative_source.py +1 -0
  69. airbyte_cdk/sources/embedded/tools.py +1 -0
  70. airbyte_cdk/sources/file_based/config/abstract_file_based_spec.py +2 -1
  71. airbyte_cdk/sources/file_based/config/avro_format.py +2 -1
  72. airbyte_cdk/sources/file_based/config/csv_format.py +2 -1
  73. airbyte_cdk/sources/file_based/config/excel_format.py +2 -1
  74. airbyte_cdk/sources/file_based/config/file_based_stream_config.py +2 -1
  75. airbyte_cdk/sources/file_based/config/jsonl_format.py +2 -1
  76. airbyte_cdk/sources/file_based/config/parquet_format.py +2 -1
  77. airbyte_cdk/sources/file_based/config/unstructured_format.py +2 -1
  78. airbyte_cdk/sources/file_based/file_based_source.py +2 -1
  79. airbyte_cdk/sources/file_based/file_based_stream_reader.py +2 -1
  80. airbyte_cdk/sources/file_based/file_types/avro_parser.py +1 -0
  81. airbyte_cdk/sources/file_based/file_types/csv_parser.py +2 -1
  82. airbyte_cdk/sources/file_based/file_types/excel_parser.py +5 -5
  83. airbyte_cdk/sources/file_based/file_types/jsonl_parser.py +2 -1
  84. airbyte_cdk/sources/file_based/file_types/parquet_parser.py +2 -1
  85. airbyte_cdk/sources/file_based/file_types/unstructured_parser.py +9 -8
  86. airbyte_cdk/sources/file_based/stream/abstract_file_based_stream.py +2 -1
  87. airbyte_cdk/sources/file_based/stream/concurrent/adapters.py +5 -4
  88. airbyte_cdk/sources/file_based/stream/concurrent/cursor/abstract_concurrent_file_based_cursor.py +1 -1
  89. airbyte_cdk/sources/file_based/stream/concurrent/cursor/file_based_concurrent_cursor.py +1 -1
  90. airbyte_cdk/sources/file_based/stream/concurrent/cursor/file_based_final_state_cursor.py +1 -1
  91. airbyte_cdk/sources/http_logger.py +1 -0
  92. airbyte_cdk/sources/streams/call_rate.py +1 -2
  93. airbyte_cdk/sources/streams/concurrent/abstract_stream.py +2 -1
  94. airbyte_cdk/sources/streams/concurrent/adapters.py +8 -4
  95. airbyte_cdk/sources/streams/concurrent/availability_strategy.py +2 -1
  96. airbyte_cdk/sources/streams/concurrent/cursor.py +30 -6
  97. airbyte_cdk/sources/streams/concurrent/default_stream.py +1 -0
  98. airbyte_cdk/sources/streams/concurrent/partitions/partition.py +1 -1
  99. airbyte_cdk/sources/streams/concurrent/partitions/types.py +1 -1
  100. airbyte_cdk/sources/streams/concurrent/state_converters/datetime_stream_state_converter.py +1 -1
  101. airbyte_cdk/sources/streams/core.py +2 -1
  102. airbyte_cdk/sources/streams/http/error_handlers/default_error_mapping.py +2 -1
  103. airbyte_cdk/sources/streams/http/error_handlers/http_status_error_handler.py +1 -0
  104. airbyte_cdk/sources/streams/http/error_handlers/json_error_message_parser.py +1 -0
  105. airbyte_cdk/sources/streams/http/error_handlers/response_models.py +2 -1
  106. airbyte_cdk/sources/streams/http/http.py +3 -2
  107. airbyte_cdk/sources/streams/http/http_client.py +49 -2
  108. airbyte_cdk/sources/streams/http/requests_native_auth/abstract_oauth.py +2 -1
  109. airbyte_cdk/sources/streams/http/requests_native_auth/oauth.py +1 -0
  110. airbyte_cdk/sources/types.py +14 -1
  111. airbyte_cdk/sources/utils/schema_helpers.py +3 -2
  112. airbyte_cdk/sql/secrets.py +2 -1
  113. airbyte_cdk/sql/shared/sql_processor.py +8 -6
  114. airbyte_cdk/test/entrypoint_wrapper.py +4 -3
  115. airbyte_cdk/test/mock_http/mocker.py +1 -0
  116. airbyte_cdk/utils/schema_inferrer.py +2 -1
  117. airbyte_cdk/utils/slice_hasher.py +1 -1
  118. airbyte_cdk/utils/traced_exception.py +2 -1
  119. {airbyte_cdk-6.7.0rc3.dist-info → airbyte_cdk-6.7.1.dev0.dist-info}/METADATA +9 -2
  120. {airbyte_cdk-6.7.0rc3.dist-info → airbyte_cdk-6.7.1.dev0.dist-info}/RECORD +123 -124
  121. airbyte_cdk/sources/streams/concurrent/partitions/record.py +0 -35
  122. {airbyte_cdk-6.7.0rc3.dist-info → airbyte_cdk-6.7.1.dev0.dist-info}/LICENSE.txt +0 -0
  123. {airbyte_cdk-6.7.0rc3.dist-info → airbyte_cdk-6.7.1.dev0.dist-info}/WHEEL +0 -0
  124. {airbyte_cdk-6.7.0rc3.dist-info → airbyte_cdk-6.7.1.dev0.dist-info}/entry_points.txt +0 -0
@@ -1972,6 +1972,173 @@ definitions:
1972
1972
  - app_id:
1973
1973
  type: string
1974
1974
  path_in_connector_config: ["info", "app_id"]
1975
+ oauth_connector_input_specification:
1976
+ title: DeclarativeOAuth Connector Specification
1977
+ description: |-
1978
+ The DeclarativeOAuth specific blob.
1979
+ Pertains to the fields defined by the connector relating to the OAuth flow.
1980
+
1981
+ Interpolation capabilities:
1982
+ - Variable placeholders are declared as `{my_var}`.
1983
+ - Nested resolution variables like `{{my_nested_var}}` are allowed as well.
1984
+
1985
+ - The allowed interpolation context is:
1986
+ + base64Encoder - encode to `base64`, {base64Encoder:{my_var_a}:{my_var_b}}
1987
+ + base64Decoder - decode from `base64` encoded string, {base64Decoder:{my_string_variable_or_string_value}}
1988
+ + urlEncoder - encode the input string to URL-like format, {urlEncoder:https://test.host.com/endpoint}
1989
+ + urlDecoder - decode the input url-encoded string into text format, {urlDecoder:https%3A%2F%2Fairbyte.io}
1990
+ + codeChallengeS256 - get the `codeChallenge` encoded value to provide additional data-provider specific authorisation values, {codeChallengeS256:{state_value}}
1991
+
1992
+ Examples:
1993
+ - The TikTok Marketing DeclarativeOAuth spec:
1994
+ {
1995
+ "oauth_connector_input_specification": {
1996
+ "type": "object",
1997
+ "additionalProperties": false,
1998
+ "properties": {
1999
+ "consent_url": "https://ads.tiktok.com/marketing_api/auth?{client_id_key}={{client_id_key}}&{redirect_uri_key}={urlEncoder:{{redirect_uri_key}}}&{state_key}={{state_key}}",
2000
+ "access_token_url": "https://business-api.tiktok.com/open_api/v1.3/oauth2/access_token/",
2001
+ "access_token_params": {
2002
+ "{auth_code_key}": "{{auth_code_key}}",
2003
+ "{client_id_key}": "{{client_id_key}}",
2004
+ "{client_secret_key}": "{{client_secret_key}}"
2005
+ },
2006
+ "access_token_headers": {
2007
+ "Content-Type": "application/json",
2008
+ "Accept": "application/json"
2009
+ },
2010
+ "extract_output": ["data.access_token"],
2011
+ "client_id_key": "app_id",
2012
+ "client_secret_key": "secret",
2013
+ "auth_code_key": "auth_code"
2014
+ }
2015
+ }
2016
+ }
2017
+ type: object
2018
+ additionalProperties: true
2019
+ required:
2020
+ - consent_url
2021
+ - access_token_url
2022
+ - extract_output
2023
+ properties:
2024
+ consent_url:
2025
+ title: DeclarativeOAuth Consent URL
2026
+ type: string
2027
+ description: |-
2028
+ The DeclarativeOAuth Specific URL string template to initiate the authentication.
2029
+ The placeholders are replaced during the processing to provide necessary values.
2030
+ examples:
2031
+ - consent_url: https://domain.host.com/marketing_api/auth?{client_id_key}={{client_id_key}}&{redirect_uri_key}={urlEncoder:{{redirect_uri_key}}}&{state_key}={{state_key}}
2032
+ - consent_url: https://endpoint.host.com/oauth2/authorize?{client_id_key}={{client_id_key}}&{redirect_uri_key}={urlEncoder:{{redirect_uri_key}}}&{scope_key}={urlEncoder:{{scope_key}}}&{state_key}={{state_key}}&subdomain={subdomain}
2033
+ scope:
2034
+ title: (Optional) DeclarativeOAuth Scope
2035
+ type: string
2036
+ description: |-
2037
+ The DeclarativeOAuth Specific string of the scopes that need to be granted for the authenticated user.
2038
+ examples:
2039
+ - scope: user:read user:read_orders workspaces:read
2040
+ access_token_url:
2041
+ title: DeclarativeOAuth Access Token URL
2042
+ type: string
2043
+ description: |-
2044
+ The DeclarativeOAuth Specific URL templated string to obtain the `access_token`, `refresh_token` etc.
2045
+ The placeholders are replaced during the processing to provide necessary values.
2046
+ examples:
2047
+ - access_token_url: https://auth.host.com/oauth2/token?{client_id_key}={{client_id_key}}&{client_secret_key}={{client_secret_key}}&{auth_code_key}={{auth_code_key}}&{redirect_uri_key}={urlEncoder:{{redirect_uri_key}}}
2048
+ access_token_headers:
2049
+ title: (Optional) DeclarativeOAuth Access Token Headers
2050
+ type: object
2051
+ additionalProperties: true
2052
+ description: |-
2053
+ The DeclarativeOAuth Specific optional headers to inject while exchanging the `auth_code` to `access_token` during `completeOAuthFlow` step.
2054
+ examples:
2055
+ - access_token_headers: {
2056
+ "Authorization": "Basic {base64Encoder:{client_id}:{client_secret}}"
2057
+ }
2058
+ access_token_params:
2059
+ title: (Optional) DeclarativeOAuth Access Token Query Params (Json Encoded)
2060
+ type: object
2061
+ additionalProperties: true
2062
+ description: |-
2063
+ The DeclarativeOAuth Specific optional query parameters to inject while exchanging the `auth_code` to `access_token` during `completeOAuthFlow` step.
2064
+ When this property is provided, the query params will be encoded as `Json` and included in the outgoing API request.
2065
+ examples:
2066
+ - access_token_params: {
2067
+ "{auth_code_key}": "{{auth_code_key}}",
2068
+ "{client_id_key}": "{{client_id_key}}",
2069
+ "{client_secret_key}": "{{client_secret_key}}"
2070
+ }
2071
+ extract_output:
2072
+ title: DeclarativeOAuth Extract Output
2073
+ type: array
2074
+ items:
2075
+ type: string
2076
+ description: |-
2077
+ The DeclarativeOAuth Specific list of strings to indicate which keys should be extracted and returned back to the input config.
2078
+ examples:
2079
+ - extract_output: ["access_token", "refresh_token", "other_field"]
2080
+ state:
2081
+ title: (Optional) DeclarativeOAuth Configurable State Query Param
2082
+ type: object
2083
+ additionalProperties: true
2084
+ required:
2085
+ - min
2086
+ - max
2087
+ description: |-
2088
+ The DeclarativeOAuth Specific object to provide the criteria of how the `state` query param should be constructed,
2089
+ including length and complexity.
2090
+ properties:
2091
+ min:
2092
+ type: integer
2093
+ max:
2094
+ type: integer
2095
+ examples:
2096
+ - state: {
2097
+ "min": 7,
2098
+ "max": 128,
2099
+ }
2100
+ client_id_key:
2101
+ title: (Optional) DeclarativeOAuth Client ID Key Override
2102
+ type: string
2103
+ description: |-
2104
+ The DeclarativeOAuth Specific optional override to provide the custom `client_id` key name, if required by data-provider.
2105
+ examples:
2106
+ - client_id_key: "my_custom_client_id_key_name"
2107
+ client_secret_key:
2108
+ title: (Optional) DeclarativeOAuth Client Secret Key Override
2109
+ type: string
2110
+ description: |-
2111
+ The DeclarativeOAuth Specific optional override to provide the custom `client_secret` key name, if required by data-provider.
2112
+ examples:
2113
+ - client_secret_key: "my_custom_client_secret_key_name"
2114
+ scope_key:
2115
+ title: (Optional) DeclarativeOAuth Scope Key Override
2116
+ type: string
2117
+ description: |-
2118
+ The DeclarativeOAuth Specific optional override to provide the custom `scope` key name, if required by data-provider.
2119
+ examples:
2120
+ - scope_key: "my_custom_scope_key_key_name"
2121
+ state_key:
2122
+ title: (Optional) DeclarativeOAuth State Key Override
2123
+ type: string
2124
+ description: |-
2125
+ The DeclarativeOAuth Specific optional override to provide the custom `state` key name, if required by data-provider.
2126
+ examples:
2127
+ - state_key: "my_custom_state_key_key_name"
2128
+ auth_code_key:
2129
+ title: (Optional) DeclarativeOAuth Auth Code Key Override
2130
+ type: string
2131
+ description: |-
2132
+ The DeclarativeOAuth Specific optional override to provide the custom `code` key name to something like `auth_code` or `custom_auth_code`, if required by data-provider.
2133
+ examples:
2134
+ - auth_code_key: "my_custom_auth_code_key_name"
2135
+ redirect_uri_key:
2136
+ title: (Optional) DeclarativeOAuth Redirect URI Key Override
2137
+ type: string
2138
+ description: |-
2139
+ The DeclarativeOAuth Specific optional override to provide the custom `redirect_uri` key name to something like `callback_uri`, if required by data-provider.
2140
+ examples:
2141
+ - redirect_uri_key: "my_custom_redirect_uri_key_name"
1975
2142
  complete_oauth_output_specification:
1976
2143
  title: "OAuth output specification"
1977
2144
  description: |-
@@ -5,11 +5,12 @@ import codecs
5
5
  import logging
6
6
  from dataclasses import InitVar, dataclass
7
7
  from gzip import decompress
8
- from typing import Any, Generator, Mapping, MutableMapping, List, Optional
8
+ from typing import Any, Generator, List, Mapping, MutableMapping, Optional
9
9
 
10
+ import orjson
10
11
  import requests
12
+
11
13
  from airbyte_cdk.sources.declarative.decoders.decoder import Decoder
12
- import orjson
13
14
 
14
15
  logger = logging.getLogger("airbyte")
15
16
 
@@ -4,6 +4,7 @@ import logging
4
4
  from typing import Any, Generator, Mapping
5
5
 
6
6
  import requests
7
+
7
8
  from airbyte_cdk.sources.declarative.decoders.decoder import Decoder
8
9
 
9
10
  logger = logging.getLogger("airbyte")
@@ -7,6 +7,7 @@ from dataclasses import dataclass
7
7
  from typing import Any, Generator, MutableMapping
8
8
 
9
9
  import requests
10
+
10
11
  from airbyte_cdk.sources.declarative.decoders import Decoder
11
12
 
12
13
  logger = logging.getLogger("airbyte")
@@ -9,6 +9,7 @@ from xml.parsers.expat import ExpatError
9
9
 
10
10
  import requests
11
11
  import xmltodict
12
+
12
13
  from airbyte_cdk.sources.declarative.decoders.decoder import Decoder
13
14
 
14
15
  logger = logging.getLogger("airbyte")
@@ -7,6 +7,7 @@ from typing import Any, Iterable, List, Mapping, MutableMapping, Union
7
7
 
8
8
  import dpath
9
9
  import requests
10
+
10
11
  from airbyte_cdk.sources.declarative.decoders import Decoder, JsonDecoder
11
12
  from airbyte_cdk.sources.declarative.extractors.record_extractor import RecordExtractor
12
13
  from airbyte_cdk.sources.declarative.interpolation.interpolated_string import InterpolatedString
@@ -6,6 +6,7 @@ from abc import abstractmethod
6
6
  from typing import Any, Iterable, Mapping, Optional
7
7
 
8
8
  import requests
9
+
9
10
  from airbyte_cdk.sources.types import Record, StreamSlice, StreamState
10
11
 
11
12
 
@@ -1,7 +1,6 @@
1
1
  #
2
2
  # Copyright (c) 2023 Airbyte, Inc., all rights reserved.
3
3
  #
4
- import datetime
5
4
  from dataclasses import InitVar, dataclass
6
5
  from typing import Any, Iterable, Mapping, Optional, Union
7
6
 
@@ -11,7 +10,7 @@ from airbyte_cdk.sources.declarative.incremental import (
11
10
  PerPartitionWithGlobalCursor,
12
11
  )
13
12
  from airbyte_cdk.sources.declarative.interpolation.interpolated_boolean import InterpolatedBoolean
14
- from airbyte_cdk.sources.types import Config, StreamSlice, StreamState
13
+ from airbyte_cdk.sources.types import Config, Record, StreamSlice, StreamState
15
14
 
16
15
 
17
16
  @dataclass
@@ -68,20 +67,6 @@ class ClientSideIncrementalRecordFilterDecorator(RecordFilter):
68
67
  self._date_time_based_cursor = date_time_based_cursor
69
68
  self._substream_cursor = substream_cursor
70
69
 
71
- @property
72
- def _cursor_field(self) -> str:
73
- return self._date_time_based_cursor.cursor_field.eval(self._date_time_based_cursor.config) # type: ignore # eval returns a string in this context
74
-
75
- @property
76
- def _start_date_from_config(self) -> datetime.datetime:
77
- return self._date_time_based_cursor._start_datetime.get_datetime(
78
- self._date_time_based_cursor.config
79
- )
80
-
81
- @property
82
- def _end_datetime(self) -> datetime.datetime:
83
- return self._date_time_based_cursor.select_best_end_datetime()
84
-
85
70
  def filter_records(
86
71
  self,
87
72
  records: Iterable[Mapping[str, Any]],
@@ -89,16 +74,14 @@ class ClientSideIncrementalRecordFilterDecorator(RecordFilter):
89
74
  stream_slice: Optional[StreamSlice] = None,
90
75
  next_page_token: Optional[Mapping[str, Any]] = None,
91
76
  ) -> Iterable[Mapping[str, Any]]:
92
- state_value = self._get_state_value(
93
- stream_state, stream_slice or StreamSlice(partition={}, cursor_slice={})
94
- )
95
- filter_date: datetime.datetime = self._get_filter_date(state_value)
96
77
  records = (
97
78
  record
98
79
  for record in records
99
- if self._end_datetime
100
- >= self._date_time_based_cursor.parse_date(record[self._cursor_field])
101
- >= filter_date
80
+ if (self._substream_cursor or self._date_time_based_cursor).should_be_synced(
81
+ # Record is created on the fly to align with cursors interface; stream name is ignored as we don't need it here
82
+ # Record stream name is empty because it is not used during the filtering
83
+ Record(data=record, associated_slice=stream_slice, stream_name="")
84
+ )
102
85
  )
103
86
  if self.condition:
104
87
  records = super().filter_records(
@@ -108,28 +91,3 @@ class ClientSideIncrementalRecordFilterDecorator(RecordFilter):
108
91
  next_page_token=next_page_token,
109
92
  )
110
93
  yield from records
111
-
112
- def _get_state_value(
113
- self, stream_state: StreamState, stream_slice: StreamSlice
114
- ) -> Optional[str]:
115
- """
116
- Return cursor_value or None in case it was not found.
117
- Cursor_value may be empty if:
118
- 1. It is an initial sync => no stream_state exist at all.
119
- 2. In Parent-child stream, and we already make initial sync, so stream_state is present.
120
- During the second read, we receive one extra record from parent and therefore no stream_state for this record will be found.
121
-
122
- :param StreamState stream_state: State
123
- :param StreamSlice stream_slice: Current Stream slice
124
- :return Optional[str]: cursor_value in case it was found, otherwise None.
125
- """
126
- state = (self._substream_cursor or self._date_time_based_cursor).select_state(stream_slice)
127
-
128
- return state.get(self._cursor_field) if state else None
129
-
130
- def _get_filter_date(self, state_value: Optional[str]) -> datetime.datetime:
131
- start_date_parsed = self._start_date_from_config
132
- if state_value:
133
- return max(start_date_parsed, self._date_time_based_cursor.parse_date(state_value))
134
- else:
135
- return start_date_parsed
@@ -3,12 +3,14 @@
3
3
  #
4
4
 
5
5
  from dataclasses import InitVar, dataclass, field
6
- from typing import Any, Iterable, List, Mapping, Optional
6
+ from typing import Any, Iterable, List, Mapping, Optional, Union
7
7
 
8
8
  import requests
9
+
9
10
  from airbyte_cdk.sources.declarative.extractors.http_selector import HttpSelector
10
11
  from airbyte_cdk.sources.declarative.extractors.record_extractor import RecordExtractor
11
12
  from airbyte_cdk.sources.declarative.extractors.record_filter import RecordFilter
13
+ from airbyte_cdk.sources.declarative.interpolation import InterpolatedString
12
14
  from airbyte_cdk.sources.declarative.models import SchemaNormalization
13
15
  from airbyte_cdk.sources.declarative.transformations import RecordTransformation
14
16
  from airbyte_cdk.sources.types import Config, Record, StreamSlice, StreamState
@@ -37,11 +39,34 @@ class RecordSelector(HttpSelector):
37
39
  config: Config
38
40
  parameters: InitVar[Mapping[str, Any]]
39
41
  schema_normalization: TypeTransformer
42
+ name: str
43
+ _name: Union[InterpolatedString, str] = field(init=False, repr=False, default="")
40
44
  record_filter: Optional[RecordFilter] = None
41
45
  transformations: List[RecordTransformation] = field(default_factory=lambda: [])
42
46
 
43
47
  def __post_init__(self, parameters: Mapping[str, Any]) -> None:
44
48
  self._parameters = parameters
49
+ self._name = (
50
+ InterpolatedString(self._name, parameters=parameters)
51
+ if isinstance(self._name, str)
52
+ else self._name
53
+ )
54
+
55
+ @property # type: ignore
56
+ def name(self) -> str:
57
+ """
58
+ :return: Stream name
59
+ """
60
+ return (
61
+ str(self._name.eval(self.config))
62
+ if isinstance(self._name, InterpolatedString)
63
+ else self._name
64
+ )
65
+
66
+ @name.setter
67
+ def name(self, value: str) -> None:
68
+ if not isinstance(value, property):
69
+ self._name = value
45
70
 
46
71
  def select_records(
47
72
  self,
@@ -85,7 +110,7 @@ class RecordSelector(HttpSelector):
85
110
  transformed_data = self._transform(filtered_data, stream_state, stream_slice)
86
111
  normalized_data = self._normalize_by_schema(transformed_data, schema=records_schema)
87
112
  for data in normalized_data:
88
- yield Record(data, stream_slice)
113
+ yield Record(data=data, stream_name=self.name, associated_slice=stream_slice)
89
114
 
90
115
  def _normalize_by_schema(
91
116
  self, records: Iterable[Mapping[str, Any]], schema: Optional[Mapping[str, Any]]
@@ -125,6 +150,9 @@ class RecordSelector(HttpSelector):
125
150
  for record in records:
126
151
  for transformation in self.transformations:
127
152
  transformation.transform(
128
- record, config=self.config, stream_state=stream_state, stream_slice=stream_slice
129
- ) # type: ignore # record has type Mapping[str, Any], but Dict[str, Any] expected
153
+ record, # type: ignore # record has type Mapping[str, Any], but Dict[str, Any] expected
154
+ config=self.config,
155
+ stream_state=stream_state,
156
+ stream_slice=stream_slice,
157
+ )
130
158
  yield record
@@ -10,9 +10,10 @@ from typing import Any, Dict, Iterable, Mapping, Optional, Tuple
10
10
 
11
11
  import pandas as pd
12
12
  import requests
13
- from airbyte_cdk.sources.declarative.extractors.record_extractor import RecordExtractor
14
13
  from numpy import nan
15
14
 
15
+ from airbyte_cdk.sources.declarative.extractors.record_extractor import RecordExtractor
16
+
16
17
  EMPTY_STR: str = ""
17
18
  DEFAULT_ENCODING: str = "utf-8"
18
19
  DOWNLOAD_CHUNK_SIZE: int = 1024 * 10
@@ -7,6 +7,8 @@ from dataclasses import InitVar, dataclass, field
7
7
  from datetime import timedelta
8
8
  from typing import Any, Callable, Iterable, List, Mapping, MutableMapping, Optional, Union
9
9
 
10
+ from isodate import Duration, duration_isoformat, parse_duration
11
+
10
12
  from airbyte_cdk.models import AirbyteLogMessage, AirbyteMessage, Level, Type
11
13
  from airbyte_cdk.sources.declarative.datetime.datetime_parser import DatetimeParser
12
14
  from airbyte_cdk.sources.declarative.datetime.min_max_datetime import MinMaxDatetime
@@ -19,7 +21,6 @@ from airbyte_cdk.sources.declarative.requesters.request_option import (
19
21
  )
20
22
  from airbyte_cdk.sources.message import MessageRepository
21
23
  from airbyte_cdk.sources.types import Config, Record, StreamSlice, StreamState
22
- from isodate import Duration, duration_isoformat, parse_duration
23
24
 
24
25
 
25
26
  @dataclass
@@ -340,8 +340,11 @@ class GlobalSubstreamCursor(DeclarativeCursor):
340
340
  @staticmethod
341
341
  def _convert_record_to_cursor_record(record: Record) -> Record:
342
342
  return Record(
343
- record.data,
344
- StreamSlice(partition={}, cursor_slice=record.associated_slice.cursor_slice)
343
+ data=record.data,
344
+ stream_name=record.stream_name,
345
+ associated_slice=StreamSlice(
346
+ partition={}, cursor_slice=record.associated_slice.cursor_slice
347
+ )
345
348
  if record.associated_slice
346
349
  else None,
347
350
  )
@@ -325,8 +325,11 @@ class PerPartitionCursor(DeclarativeCursor):
325
325
  @staticmethod
326
326
  def _convert_record_to_cursor_record(record: Record) -> Record:
327
327
  return Record(
328
- record.data,
329
- StreamSlice(partition={}, cursor_slice=record.associated_slice.cursor_slice)
328
+ data=record.data,
329
+ stream_name=record.stream_name,
330
+ associated_slice=StreamSlice(
331
+ partition={}, cursor_slice=record.associated_slice.cursor_slice
332
+ )
330
333
  if record.associated_slice
331
334
  else None,
332
335
  )
@@ -194,9 +194,7 @@ class PerPartitionWithGlobalCursor(DeclarativeCursor):
194
194
  )
195
195
 
196
196
  def should_be_synced(self, record: Record) -> bool:
197
- return self._global_cursor.should_be_synced(
198
- record
199
- ) or self._per_partition_cursor.should_be_synced(record)
197
+ return self._get_active_cursor().should_be_synced(record)
200
198
 
201
199
  def is_greater_than_or_equal(self, first: Record, second: Record) -> bool:
202
200
  return self._global_cursor.is_greater_than_or_equal(first, second)
@@ -6,15 +6,16 @@ import ast
6
6
  from functools import cache
7
7
  from typing import Any, Mapping, Optional, Tuple, Type
8
8
 
9
- from airbyte_cdk.sources.declarative.interpolation.filters import filters
10
- from airbyte_cdk.sources.declarative.interpolation.interpolation import Interpolation
11
- from airbyte_cdk.sources.declarative.interpolation.macros import macros
12
- from airbyte_cdk.sources.types import Config
13
9
  from jinja2 import meta
14
10
  from jinja2.environment import Template
15
11
  from jinja2.exceptions import UndefinedError
16
12
  from jinja2.sandbox import SandboxedEnvironment
17
13
 
14
+ from airbyte_cdk.sources.declarative.interpolation.filters import filters
15
+ from airbyte_cdk.sources.declarative.interpolation.interpolation import Interpolation
16
+ from airbyte_cdk.sources.declarative.interpolation.macros import macros
17
+ from airbyte_cdk.sources.types import Config
18
+
18
19
 
19
20
  class StreamPartitionAccessEnvironment(SandboxedEnvironment):
20
21
  """
@@ -8,9 +8,12 @@ import pkgutil
8
8
  from copy import deepcopy
9
9
  from importlib import metadata
10
10
  from typing import Any, Dict, Iterator, List, Mapping, Optional
11
- from packaging.version import Version, InvalidVersion
12
11
 
13
12
  import yaml
13
+ from jsonschema.exceptions import ValidationError
14
+ from jsonschema.validators import validate
15
+ from packaging.version import InvalidVersion, Version
16
+
14
17
  from airbyte_cdk.models import (
15
18
  AirbyteConnectionStatus,
16
19
  AirbyteMessage,
@@ -44,8 +47,6 @@ from airbyte_cdk.sources.utils.slice_logger import (
44
47
  DebugSliceLogger,
45
48
  SliceLogger,
46
49
  )
47
- from jsonschema.exceptions import ValidationError
48
- from jsonschema.validators import validate
49
50
 
50
51
 
51
52
  class ManifestDeclarativeSource(DeclarativeSource):
@@ -5,9 +5,9 @@ from typing import Any, Mapping
5
5
  from airbyte_cdk.sources.declarative.interpolation.interpolated_string import InterpolatedString
6
6
  from airbyte_cdk.sources.declarative.migrations.state_migration import StateMigration
7
7
  from airbyte_cdk.sources.declarative.models import (
8
+ CustomIncrementalSync,
8
9
  DatetimeBasedCursor,
9
10
  SubstreamPartitionRouter,
10
- CustomIncrementalSync,
11
11
  )
12
12
  from airbyte_cdk.sources.declarative.models.declarative_component_schema import ParentStreamConfig
13
13