dtlpy 1.115.44__py3-none-any.whl → 1.117.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (238)
  1. dtlpy/__init__.py +491 -491
  2. dtlpy/__version__.py +1 -1
  3. dtlpy/assets/__init__.py +26 -26
  4. dtlpy/assets/code_server/config.yaml +2 -2
  5. dtlpy/assets/code_server/installation.sh +24 -24
  6. dtlpy/assets/code_server/launch.json +13 -13
  7. dtlpy/assets/code_server/settings.json +2 -2
  8. dtlpy/assets/main.py +53 -53
  9. dtlpy/assets/main_partial.py +18 -18
  10. dtlpy/assets/mock.json +11 -11
  11. dtlpy/assets/model_adapter.py +83 -83
  12. dtlpy/assets/package.json +61 -61
  13. dtlpy/assets/package_catalog.json +29 -29
  14. dtlpy/assets/package_gitignore +307 -307
  15. dtlpy/assets/service_runners/__init__.py +33 -33
  16. dtlpy/assets/service_runners/converter.py +96 -96
  17. dtlpy/assets/service_runners/multi_method.py +49 -49
  18. dtlpy/assets/service_runners/multi_method_annotation.py +54 -54
  19. dtlpy/assets/service_runners/multi_method_dataset.py +55 -55
  20. dtlpy/assets/service_runners/multi_method_item.py +52 -52
  21. dtlpy/assets/service_runners/multi_method_json.py +52 -52
  22. dtlpy/assets/service_runners/single_method.py +37 -37
  23. dtlpy/assets/service_runners/single_method_annotation.py +43 -43
  24. dtlpy/assets/service_runners/single_method_dataset.py +43 -43
  25. dtlpy/assets/service_runners/single_method_item.py +41 -41
  26. dtlpy/assets/service_runners/single_method_json.py +42 -42
  27. dtlpy/assets/service_runners/single_method_multi_input.py +45 -45
  28. dtlpy/assets/voc_annotation_template.xml +23 -23
  29. dtlpy/caches/base_cache.py +32 -32
  30. dtlpy/caches/cache.py +473 -473
  31. dtlpy/caches/dl_cache.py +201 -201
  32. dtlpy/caches/filesystem_cache.py +89 -89
  33. dtlpy/caches/redis_cache.py +84 -84
  34. dtlpy/dlp/__init__.py +20 -20
  35. dtlpy/dlp/cli_utilities.py +367 -367
  36. dtlpy/dlp/command_executor.py +764 -764
  37. dtlpy/dlp/dlp +1 -1
  38. dtlpy/dlp/dlp.bat +1 -1
  39. dtlpy/dlp/dlp.py +128 -128
  40. dtlpy/dlp/parser.py +651 -651
  41. dtlpy/entities/__init__.py +83 -83
  42. dtlpy/entities/analytic.py +347 -347
  43. dtlpy/entities/annotation.py +1879 -1879
  44. dtlpy/entities/annotation_collection.py +699 -699
  45. dtlpy/entities/annotation_definitions/__init__.py +20 -20
  46. dtlpy/entities/annotation_definitions/base_annotation_definition.py +100 -100
  47. dtlpy/entities/annotation_definitions/box.py +195 -195
  48. dtlpy/entities/annotation_definitions/classification.py +67 -67
  49. dtlpy/entities/annotation_definitions/comparison.py +72 -72
  50. dtlpy/entities/annotation_definitions/cube.py +204 -204
  51. dtlpy/entities/annotation_definitions/cube_3d.py +149 -149
  52. dtlpy/entities/annotation_definitions/description.py +32 -32
  53. dtlpy/entities/annotation_definitions/ellipse.py +124 -124
  54. dtlpy/entities/annotation_definitions/free_text.py +62 -62
  55. dtlpy/entities/annotation_definitions/gis.py +69 -69
  56. dtlpy/entities/annotation_definitions/note.py +139 -139
  57. dtlpy/entities/annotation_definitions/point.py +117 -117
  58. dtlpy/entities/annotation_definitions/polygon.py +182 -182
  59. dtlpy/entities/annotation_definitions/polyline.py +111 -111
  60. dtlpy/entities/annotation_definitions/pose.py +92 -92
  61. dtlpy/entities/annotation_definitions/ref_image.py +86 -86
  62. dtlpy/entities/annotation_definitions/segmentation.py +240 -240
  63. dtlpy/entities/annotation_definitions/subtitle.py +34 -34
  64. dtlpy/entities/annotation_definitions/text.py +85 -85
  65. dtlpy/entities/annotation_definitions/undefined_annotation.py +74 -74
  66. dtlpy/entities/app.py +220 -220
  67. dtlpy/entities/app_module.py +107 -107
  68. dtlpy/entities/artifact.py +174 -174
  69. dtlpy/entities/assignment.py +399 -399
  70. dtlpy/entities/base_entity.py +214 -214
  71. dtlpy/entities/bot.py +113 -113
  72. dtlpy/entities/codebase.py +292 -292
  73. dtlpy/entities/collection.py +38 -38
  74. dtlpy/entities/command.py +169 -169
  75. dtlpy/entities/compute.py +449 -449
  76. dtlpy/entities/dataset.py +1299 -1299
  77. dtlpy/entities/directory_tree.py +44 -44
  78. dtlpy/entities/dpk.py +470 -470
  79. dtlpy/entities/driver.py +235 -235
  80. dtlpy/entities/execution.py +397 -397
  81. dtlpy/entities/feature.py +124 -124
  82. dtlpy/entities/feature_set.py +152 -145
  83. dtlpy/entities/filters.py +798 -798
  84. dtlpy/entities/gis_item.py +107 -107
  85. dtlpy/entities/integration.py +184 -184
  86. dtlpy/entities/item.py +975 -959
  87. dtlpy/entities/label.py +123 -123
  88. dtlpy/entities/links.py +85 -85
  89. dtlpy/entities/message.py +175 -175
  90. dtlpy/entities/model.py +684 -684
  91. dtlpy/entities/node.py +1005 -1005
  92. dtlpy/entities/ontology.py +810 -803
  93. dtlpy/entities/organization.py +287 -287
  94. dtlpy/entities/package.py +657 -657
  95. dtlpy/entities/package_defaults.py +5 -5
  96. dtlpy/entities/package_function.py +185 -185
  97. dtlpy/entities/package_module.py +113 -113
  98. dtlpy/entities/package_slot.py +118 -118
  99. dtlpy/entities/paged_entities.py +299 -299
  100. dtlpy/entities/pipeline.py +624 -624
  101. dtlpy/entities/pipeline_execution.py +279 -279
  102. dtlpy/entities/project.py +394 -394
  103. dtlpy/entities/prompt_item.py +505 -505
  104. dtlpy/entities/recipe.py +301 -301
  105. dtlpy/entities/reflect_dict.py +102 -102
  106. dtlpy/entities/resource_execution.py +138 -138
  107. dtlpy/entities/service.py +974 -963
  108. dtlpy/entities/service_driver.py +117 -117
  109. dtlpy/entities/setting.py +294 -294
  110. dtlpy/entities/task.py +495 -495
  111. dtlpy/entities/time_series.py +143 -143
  112. dtlpy/entities/trigger.py +426 -426
  113. dtlpy/entities/user.py +118 -118
  114. dtlpy/entities/webhook.py +124 -124
  115. dtlpy/examples/__init__.py +19 -19
  116. dtlpy/examples/add_labels.py +135 -135
  117. dtlpy/examples/add_metadata_to_item.py +21 -21
  118. dtlpy/examples/annotate_items_using_model.py +65 -65
  119. dtlpy/examples/annotate_video_using_model_and_tracker.py +75 -75
  120. dtlpy/examples/annotations_convert_to_voc.py +9 -9
  121. dtlpy/examples/annotations_convert_to_yolo.py +9 -9
  122. dtlpy/examples/convert_annotation_types.py +51 -51
  123. dtlpy/examples/converter.py +143 -143
  124. dtlpy/examples/copy_annotations.py +22 -22
  125. dtlpy/examples/copy_folder.py +31 -31
  126. dtlpy/examples/create_annotations.py +51 -51
  127. dtlpy/examples/create_video_annotations.py +83 -83
  128. dtlpy/examples/delete_annotations.py +26 -26
  129. dtlpy/examples/filters.py +113 -113
  130. dtlpy/examples/move_item.py +23 -23
  131. dtlpy/examples/play_video_annotation.py +13 -13
  132. dtlpy/examples/show_item_and_mask.py +53 -53
  133. dtlpy/examples/triggers.py +49 -49
  134. dtlpy/examples/upload_batch_of_items.py +20 -20
  135. dtlpy/examples/upload_items_and_custom_format_annotations.py +55 -55
  136. dtlpy/examples/upload_items_with_modalities.py +43 -43
  137. dtlpy/examples/upload_segmentation_annotations_from_mask_image.py +44 -44
  138. dtlpy/examples/upload_yolo_format_annotations.py +70 -70
  139. dtlpy/exceptions.py +125 -125
  140. dtlpy/miscellaneous/__init__.py +20 -20
  141. dtlpy/miscellaneous/dict_differ.py +95 -95
  142. dtlpy/miscellaneous/git_utils.py +217 -217
  143. dtlpy/miscellaneous/json_utils.py +14 -14
  144. dtlpy/miscellaneous/list_print.py +105 -105
  145. dtlpy/miscellaneous/zipping.py +130 -130
  146. dtlpy/ml/__init__.py +20 -20
  147. dtlpy/ml/base_feature_extractor_adapter.py +27 -27
  148. dtlpy/ml/base_model_adapter.py +1287 -1230
  149. dtlpy/ml/metrics.py +461 -461
  150. dtlpy/ml/predictions_utils.py +274 -274
  151. dtlpy/ml/summary_writer.py +57 -57
  152. dtlpy/ml/train_utils.py +60 -60
  153. dtlpy/new_instance.py +252 -252
  154. dtlpy/repositories/__init__.py +56 -56
  155. dtlpy/repositories/analytics.py +85 -85
  156. dtlpy/repositories/annotations.py +916 -916
  157. dtlpy/repositories/apps.py +383 -383
  158. dtlpy/repositories/artifacts.py +452 -452
  159. dtlpy/repositories/assignments.py +599 -599
  160. dtlpy/repositories/bots.py +213 -213
  161. dtlpy/repositories/codebases.py +559 -559
  162. dtlpy/repositories/collections.py +332 -332
  163. dtlpy/repositories/commands.py +152 -152
  164. dtlpy/repositories/compositions.py +61 -61
  165. dtlpy/repositories/computes.py +439 -439
  166. dtlpy/repositories/datasets.py +1585 -1504
  167. dtlpy/repositories/downloader.py +1157 -923
  168. dtlpy/repositories/dpks.py +433 -433
  169. dtlpy/repositories/drivers.py +482 -482
  170. dtlpy/repositories/executions.py +815 -815
  171. dtlpy/repositories/feature_sets.py +256 -226
  172. dtlpy/repositories/features.py +255 -255
  173. dtlpy/repositories/integrations.py +484 -484
  174. dtlpy/repositories/items.py +912 -912
  175. dtlpy/repositories/messages.py +94 -94
  176. dtlpy/repositories/models.py +1000 -1000
  177. dtlpy/repositories/nodes.py +80 -80
  178. dtlpy/repositories/ontologies.py +511 -511
  179. dtlpy/repositories/organizations.py +525 -525
  180. dtlpy/repositories/packages.py +1941 -1941
  181. dtlpy/repositories/pipeline_executions.py +451 -451
  182. dtlpy/repositories/pipelines.py +640 -640
  183. dtlpy/repositories/projects.py +539 -539
  184. dtlpy/repositories/recipes.py +429 -399
  185. dtlpy/repositories/resource_executions.py +137 -137
  186. dtlpy/repositories/schema.py +120 -120
  187. dtlpy/repositories/service_drivers.py +213 -213
  188. dtlpy/repositories/services.py +1704 -1704
  189. dtlpy/repositories/settings.py +339 -339
  190. dtlpy/repositories/tasks.py +1477 -1477
  191. dtlpy/repositories/times_series.py +278 -278
  192. dtlpy/repositories/triggers.py +536 -536
  193. dtlpy/repositories/upload_element.py +257 -257
  194. dtlpy/repositories/uploader.py +661 -661
  195. dtlpy/repositories/webhooks.py +249 -249
  196. dtlpy/services/__init__.py +22 -22
  197. dtlpy/services/aihttp_retry.py +131 -131
  198. dtlpy/services/api_client.py +1786 -1785
  199. dtlpy/services/api_reference.py +40 -40
  200. dtlpy/services/async_utils.py +133 -133
  201. dtlpy/services/calls_counter.py +44 -44
  202. dtlpy/services/check_sdk.py +68 -68
  203. dtlpy/services/cookie.py +115 -115
  204. dtlpy/services/create_logger.py +156 -156
  205. dtlpy/services/events.py +84 -84
  206. dtlpy/services/logins.py +235 -235
  207. dtlpy/services/reporter.py +256 -256
  208. dtlpy/services/service_defaults.py +91 -91
  209. dtlpy/utilities/__init__.py +20 -20
  210. dtlpy/utilities/annotations/__init__.py +16 -16
  211. dtlpy/utilities/annotations/annotation_converters.py +269 -269
  212. dtlpy/utilities/base_package_runner.py +285 -264
  213. dtlpy/utilities/converter.py +1650 -1650
  214. dtlpy/utilities/dataset_generators/__init__.py +1 -1
  215. dtlpy/utilities/dataset_generators/dataset_generator.py +670 -670
  216. dtlpy/utilities/dataset_generators/dataset_generator_tensorflow.py +23 -23
  217. dtlpy/utilities/dataset_generators/dataset_generator_torch.py +21 -21
  218. dtlpy/utilities/local_development/__init__.py +1 -1
  219. dtlpy/utilities/local_development/local_session.py +179 -179
  220. dtlpy/utilities/reports/__init__.py +2 -2
  221. dtlpy/utilities/reports/figures.py +343 -343
  222. dtlpy/utilities/reports/report.py +71 -71
  223. dtlpy/utilities/videos/__init__.py +17 -17
  224. dtlpy/utilities/videos/video_player.py +598 -598
  225. dtlpy/utilities/videos/videos.py +470 -470
  226. {dtlpy-1.115.44.data → dtlpy-1.117.6.data}/scripts/dlp +1 -1
  227. dtlpy-1.117.6.data/scripts/dlp.bat +2 -0
  228. {dtlpy-1.115.44.data → dtlpy-1.117.6.data}/scripts/dlp.py +128 -128
  229. {dtlpy-1.115.44.dist-info → dtlpy-1.117.6.dist-info}/METADATA +186 -186
  230. dtlpy-1.117.6.dist-info/RECORD +239 -0
  231. {dtlpy-1.115.44.dist-info → dtlpy-1.117.6.dist-info}/WHEEL +1 -1
  232. {dtlpy-1.115.44.dist-info → dtlpy-1.117.6.dist-info}/licenses/LICENSE +200 -200
  233. tests/features/environment.py +551 -551
  234. dtlpy/assets/__pycache__/__init__.cpython-310.pyc +0 -0
  235. dtlpy-1.115.44.data/scripts/dlp.bat +0 -2
  236. dtlpy-1.115.44.dist-info/RECORD +0 -240
  237. {dtlpy-1.115.44.dist-info → dtlpy-1.117.6.dist-info}/entry_points.txt +0 -0
  238. {dtlpy-1.115.44.dist-info → dtlpy-1.117.6.dist-info}/top_level.txt +0 -0
@@ -1,300 +1,300 @@
1
- import logging
2
- import math
3
- import time
4
- import tqdm
5
- import copy
6
- import sys
7
- from typing import Optional, List, Any
8
-
9
- import attr
10
-
11
- from .filters import FiltersOperations, FiltersOrderByDirection, FiltersResource
12
- from .. import miscellaneous
13
- from ..services.api_client import ApiClient
14
-
15
- logger = logging.getLogger(name='dtlpy')
16
-
17
-
18
- @attr.s
19
- class PagedEntities:
20
- """
21
- Pages object for efficient API pagination.
22
- Defaults to offset-based pagination for compatibility with all operations.
23
- Switches to keyset/cursor-based pagination (using 'id' as the cursor) during iteration for performance.
24
- Falls back to offset-based pagination if keyset is not possible (e.g., custom sort).
25
- """
26
- # api
27
- _client_api: ApiClient = attr.ib(repr=False)
28
-
29
- # params
30
- page_offset: int = attr.ib()
31
- page_size: int = attr.ib()
32
- filters: Any = attr.ib()
33
- items_repository: Any = attr.ib(repr=False)
34
- has_next_page: bool = attr.ib(default=False)
35
- total_pages_count: int = attr.ib(default=0)
36
- items_count: int = attr.ib(default=0)
37
-
38
- # hybrid pagination
39
- use_id_based_paging: bool = attr.ib(default=False) # Default to False for offset-based pagination
40
- last_seen_id: Optional[Any] = attr.ib(default=None)
41
-
42
- # execution attribute
43
- _service_id = attr.ib(default=None, repr=False)
44
- _project_id = attr.ib(default=None, repr=False)
45
- _list_function = attr.ib(default=None, repr=False)
46
-
47
- # items list
48
- items: List[Any] = attr.ib(default=miscellaneous.List(), repr=False)
49
-
50
- @staticmethod
51
- def _has_explicit_sort(flt) -> bool:
52
- """
53
- Check if the filter has custom sort fields defined (not id/createdAt).
54
- """
55
- prepared = flt.prepare() if flt else {}
56
- sort_fields = list(prepared.get("sort", {}).keys())
57
- if isinstance(sort_fields, list) and len(sort_fields) > 0:
58
- return sort_fields[0] not in {"id", "createdAt"}
59
- return False
60
-
61
- def _should_use_keyset_pagination(self) -> bool:
62
- """
63
- Determine whether to use keyset pagination based on page offset and resource type.
64
- Keyset pagination can only be used when page_offset is 0 (first page).
65
- :param page_offset: The page offset to check
66
- :return: True if keyset pagination should be used, False otherwise
67
- """
68
- # Keyset pagination only works for page 0 (first page)
69
- if self.page_offset != 0:
70
- return False
71
-
72
- # can't use add to custom filter
73
- if self.filters.custom_filter is not None:
74
- return False
75
-
76
- # Check if the resource supports keyset pagination
77
- enable_id_based_paging = getattr(self.filters, "resource", None) in [
78
- FiltersResource.ITEM,
79
- FiltersResource.ANNOTATION,
80
- FiltersResource.FEATURE,
81
- ]
82
-
83
- if not enable_id_based_paging:
84
- return False
85
-
86
- # Check if there's no explicit sort that would prevent keyset pagination
87
- if self._has_explicit_sort(self.filters):
88
- return False
89
-
90
- return True
91
-
92
- def process_result(self, result: dict) -> List[Any]:
93
- """
94
- Process the API result and update pagination state.
95
- :param result: json object
96
- :return: list of items
97
- """
98
- # Only update page_offset if using offset-based pagination
99
- if not self.use_id_based_paging and 'page_offset' in result:
100
- self.page_offset = result['page_offset']
101
- if 'page_size' in result:
102
- self.page_size = result['page_size']
103
- if 'hasNextPage' in result:
104
- self.has_next_page = result['hasNextPage']
105
- if 'totalItemsCount' in result:
106
- self.items_count = result['totalItemsCount']
107
- if 'totalPagesCount' in result:
108
- self.total_pages_count = result['totalPagesCount']
109
- if 'items' in result:
110
- items = self.items_repository._build_entities_from_response(response_items=result['items'])
111
- else:
112
- items = miscellaneous.List(list())
113
- return items
114
-
115
- def __getitem__(self, y: int) -> List[Any]:
116
- # If we're already on the requested page, return current items
117
- if y == self.page_offset:
118
- return self.items
119
- # Otherwise, go to the requested page
120
- self.go_to_page(y)
121
- return self.items
122
-
123
- def __len__(self) -> int:
124
- return self.items_count
125
-
126
- def __iter__(self):
127
- # Use keyset/cursor-based pagination for iteration when possible
128
- self.last_seen_id = None
129
- self.page_offset = 0 # Start from the first page for iteration
130
- self.use_id_based_paging = self._should_use_keyset_pagination()
131
- self.has_next_page = True # Start with assumption that there are more pages
132
- self.page_size = self.page_size or 100
133
- pbar = tqdm.tqdm(total=self.items_count,
134
- disable=self._client_api.verbose.disable_progress_bar_iterate_pages,
135
- file=sys.stdout, desc="Iterate Pages")
136
-
137
- # Get the first page
138
- self.get_page()
139
- if self.items:
140
- yield self.items
141
- pbar.update()
142
-
143
- # Continue with next pages
144
- while self.has_next_page:
145
- if self.use_id_based_paging:
146
- # For keyset pagination, just get the next page
147
- self.page_offset = 0
148
- self.get_page()
149
- else:
150
- # For offset pagination, increment the offset
151
- self._move_page_offset(1)
152
- self.get_page()
153
-
154
- if not self.items:
155
- break
156
- yield self.items
157
- pbar.update()
158
- pbar.close()
159
-
160
- def __reversed__(self):
161
- # Force offset-based pagination for reverse iteration
162
- self.use_id_based_paging = False
163
- self.page_offset = self.total_pages_count - 1
164
- while True:
165
- self.get_page()
166
- yield self.items
167
- if self.page_offset == 0:
168
- break
169
- self._move_page_offset(-1)
170
-
171
- def _move_page_offset(self, offset: int) -> None:
172
- """
173
- Move the page offset by a given step.
174
- :param offset: offset to move
175
- """
176
- self.page_offset += offset
177
- if self.filters.custom_filter is not None:
178
- if 'page' in self.filters.custom_filter and self.filters.custom_filter['page'] != self.page_offset:
179
- self.filters.custom_filter['page'] = self.page_offset
180
-
181
- def return_page(self, page_offset: Optional[int] = None, page_size: Optional[int] = None) -> List[Any]:
182
- """
183
- Return a page of results using offset-based pagination by default.
184
- Switches to keyset/cursor-based pagination when supported and beneficial.
185
- :param page_offset: page offset (for offset-based)
186
- :param page_size: page size
187
- :return: list of items
188
- """
189
- if page_size is not None:
190
- self.page_size = page_size
191
- if page_offset is not None:
192
- self.page_offset = page_offset
193
-
194
- if self.filters is None:
195
- raise ValueError("Can't return page. Filters is empty")
196
- self.filters.page_size = self.page_size
197
- self.filters.page = self.page_offset
198
- req = copy.deepcopy(self.filters)
199
-
200
- # Determine pagination method based on page offset and resource type
201
- self.use_id_based_paging = self._should_use_keyset_pagination()
202
-
203
- if self.use_id_based_paging:
204
- # Use keyset/cursor-based pagination
205
- prepared = req.prepare()
206
- sort_spec = prepared.get("sort", {})
207
- order = next(iter(sort_spec.values()), None)
208
- if order is None:
209
- order = FiltersOrderByDirection.ASCENDING
210
- if order == FiltersOrderByDirection.DESCENDING:
211
- operator_value = FiltersOperations.LESS_THAN
212
- else:
213
- operator_value = FiltersOperations.GREATER_THAN
214
-
215
- req.sort_by(field="id", value=order)
216
- req.page = 0 # always fetch from the start for keyset
217
- # Only add last_seen_id filter if we're not explicitly requesting page 0
218
- if self.last_seen_id:
219
- req.add(
220
- field="id",
221
- values=self.last_seen_id,
222
- operator=operator_value,
223
- method=FiltersOperations.AND,
224
- )
225
- # Fetch data
226
- if self._list_function is None:
227
- result = self.items_repository._list(filters=req)
228
- else:
229
- result = self._list_function(filters=req)
230
-
231
- items = self.process_result(result)
232
-
233
- # Update last_seen_id for keyset
234
- if self.use_id_based_paging and items and hasattr(items[-1], "id"):
235
- self.last_seen_id = items[-1].id
236
- elif self.use_id_based_paging and not items:
237
- self.last_seen_id = None
238
- return items
239
-
240
- def get_page(self, page_offset: Optional[int] = None, page_size: Optional[int] = None) -> None:
241
- """
242
- Get a page of results and update self.items.
243
- :param page_offset: page offset (for offset-based)
244
- :param page_size: page size
245
- """
246
- items = self.return_page(page_offset=page_offset, page_size=page_size)
247
- self.items = items
248
-
249
- def next_page(self) -> None:
250
- """
251
- Brings the next page of items from host.
252
- """
253
- if self.use_id_based_paging:
254
- # For keyset pagination, just get the next page
255
- self.get_page()
256
- else:
257
- # For offset pagination, increment the offset
258
- self._move_page_offset(1)
259
- self.get_page()
260
-
261
- def prev_page(self) -> None:
262
- """
263
- Brings the previous page of items from host.
264
- Only works with offset-based pagination.
265
- """
266
- if self.use_id_based_paging:
267
- raise NotImplementedError("prev_page is not supported for keyset pagination.")
268
- self._move_page_offset(-1)
269
- self.get_page()
270
-
271
- def go_to_page(self, page: int = 0) -> None:
272
- """
273
- Brings specified page of items from host.
274
- For page 0, uses keyset pagination if supported.
275
- For other pages, uses offset-based pagination.
276
- :param page: page number
277
- """
278
- # Reset last_seen_id when going to page 0 to ensure we get all items
279
- if page == 0:
280
- self.last_seen_id = None
281
- self.page_offset = page
282
- self.get_page()
283
-
284
- def all(self):
285
- """
286
- Iterate over all items in all pages efficiently.
287
- Uses the iterator implementation (__iter__).
288
- """
289
- for items in self:
290
- for item in items:
291
- yield item
292
-
293
- ########
294
- # misc #
295
- ########
296
- def print(self, columns=None):
297
- self.items.print(columns=columns)
298
-
299
- def to_df(self, columns=None):
1
+ import logging
2
+ import math
3
+ import time
4
+ import tqdm
5
+ import copy
6
+ import sys
7
+ from typing import Optional, List, Any
8
+
9
+ import attr
10
+
11
+ from .filters import FiltersOperations, FiltersOrderByDirection, FiltersResource
12
+ from .. import miscellaneous
13
+ from ..services.api_client import ApiClient
14
+
15
+ logger = logging.getLogger(name='dtlpy')
16
+
17
+
18
+ @attr.s
19
+ class PagedEntities:
20
+ """
21
+ Pages object for efficient API pagination.
22
+ Defaults to offset-based pagination for compatibility with all operations.
23
+ Switches to keyset/cursor-based pagination (using 'id' as the cursor) during iteration for performance.
24
+ Falls back to offset-based pagination if keyset is not possible (e.g., custom sort).
25
+ """
26
+ # api
27
+ _client_api: ApiClient = attr.ib(repr=False)
28
+
29
+ # params
30
+ page_offset: int = attr.ib()
31
+ page_size: int = attr.ib()
32
+ filters: Any = attr.ib()
33
+ items_repository: Any = attr.ib(repr=False)
34
+ has_next_page: bool = attr.ib(default=False)
35
+ total_pages_count: int = attr.ib(default=0)
36
+ items_count: int = attr.ib(default=0)
37
+
38
+ # hybrid pagination
39
+ use_id_based_paging: bool = attr.ib(default=False) # Default to False for offset-based pagination
40
+ last_seen_id: Optional[Any] = attr.ib(default=None)
41
+
42
+ # execution attribute
43
+ _service_id = attr.ib(default=None, repr=False)
44
+ _project_id = attr.ib(default=None, repr=False)
45
+ _list_function = attr.ib(default=None, repr=False)
46
+
47
+ # items list
48
+ items: List[Any] = attr.ib(default=miscellaneous.List(), repr=False)
49
+
50
+ @staticmethod
51
+ def _has_explicit_sort(flt) -> bool:
52
+ """
53
+ Check if the filter has custom sort fields defined (not id/createdAt).
54
+ """
55
+ prepared = flt.prepare() if flt else {}
56
+ sort_fields = list(prepared.get("sort", {}).keys())
57
+ if isinstance(sort_fields, list) and len(sort_fields) > 0:
58
+ return sort_fields[0] not in {"id", "createdAt"}
59
+ return False
60
+
61
+ def _should_use_keyset_pagination(self) -> bool:
62
+ """
63
+ Determine whether to use keyset pagination based on page offset and resource type.
64
+ Keyset pagination can only be used when page_offset is 0 (first page).
65
+ :param page_offset: The page offset to check
66
+ :return: True if keyset pagination should be used, False otherwise
67
+ """
68
+ # Keyset pagination only works for page 0 (first page)
69
+ if self.page_offset != 0:
70
+ return False
71
+
72
+ # can't use add to custom filter
73
+ if self.filters.custom_filter is not None:
74
+ return False
75
+
76
+ # Check if the resource supports keyset pagination
77
+ enable_id_based_paging = getattr(self.filters, "resource", None) in [
78
+ FiltersResource.ITEM,
79
+ FiltersResource.ANNOTATION,
80
+ FiltersResource.FEATURE,
81
+ ]
82
+
83
+ if not enable_id_based_paging:
84
+ return False
85
+
86
+ # Check if there's no explicit sort that would prevent keyset pagination
87
+ if self._has_explicit_sort(self.filters):
88
+ return False
89
+
90
+ return True
91
+
92
+ def process_result(self, result: dict) -> List[Any]:
93
+ """
94
+ Process the API result and update pagination state.
95
+ :param result: json object
96
+ :return: list of items
97
+ """
98
+ # Only update page_offset if using offset-based pagination
99
+ if not self.use_id_based_paging and 'page_offset' in result:
100
+ self.page_offset = result['page_offset']
101
+ if 'page_size' in result:
102
+ self.page_size = result['page_size']
103
+ if 'hasNextPage' in result:
104
+ self.has_next_page = result['hasNextPage']
105
+ if 'totalItemsCount' in result:
106
+ self.items_count = result['totalItemsCount']
107
+ if 'totalPagesCount' in result:
108
+ self.total_pages_count = result['totalPagesCount']
109
+ if 'items' in result:
110
+ items = self.items_repository._build_entities_from_response(response_items=result['items'])
111
+ else:
112
+ items = miscellaneous.List(list())
113
+ return items
114
+
115
+ def __getitem__(self, y: int) -> List[Any]:
116
+ # If we're already on the requested page, return current items
117
+ if y == self.page_offset:
118
+ return self.items
119
+ # Otherwise, go to the requested page
120
+ self.go_to_page(y)
121
+ return self.items
122
+
123
+ def __len__(self) -> int:
124
+ return self.items_count
125
+
126
+ def __iter__(self):
127
+ # Use keyset/cursor-based pagination for iteration when possible
128
+ self.last_seen_id = None
129
+ self.page_offset = 0 # Start from the first page for iteration
130
+ self.use_id_based_paging = self._should_use_keyset_pagination()
131
+ self.has_next_page = True # Start with assumption that there are more pages
132
+ self.page_size = self.page_size or 100
133
+ pbar = tqdm.tqdm(total=self.items_count,
134
+ disable=self._client_api.verbose.disable_progress_bar_iterate_pages,
135
+ file=sys.stdout, desc="Iterate Pages")
136
+
137
+ # Get the first page
138
+ self.get_page()
139
+ if self.items:
140
+ yield self.items
141
+ pbar.update()
142
+
143
+ # Continue with next pages
144
+ while self.has_next_page:
145
+ if self.use_id_based_paging:
146
+ # For keyset pagination, just get the next page
147
+ self.page_offset = 0
148
+ self.get_page()
149
+ else:
150
+ # For offset pagination, increment the offset
151
+ self._move_page_offset(1)
152
+ self.get_page()
153
+
154
+ if not self.items:
155
+ break
156
+ yield self.items
157
+ pbar.update()
158
+ pbar.close()
159
+
160
+ def __reversed__(self):
161
+ # Force offset-based pagination for reverse iteration
162
+ self.use_id_based_paging = False
163
+ self.page_offset = self.total_pages_count - 1
164
+ while True:
165
+ self.get_page()
166
+ yield self.items
167
+ if self.page_offset == 0:
168
+ break
169
+ self._move_page_offset(-1)
170
+
171
+ def _move_page_offset(self, offset: int) -> None:
172
+ """
173
+ Move the page offset by a given step.
174
+ :param offset: offset to move
175
+ """
176
+ self.page_offset += offset
177
+ if self.filters.custom_filter is not None:
178
+ if 'page' in self.filters.custom_filter and self.filters.custom_filter['page'] != self.page_offset:
179
+ self.filters.custom_filter['page'] = self.page_offset
180
+
181
+ def return_page(self, page_offset: Optional[int] = None, page_size: Optional[int] = None) -> List[Any]:
182
+ """
183
+ Return a page of results using offset-based pagination by default.
184
+ Switches to keyset/cursor-based pagination when supported and beneficial.
185
+ :param page_offset: page offset (for offset-based)
186
+ :param page_size: page size
187
+ :return: list of items
188
+ """
189
+ if page_size is not None:
190
+ self.page_size = page_size
191
+ if page_offset is not None:
192
+ self.page_offset = page_offset
193
+
194
+ if self.filters is None:
195
+ raise ValueError("Can't return page. Filters is empty")
196
+ self.filters.page_size = self.page_size
197
+ self.filters.page = self.page_offset
198
+ req = copy.deepcopy(self.filters)
199
+
200
+ # Determine pagination method based on page offset and resource type
201
+ self.use_id_based_paging = self._should_use_keyset_pagination()
202
+
203
+ if self.use_id_based_paging:
204
+ # Use keyset/cursor-based pagination
205
+ prepared = req.prepare()
206
+ sort_spec = prepared.get("sort", {})
207
+ order = next(iter(sort_spec.values()), None)
208
+ if order is None:
209
+ order = FiltersOrderByDirection.ASCENDING
210
+ if order == FiltersOrderByDirection.DESCENDING:
211
+ operator_value = FiltersOperations.LESS_THAN
212
+ else:
213
+ operator_value = FiltersOperations.GREATER_THAN
214
+
215
+ req.sort_by(field="id", value=order)
216
+ req.page = 0 # always fetch from the start for keyset
217
+ # Only add last_seen_id filter if we're not explicitly requesting page 0
218
+ if self.last_seen_id:
219
+ req.add(
220
+ field="id",
221
+ values=self.last_seen_id,
222
+ operator=operator_value,
223
+ method=FiltersOperations.AND,
224
+ )
225
+ # Fetch data
226
+ if self._list_function is None:
227
+ result = self.items_repository._list(filters=req)
228
+ else:
229
+ result = self._list_function(filters=req)
230
+
231
+ items = self.process_result(result)
232
+
233
+ # Update last_seen_id for keyset
234
+ if self.use_id_based_paging and items and hasattr(items[-1], "id"):
235
+ self.last_seen_id = items[-1].id
236
+ elif self.use_id_based_paging and not items:
237
+ self.last_seen_id = None
238
+ return items
239
+
240
+ def get_page(self, page_offset: Optional[int] = None, page_size: Optional[int] = None) -> None:
241
+ """
242
+ Get a page of results and update self.items.
243
+ :param page_offset: page offset (for offset-based)
244
+ :param page_size: page size
245
+ """
246
+ items = self.return_page(page_offset=page_offset, page_size=page_size)
247
+ self.items = items
248
+
249
+ def next_page(self) -> None:
250
+ """
251
+ Brings the next page of items from host.
252
+ """
253
+ if self.use_id_based_paging:
254
+ # For keyset pagination, just get the next page
255
+ self.get_page()
256
+ else:
257
+ # For offset pagination, increment the offset
258
+ self._move_page_offset(1)
259
+ self.get_page()
260
+
261
+ def prev_page(self) -> None:
262
+ """
263
+ Brings the previous page of items from host.
264
+ Only works with offset-based pagination.
265
+ """
266
+ if self.use_id_based_paging:
267
+ raise NotImplementedError("prev_page is not supported for keyset pagination.")
268
+ self._move_page_offset(-1)
269
+ self.get_page()
270
+
271
+ def go_to_page(self, page: int = 0) -> None:
272
+ """
273
+ Brings specified page of items from host.
274
+ For page 0, uses keyset pagination if supported.
275
+ For other pages, uses offset-based pagination.
276
+ :param page: page number
277
+ """
278
+ # Reset last_seen_id when going to page 0 to ensure we get all items
279
+ if page == 0:
280
+ self.last_seen_id = None
281
+ self.page_offset = page
282
+ self.get_page()
283
+
284
+ def all(self):
285
+ """
286
+ Iterate over all items in all pages efficiently.
287
+ Uses the iterator implementation (__iter__).
288
+ """
289
+ for items in self:
290
+ for item in items:
291
+ yield item
292
+
293
+ ########
294
+ # misc #
295
+ ########
296
+ def print(self, columns=None):
297
+ self.items.print(columns=columns)
298
+
299
+ def to_df(self, columns=None):
300
300
  return self.items.to_df(columns=columns)