dtlpy 1.113.10__py3-none-any.whl → 1.114.13__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (243) hide show
  1. dtlpy/__init__.py +488 -488
  2. dtlpy/__version__.py +1 -1
  3. dtlpy/assets/__init__.py +26 -26
  4. dtlpy/assets/__pycache__/__init__.cpython-38.pyc +0 -0
  5. dtlpy/assets/code_server/config.yaml +2 -2
  6. dtlpy/assets/code_server/installation.sh +24 -24
  7. dtlpy/assets/code_server/launch.json +13 -13
  8. dtlpy/assets/code_server/settings.json +2 -2
  9. dtlpy/assets/main.py +53 -53
  10. dtlpy/assets/main_partial.py +18 -18
  11. dtlpy/assets/mock.json +11 -11
  12. dtlpy/assets/model_adapter.py +83 -83
  13. dtlpy/assets/package.json +61 -61
  14. dtlpy/assets/package_catalog.json +29 -29
  15. dtlpy/assets/package_gitignore +307 -307
  16. dtlpy/assets/service_runners/__init__.py +33 -33
  17. dtlpy/assets/service_runners/converter.py +96 -96
  18. dtlpy/assets/service_runners/multi_method.py +49 -49
  19. dtlpy/assets/service_runners/multi_method_annotation.py +54 -54
  20. dtlpy/assets/service_runners/multi_method_dataset.py +55 -55
  21. dtlpy/assets/service_runners/multi_method_item.py +52 -52
  22. dtlpy/assets/service_runners/multi_method_json.py +52 -52
  23. dtlpy/assets/service_runners/single_method.py +37 -37
  24. dtlpy/assets/service_runners/single_method_annotation.py +43 -43
  25. dtlpy/assets/service_runners/single_method_dataset.py +43 -43
  26. dtlpy/assets/service_runners/single_method_item.py +41 -41
  27. dtlpy/assets/service_runners/single_method_json.py +42 -42
  28. dtlpy/assets/service_runners/single_method_multi_input.py +45 -45
  29. dtlpy/assets/voc_annotation_template.xml +23 -23
  30. dtlpy/caches/base_cache.py +32 -32
  31. dtlpy/caches/cache.py +473 -473
  32. dtlpy/caches/dl_cache.py +201 -201
  33. dtlpy/caches/filesystem_cache.py +89 -89
  34. dtlpy/caches/redis_cache.py +84 -84
  35. dtlpy/dlp/__init__.py +20 -20
  36. dtlpy/dlp/cli_utilities.py +367 -367
  37. dtlpy/dlp/command_executor.py +764 -764
  38. dtlpy/dlp/dlp +1 -1
  39. dtlpy/dlp/dlp.bat +1 -1
  40. dtlpy/dlp/dlp.py +128 -128
  41. dtlpy/dlp/parser.py +651 -651
  42. dtlpy/entities/__init__.py +83 -83
  43. dtlpy/entities/analytic.py +311 -311
  44. dtlpy/entities/annotation.py +1879 -1879
  45. dtlpy/entities/annotation_collection.py +699 -699
  46. dtlpy/entities/annotation_definitions/__init__.py +20 -20
  47. dtlpy/entities/annotation_definitions/base_annotation_definition.py +100 -100
  48. dtlpy/entities/annotation_definitions/box.py +195 -195
  49. dtlpy/entities/annotation_definitions/classification.py +67 -67
  50. dtlpy/entities/annotation_definitions/comparison.py +72 -72
  51. dtlpy/entities/annotation_definitions/cube.py +204 -204
  52. dtlpy/entities/annotation_definitions/cube_3d.py +149 -149
  53. dtlpy/entities/annotation_definitions/description.py +32 -32
  54. dtlpy/entities/annotation_definitions/ellipse.py +124 -124
  55. dtlpy/entities/annotation_definitions/free_text.py +62 -62
  56. dtlpy/entities/annotation_definitions/gis.py +69 -69
  57. dtlpy/entities/annotation_definitions/note.py +139 -139
  58. dtlpy/entities/annotation_definitions/point.py +117 -117
  59. dtlpy/entities/annotation_definitions/polygon.py +182 -182
  60. dtlpy/entities/annotation_definitions/polyline.py +111 -111
  61. dtlpy/entities/annotation_definitions/pose.py +92 -92
  62. dtlpy/entities/annotation_definitions/ref_image.py +86 -86
  63. dtlpy/entities/annotation_definitions/segmentation.py +240 -240
  64. dtlpy/entities/annotation_definitions/subtitle.py +34 -34
  65. dtlpy/entities/annotation_definitions/text.py +85 -85
  66. dtlpy/entities/annotation_definitions/undefined_annotation.py +74 -74
  67. dtlpy/entities/app.py +220 -220
  68. dtlpy/entities/app_module.py +107 -107
  69. dtlpy/entities/artifact.py +174 -174
  70. dtlpy/entities/assignment.py +399 -399
  71. dtlpy/entities/base_entity.py +214 -214
  72. dtlpy/entities/bot.py +113 -113
  73. dtlpy/entities/codebase.py +296 -296
  74. dtlpy/entities/collection.py +38 -38
  75. dtlpy/entities/command.py +169 -169
  76. dtlpy/entities/compute.py +442 -442
  77. dtlpy/entities/dataset.py +1285 -1285
  78. dtlpy/entities/directory_tree.py +44 -44
  79. dtlpy/entities/dpk.py +470 -470
  80. dtlpy/entities/driver.py +222 -222
  81. dtlpy/entities/execution.py +397 -397
  82. dtlpy/entities/feature.py +124 -124
  83. dtlpy/entities/feature_set.py +145 -145
  84. dtlpy/entities/filters.py +641 -641
  85. dtlpy/entities/gis_item.py +107 -107
  86. dtlpy/entities/integration.py +184 -184
  87. dtlpy/entities/item.py +953 -953
  88. dtlpy/entities/label.py +123 -123
  89. dtlpy/entities/links.py +85 -85
  90. dtlpy/entities/message.py +175 -175
  91. dtlpy/entities/model.py +694 -691
  92. dtlpy/entities/node.py +1005 -1005
  93. dtlpy/entities/ontology.py +803 -803
  94. dtlpy/entities/organization.py +287 -287
  95. dtlpy/entities/package.py +657 -657
  96. dtlpy/entities/package_defaults.py +5 -5
  97. dtlpy/entities/package_function.py +185 -185
  98. dtlpy/entities/package_module.py +113 -113
  99. dtlpy/entities/package_slot.py +118 -118
  100. dtlpy/entities/paged_entities.py +290 -267
  101. dtlpy/entities/pipeline.py +593 -593
  102. dtlpy/entities/pipeline_execution.py +279 -279
  103. dtlpy/entities/project.py +394 -394
  104. dtlpy/entities/prompt_item.py +499 -499
  105. dtlpy/entities/recipe.py +301 -301
  106. dtlpy/entities/reflect_dict.py +102 -102
  107. dtlpy/entities/resource_execution.py +138 -138
  108. dtlpy/entities/service.py +958 -958
  109. dtlpy/entities/service_driver.py +117 -117
  110. dtlpy/entities/setting.py +294 -294
  111. dtlpy/entities/task.py +491 -491
  112. dtlpy/entities/time_series.py +143 -143
  113. dtlpy/entities/trigger.py +426 -426
  114. dtlpy/entities/user.py +118 -118
  115. dtlpy/entities/webhook.py +124 -124
  116. dtlpy/examples/__init__.py +19 -19
  117. dtlpy/examples/add_labels.py +135 -135
  118. dtlpy/examples/add_metadata_to_item.py +21 -21
  119. dtlpy/examples/annotate_items_using_model.py +65 -65
  120. dtlpy/examples/annotate_video_using_model_and_tracker.py +75 -75
  121. dtlpy/examples/annotations_convert_to_voc.py +9 -9
  122. dtlpy/examples/annotations_convert_to_yolo.py +9 -9
  123. dtlpy/examples/convert_annotation_types.py +51 -51
  124. dtlpy/examples/converter.py +143 -143
  125. dtlpy/examples/copy_annotations.py +22 -22
  126. dtlpy/examples/copy_folder.py +31 -31
  127. dtlpy/examples/create_annotations.py +51 -51
  128. dtlpy/examples/create_video_annotations.py +83 -83
  129. dtlpy/examples/delete_annotations.py +26 -26
  130. dtlpy/examples/filters.py +113 -113
  131. dtlpy/examples/move_item.py +23 -23
  132. dtlpy/examples/play_video_annotation.py +13 -13
  133. dtlpy/examples/show_item_and_mask.py +53 -53
  134. dtlpy/examples/triggers.py +49 -49
  135. dtlpy/examples/upload_batch_of_items.py +20 -20
  136. dtlpy/examples/upload_items_and_custom_format_annotations.py +55 -55
  137. dtlpy/examples/upload_items_with_modalities.py +43 -43
  138. dtlpy/examples/upload_segmentation_annotations_from_mask_image.py +44 -44
  139. dtlpy/examples/upload_yolo_format_annotations.py +70 -70
  140. dtlpy/exceptions.py +125 -125
  141. dtlpy/miscellaneous/__init__.py +20 -20
  142. dtlpy/miscellaneous/dict_differ.py +95 -95
  143. dtlpy/miscellaneous/git_utils.py +217 -217
  144. dtlpy/miscellaneous/json_utils.py +14 -14
  145. dtlpy/miscellaneous/list_print.py +105 -105
  146. dtlpy/miscellaneous/zipping.py +130 -130
  147. dtlpy/ml/__init__.py +20 -20
  148. dtlpy/ml/base_feature_extractor_adapter.py +27 -27
  149. dtlpy/ml/base_model_adapter.py +945 -940
  150. dtlpy/ml/metrics.py +461 -461
  151. dtlpy/ml/predictions_utils.py +274 -274
  152. dtlpy/ml/summary_writer.py +57 -57
  153. dtlpy/ml/train_utils.py +60 -60
  154. dtlpy/new_instance.py +252 -252
  155. dtlpy/repositories/__init__.py +56 -56
  156. dtlpy/repositories/analytics.py +85 -85
  157. dtlpy/repositories/annotations.py +916 -916
  158. dtlpy/repositories/apps.py +383 -383
  159. dtlpy/repositories/artifacts.py +452 -452
  160. dtlpy/repositories/assignments.py +599 -599
  161. dtlpy/repositories/bots.py +213 -213
  162. dtlpy/repositories/codebases.py +559 -559
  163. dtlpy/repositories/collections.py +332 -348
  164. dtlpy/repositories/commands.py +158 -158
  165. dtlpy/repositories/compositions.py +61 -61
  166. dtlpy/repositories/computes.py +434 -406
  167. dtlpy/repositories/datasets.py +1291 -1291
  168. dtlpy/repositories/downloader.py +895 -895
  169. dtlpy/repositories/dpks.py +433 -433
  170. dtlpy/repositories/drivers.py +266 -266
  171. dtlpy/repositories/executions.py +817 -817
  172. dtlpy/repositories/feature_sets.py +226 -226
  173. dtlpy/repositories/features.py +238 -238
  174. dtlpy/repositories/integrations.py +484 -484
  175. dtlpy/repositories/items.py +909 -915
  176. dtlpy/repositories/messages.py +94 -94
  177. dtlpy/repositories/models.py +877 -867
  178. dtlpy/repositories/nodes.py +80 -80
  179. dtlpy/repositories/ontologies.py +511 -511
  180. dtlpy/repositories/organizations.py +525 -525
  181. dtlpy/repositories/packages.py +1941 -1941
  182. dtlpy/repositories/pipeline_executions.py +448 -448
  183. dtlpy/repositories/pipelines.py +642 -642
  184. dtlpy/repositories/projects.py +539 -539
  185. dtlpy/repositories/recipes.py +399 -399
  186. dtlpy/repositories/resource_executions.py +137 -137
  187. dtlpy/repositories/schema.py +120 -120
  188. dtlpy/repositories/service_drivers.py +213 -213
  189. dtlpy/repositories/services.py +1704 -1704
  190. dtlpy/repositories/settings.py +339 -339
  191. dtlpy/repositories/tasks.py +1124 -1124
  192. dtlpy/repositories/times_series.py +278 -278
  193. dtlpy/repositories/triggers.py +536 -536
  194. dtlpy/repositories/upload_element.py +257 -257
  195. dtlpy/repositories/uploader.py +651 -651
  196. dtlpy/repositories/webhooks.py +249 -249
  197. dtlpy/services/__init__.py +22 -22
  198. dtlpy/services/aihttp_retry.py +131 -131
  199. dtlpy/services/api_client.py +1782 -1782
  200. dtlpy/services/api_reference.py +40 -40
  201. dtlpy/services/async_utils.py +133 -133
  202. dtlpy/services/calls_counter.py +44 -44
  203. dtlpy/services/check_sdk.py +68 -68
  204. dtlpy/services/cookie.py +115 -115
  205. dtlpy/services/create_logger.py +156 -156
  206. dtlpy/services/events.py +84 -84
  207. dtlpy/services/logins.py +235 -235
  208. dtlpy/services/reporter.py +256 -256
  209. dtlpy/services/service_defaults.py +91 -91
  210. dtlpy/utilities/__init__.py +20 -20
  211. dtlpy/utilities/annotations/__init__.py +16 -16
  212. dtlpy/utilities/annotations/annotation_converters.py +269 -269
  213. dtlpy/utilities/base_package_runner.py +264 -264
  214. dtlpy/utilities/converter.py +1650 -1650
  215. dtlpy/utilities/dataset_generators/__init__.py +1 -1
  216. dtlpy/utilities/dataset_generators/dataset_generator.py +670 -670
  217. dtlpy/utilities/dataset_generators/dataset_generator_tensorflow.py +23 -23
  218. dtlpy/utilities/dataset_generators/dataset_generator_torch.py +21 -21
  219. dtlpy/utilities/local_development/__init__.py +1 -1
  220. dtlpy/utilities/local_development/local_session.py +179 -179
  221. dtlpy/utilities/reports/__init__.py +2 -2
  222. dtlpy/utilities/reports/figures.py +343 -343
  223. dtlpy/utilities/reports/report.py +71 -71
  224. dtlpy/utilities/videos/__init__.py +17 -17
  225. dtlpy/utilities/videos/video_player.py +598 -598
  226. dtlpy/utilities/videos/videos.py +470 -470
  227. {dtlpy-1.113.10.data → dtlpy-1.114.13.data}/scripts/dlp +1 -1
  228. dtlpy-1.114.13.data/scripts/dlp.bat +2 -0
  229. {dtlpy-1.113.10.data → dtlpy-1.114.13.data}/scripts/dlp.py +128 -128
  230. {dtlpy-1.113.10.dist-info → dtlpy-1.114.13.dist-info}/LICENSE +200 -200
  231. {dtlpy-1.113.10.dist-info → dtlpy-1.114.13.dist-info}/METADATA +172 -172
  232. dtlpy-1.114.13.dist-info/RECORD +240 -0
  233. {dtlpy-1.113.10.dist-info → dtlpy-1.114.13.dist-info}/WHEEL +1 -1
  234. tests/features/environment.py +551 -550
  235. dtlpy-1.113.10.data/scripts/dlp.bat +0 -2
  236. dtlpy-1.113.10.dist-info/RECORD +0 -244
  237. tests/assets/__init__.py +0 -0
  238. tests/assets/models_flow/__init__.py +0 -0
  239. tests/assets/models_flow/failedmain.py +0 -52
  240. tests/assets/models_flow/main.py +0 -62
  241. tests/assets/models_flow/main_model.py +0 -54
  242. {dtlpy-1.113.10.dist-info → dtlpy-1.114.13.dist-info}/entry_points.txt +0 -0
  243. {dtlpy-1.113.10.dist-info → dtlpy-1.114.13.dist-info}/top_level.txt +0 -0
@@ -1,268 +1,291 @@
1
- import logging
2
- import math
3
- import time
4
- import tqdm
5
- import copy
6
- import sys
7
-
8
- import attr
9
-
10
- from .filters import FiltersOperations, FiltersOrderByDirection, FiltersResource
11
- from .. import miscellaneous
12
- from ..services.api_client import ApiClient
13
-
14
- logger = logging.getLogger(name='dtlpy')
15
-
16
-
17
- @attr.s
18
- class PagedEntities:
19
- """
20
- Pages object
21
- """
22
- # api
23
- _client_api = attr.ib(type=ApiClient, repr=False)
24
-
25
- # params
26
- page_offset = attr.ib()
27
- page_size = attr.ib()
28
- filters = attr.ib()
29
- items_repository = attr.ib(repr=False)
30
- has_next_page = attr.ib(default=False)
31
- total_pages_count = attr.ib(default=0)
32
- items_count = attr.ib(default=0)
33
-
34
- # hybrid pagination
35
- use_id_based_paging = attr.ib(default=False)
36
- last_seen_id = attr.ib(default=None)
37
-
38
- # execution attribute
39
- _service_id = attr.ib(default=None, repr=False)
40
- _project_id = attr.ib(default=None, repr=False)
41
- _order_by_type = attr.ib(default=None, repr=False)
42
- _order_by_direction = attr.ib(default=None, repr=False)
43
- _execution_status = attr.ib(default=None, repr=False)
44
- _execution_resource_type = attr.ib(default=None, repr=False)
45
- _execution_resource_id = attr.ib(default=None, repr=False)
46
- _execution_function_name = attr.ib(default=None, repr=False)
47
- _list_function = attr.ib(default=None, repr=False)
48
-
49
- # items list
50
- items = attr.ib(default=miscellaneous.List(), repr=False)
51
-
52
- @staticmethod
53
- def _has_explicit_sort(flt):
54
- """
55
- Check if the filter has custom sort fields defined (not id/createdAt).
56
- """
57
- prepared = flt.prepare() if flt else {}
58
- sort_fields = list(prepared.get("sort", {}).keys())
59
- return bool(sort_fields and sort_fields[0] not in {"id", "createdAt"})
60
-
61
- def process_result(self, result):
62
- """
63
- :param result: json object
64
- """
65
- if 'page_offset' in result:
66
- self.page_offset = result['page_offset']
67
- if 'page_size' in result:
68
- self.page_size = result['page_size']
69
- if 'hasNextPage' in result:
70
- self.has_next_page = result['hasNextPage']
71
- if 'totalItemsCount' in result:
72
- self.items_count = result['totalItemsCount']
73
- if 'totalPagesCount' in result:
74
- self.total_pages_count = result['totalPagesCount']
75
- if 'items' in result:
76
- items = self.items_repository._build_entities_from_response(response_items=result['items'])
77
- else:
78
- items = miscellaneous.List(list())
79
- return items
80
-
81
- def __getitem__(self, y):
82
- self.go_to_page(y)
83
- return self.items
84
-
85
- def __len__(self):
86
- return self.items_count
87
-
88
- def __iter__(self):
89
- pbar = tqdm.tqdm(total=self.total_pages_count,
90
- disable=self._client_api.verbose.disable_progress_bar_iterate_pages,
91
- file=sys.stdout, desc="Iterate Pages")
92
- if self.page_offset != 0:
93
- # reset the count for page 0
94
- self.page_offset = 0
95
- self.get_page()
96
- while True:
97
- yield self.items
98
- pbar.update()
99
-
100
- if self.has_next_page:
101
- self.page_offset += 1
102
- self.get_page()
103
- else:
104
- pbar.close()
105
- break
106
-
107
- def __reversed__(self):
108
- self.page_offset = self.total_pages_count - 1
109
- while True:
110
- self.get_page()
111
- yield self.items
112
- if self.page_offset == 0:
113
- break
114
- self.page_offset -= 1
115
-
116
- def return_page(self, page_offset=None, page_size=None):
117
- """
118
- Return page
119
-
120
- :param page_offset: page offset
121
- :param page_size: page size
122
- """
123
- if page_size is None:
124
- page_size = self.page_size
125
- if page_offset is None:
126
- page_offset = self.page_offset
127
-
128
- if self.filters is None:
129
- raise ValueError("Cant return page. Filters is empty")
130
-
131
- req = copy.deepcopy(self.filters)
132
- req.page_size = page_size
133
-
134
- after_id = getattr(req, "after_id", None)
135
- if after_id is not None:
136
- delattr(req, "after_id")
137
-
138
- enable_hybrid = getattr(self.filters, "resource", None) in [
139
- FiltersResource.ITEM,
140
- FiltersResource.ANNOTATION,
141
- FiltersResource.FEATURE,
142
- ]
143
-
144
- prepared= req.prepare()
145
- sort_spec= prepared.get("sort", {})
146
- sort_dir= next(iter(sort_spec.values()), None)
147
- order= sort_dir or FiltersOrderByDirection.ASCENDING
148
- operator_value = (FiltersOperations.LESS_THAN if sort_dir == FiltersOrderByDirection.DESCENDING else FiltersOperations.GREATER_THAN)
149
-
150
- if enable_hybrid and not self._has_explicit_sort(req):
151
- req.sort_by(field="id", value=order)
152
-
153
- if enable_hybrid and self.use_id_based_paging:
154
- req.page = 0
155
- if self.last_seen_id:
156
- req.add(
157
- field="id",
158
- values=self.last_seen_id,
159
- operator=operator_value,
160
- method=FiltersOperations.AND,
161
- )
162
- else:
163
- auto_hybrid = (
164
- enable_hybrid
165
- and not self.use_id_based_paging
166
- and not self._has_explicit_sort(self.filters)
167
- and self.last_seen_id is not None
168
- )
169
- if auto_hybrid and page_offset > 0:
170
- req.page = 0
171
- req.add(
172
- field="id",
173
- values=after_id or self.last_seen_id,
174
- operator=operator_value,
175
- method=FiltersOperations.AND,
176
- )
177
- self.use_id_based_paging = True
178
- else:
179
- req.page = page_offset
180
-
181
- if self._list_function is None:
182
- result = self.items_repository._list(filters=req)
183
- else:
184
- result = self._list_function(filters=req)
185
-
186
- items = self.process_result(result)
187
-
188
- if enable_hybrid and items and hasattr(items[-1], "id"):
189
- self.last_seen_id = items[-1].id
190
-
191
- if self.use_id_based_paging:
192
- if "hasNextPage" not in result:
193
- self.has_next_page = len(items) == page_size
194
-
195
- return items
196
-
197
- def get_page(self, page_offset=None, page_size=None):
198
- """
199
- Get page
200
-
201
- :param page_offset: page offset
202
- :param page_size: page size
203
- """
204
- items = self.return_page(page_offset=page_offset,
205
- page_size=page_size)
206
- self.items = items
207
-
208
- def next_page(self):
209
- """
210
- Brings the next page of items from host
211
-
212
- :return:
213
- """
214
- self.page_offset += 1
215
- self.get_page()
216
-
217
- def prev_page(self):
218
- """
219
- Brings the previous page of items from host
220
-
221
- :return:
222
- """
223
- self.page_offset -= 1
224
- self.get_page()
225
-
226
- def go_to_page(self, page=0):
227
- """
228
- Brings specified page of items from host
229
-
230
- :param page: page number
231
- :return:
232
- """
233
- self.page_offset = page
234
- self.get_page()
235
-
236
- def all(self):
237
- page_offset = 0
238
- page_size = 100
239
- pbar = tqdm.tqdm(total=self.items_count,
240
- disable=self._client_api.verbose.disable_progress_bar,
241
- file=sys.stdout, desc='Iterate Entity')
242
- total_pages = math.ceil(self.items_count / page_size)
243
- jobs = list()
244
- pool = self._client_api.thread_pools('item.page')
245
- while True:
246
- time.sleep(0.01) # to flush the results
247
- if page_offset <= total_pages:
248
- jobs.append(pool.submit(self.return_page, **{'page_offset': page_offset,
249
- 'page_size': page_size}))
250
- page_offset += 1
251
- for i_job, job in enumerate(jobs):
252
- if job.done():
253
- for item in job.result():
254
- pbar.update()
255
- yield item
256
- jobs.remove(job)
257
- if len(jobs) == 0:
258
- pbar.close()
259
- break
260
-
261
- ########
262
- # misc #
263
- ########
264
- def print(self, columns=None):
265
- self.items.print(columns=columns)
266
-
267
- def to_df(self, columns=None):
1
+ import logging
2
+ import math
3
+ import time
4
+ import tqdm
5
+ import copy
6
+ import sys
7
+ from typing import Optional, List, Any
8
+
9
+ import attr
10
+
11
+ from .filters import FiltersOperations, FiltersOrderByDirection, FiltersResource
12
+ from .. import miscellaneous
13
+ from ..services.api_client import ApiClient
14
+
15
+ logger = logging.getLogger(name='dtlpy')
16
+
17
+
18
+ @attr.s
19
+ class PagedEntities:
20
+ """
21
+ Pages object for efficient API pagination.
22
+ Defaults to offset-based pagination for compatibility with all operations.
23
+ Switches to keyset/cursor-based pagination (using 'id' as the cursor) during iteration for performance.
24
+ Falls back to offset-based pagination if keyset is not possible (e.g., custom sort).
25
+ """
26
+ # api
27
+ _client_api: ApiClient = attr.ib(repr=False)
28
+
29
+ # params
30
+ page_offset: int = attr.ib()
31
+ page_size: int = attr.ib()
32
+ filters: Any = attr.ib()
33
+ items_repository: Any = attr.ib(repr=False)
34
+ has_next_page: bool = attr.ib(default=False)
35
+ total_pages_count: int = attr.ib(default=0)
36
+ items_count: int = attr.ib(default=0)
37
+
38
+ # hybrid pagination
39
+ use_id_based_paging: bool = attr.ib(default=False) # Default to False for offset-based pagination
40
+ last_seen_id: Optional[Any] = attr.ib(default=None)
41
+
42
+ # execution attribute
43
+ _service_id = attr.ib(default=None, repr=False)
44
+ _project_id = attr.ib(default=None, repr=False)
45
+ _list_function = attr.ib(default=None, repr=False)
46
+
47
+ # items list
48
+ items: List[Any] = attr.ib(default=miscellaneous.List(), repr=False)
49
+
50
+ @staticmethod
51
+ def _has_explicit_sort(flt) -> bool:
52
+ """
53
+ Check if the filter has custom sort fields defined (not id/createdAt).
54
+ """
55
+ prepared = flt.prepare() if flt else {}
56
+ sort_fields = list(prepared.get("sort", {}).keys())
57
+ if isinstance(sort_fields, list) and len(sort_fields) > 0:
58
+ return sort_fields[0] not in {"id", "createdAt"}
59
+ return False
60
+
61
+ def _should_use_keyset_pagination(self) -> bool:
62
+ """
63
+ Determine whether to use keyset pagination based on page offset and resource type.
64
+ Keyset pagination can only be used when page_offset is 0 (first page).
65
+ :param page_offset: The page offset to check
66
+ :return: True if keyset pagination should be used, False otherwise
67
+ """
68
+ # Keyset pagination only works for page 0 (first page)
69
+ if self.page_offset != 0:
70
+ return False
71
+
72
+ # can't use add to custom filter
73
+ if self.filters.custom_filter is not None:
74
+ return False
75
+
76
+ # Check if the resource supports keyset pagination
77
+ enable_id_based_paging = getattr(self.filters, "resource", None) in [
78
+ FiltersResource.ITEM,
79
+ FiltersResource.ANNOTATION,
80
+ FiltersResource.FEATURE,
81
+ ]
82
+
83
+ if not enable_id_based_paging:
84
+ return False
85
+
86
+ # Check if there's no explicit sort that would prevent keyset pagination
87
+ if self._has_explicit_sort(self.filters):
88
+ return False
89
+
90
+ return True
91
+
92
+ def process_result(self, result: dict) -> List[Any]:
93
+ """
94
+ Process the API result and update pagination state.
95
+ :param result: json object
96
+ :return: list of items
97
+ """
98
+ # Only update page_offset if using offset-based pagination
99
+ if not self.use_id_based_paging and 'page_offset' in result:
100
+ self.page_offset = result['page_offset']
101
+ if 'page_size' in result:
102
+ self.page_size = result['page_size']
103
+ if 'hasNextPage' in result:
104
+ self.has_next_page = result['hasNextPage']
105
+ if 'totalItemsCount' in result:
106
+ self.items_count = result['totalItemsCount']
107
+ if 'totalPagesCount' in result:
108
+ self.total_pages_count = result['totalPagesCount']
109
+ if 'items' in result:
110
+ items = self.items_repository._build_entities_from_response(response_items=result['items'])
111
+ else:
112
+ items = miscellaneous.List(list())
113
+ return items
114
+
115
+ def __getitem__(self, y: int) -> List[Any]:
116
+ # If we're already on the requested page, return current items
117
+ if y == self.page_offset:
118
+ return self.items
119
+ # Otherwise, go to the requested page
120
+ self.go_to_page(y)
121
+ return self.items
122
+
123
+ def __len__(self) -> int:
124
+ return self.items_count
125
+
126
+ def __iter__(self):
127
+ # Use keyset/cursor-based pagination for iteration when possible
128
+ self.last_seen_id = None
129
+ self.page_offset = 0 # Start from the first page for iteration
130
+ self.use_id_based_paging = self._should_use_keyset_pagination()
131
+ self.has_next_page = True # Start with assumption that there are more pages
132
+ self.page_size = self.page_size or 100
133
+ pbar = tqdm.tqdm(total=self.items_count,
134
+ disable=self._client_api.verbose.disable_progress_bar_iterate_pages,
135
+ file=sys.stdout, desc="Iterate Pages")
136
+
137
+ # Get the first page
138
+ self.get_page()
139
+ if self.items:
140
+ yield self.items
141
+ pbar.update()
142
+
143
+ # Continue with next pages
144
+ while self.has_next_page:
145
+ if self.use_id_based_paging:
146
+ # For keyset pagination, just get the next page
147
+ self.page_offset = 0
148
+ self.get_page()
149
+ else:
150
+ # For offset pagination, increment the offset
151
+ self.page_offset += 1
152
+ self.get_page()
153
+
154
+ if not self.items:
155
+ break
156
+ yield self.items
157
+ pbar.update()
158
+ pbar.close()
159
+
160
+ def __reversed__(self):
161
+ # Force offset-based pagination for reverse iteration
162
+ self.use_id_based_paging = False
163
+ self.page_offset = self.total_pages_count - 1
164
+ while True:
165
+ self.get_page()
166
+ yield self.items
167
+ if self.page_offset == 0:
168
+ break
169
+ self.page_offset -= 1
170
+
171
+ def return_page(self, page_offset: Optional[int] = None, page_size: Optional[int] = None) -> List[Any]:
172
+ """
173
+ Return a page of results using offset-based pagination by default.
174
+ Switches to keyset/cursor-based pagination when supported and beneficial.
175
+ :param page_offset: page offset (for offset-based)
176
+ :param page_size: page size
177
+ :return: list of items
178
+ """
179
+ if page_size is not None:
180
+ self.page_size = page_size
181
+ if page_offset is not None:
182
+ self.page_offset = page_offset
183
+
184
+ if self.filters is None:
185
+ raise ValueError("Can't return page. Filters is empty")
186
+ self.filters.page_size = self.page_size
187
+ self.filters.page = self.page_offset
188
+ req = copy.deepcopy(self.filters)
189
+
190
+ # Determine pagination method based on page offset and resource type
191
+ self.use_id_based_paging = self._should_use_keyset_pagination()
192
+
193
+ if self.use_id_based_paging:
194
+ # Use keyset/cursor-based pagination
195
+ prepared = req.prepare()
196
+ sort_spec = prepared.get("sort", {})
197
+ order = next(iter(sort_spec.values()), None)
198
+ if order is None:
199
+ order = FiltersOrderByDirection.ASCENDING
200
+ if order == FiltersOrderByDirection.DESCENDING:
201
+ operator_value = FiltersOperations.LESS_THAN
202
+ else:
203
+ operator_value = FiltersOperations.GREATER_THAN
204
+
205
+ req.sort_by(field="id", value=order)
206
+ req.page = 0 # always fetch from the start for keyset
207
+ # Only add last_seen_id filter if we're not explicitly requesting page 0
208
+ if self.last_seen_id:
209
+ req.add(
210
+ field="id",
211
+ values=self.last_seen_id,
212
+ operator=operator_value,
213
+ method=FiltersOperations.AND,
214
+ )
215
+
216
+ # Fetch data
217
+ if self._list_function is None:
218
+ result = self.items_repository._list(filters=req)
219
+ else:
220
+ result = self._list_function(filters=req)
221
+
222
+ items = self.process_result(result)
223
+
224
+ # Update last_seen_id for keyset
225
+ if self.use_id_based_paging and items and hasattr(items[-1], "id"):
226
+ self.last_seen_id = items[-1].id
227
+ elif self.use_id_based_paging and not items:
228
+ self.last_seen_id = None
229
+ return items
230
+
231
+ def get_page(self, page_offset: Optional[int] = None, page_size: Optional[int] = None) -> None:
232
+ """
233
+ Get a page of results and update self.items.
234
+ :param page_offset: page offset (for offset-based)
235
+ :param page_size: page size
236
+ """
237
+ items = self.return_page(page_offset=page_offset, page_size=page_size)
238
+ self.items = items
239
+
240
+ def next_page(self) -> None:
241
+ """
242
+ Brings the next page of items from host.
243
+ """
244
+ if self.use_id_based_paging:
245
+ # For keyset pagination, just get the next page
246
+ self.get_page()
247
+ else:
248
+ # For offset pagination, increment the offset
249
+ self.page_offset += 1
250
+ self.get_page()
251
+
252
+ def prev_page(self) -> None:
253
+ """
254
+ Brings the previous page of items from host.
255
+ Only works with offset-based pagination.
256
+ """
257
+ if self.use_id_based_paging:
258
+ raise NotImplementedError("prev_page is not supported for keyset pagination.")
259
+ self.page_offset -= 1
260
+ self.get_page()
261
+
262
+ def go_to_page(self, page: int = 0) -> None:
263
+ """
264
+ Brings specified page of items from host.
265
+ For page 0, uses keyset pagination if supported.
266
+ For other pages, uses offset-based pagination.
267
+ :param page: page number
268
+ """
269
+ # Reset last_seen_id when going to page 0 to ensure we get all items
270
+ if page == 0:
271
+ self.last_seen_id = None
272
+ self.page_offset = page
273
+ self.get_page()
274
+
275
+ def all(self):
276
+ """
277
+ Iterate over all items in all pages efficiently.
278
+ Uses the iterator implementation (__iter__).
279
+ """
280
+ for items in self:
281
+ for item in items:
282
+ yield item
283
+
284
+ ########
285
+ # misc #
286
+ ########
287
+ def print(self, columns=None):
288
+ self.items.print(columns=columns)
289
+
290
+ def to_df(self, columns=None):
268
291
  return self.items.to_df(columns=columns)