deltacat 2.0.0b11__py3-none-any.whl → 2.0.0b12__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (194) hide show
  1. deltacat/__init__.py +78 -3
  2. deltacat/api.py +122 -67
  3. deltacat/aws/constants.py +0 -23
  4. deltacat/aws/s3u.py +4 -631
  5. deltacat/benchmarking/conftest.py +0 -18
  6. deltacat/catalog/__init__.py +2 -0
  7. deltacat/catalog/delegate.py +445 -63
  8. deltacat/catalog/interface.py +188 -62
  9. deltacat/catalog/main/impl.py +2417 -271
  10. deltacat/catalog/model/catalog.py +49 -10
  11. deltacat/catalog/model/properties.py +38 -0
  12. deltacat/compute/compactor/compaction_session.py +97 -75
  13. deltacat/compute/compactor/model/compact_partition_params.py +75 -30
  14. deltacat/compute/compactor/model/compaction_session_audit_info.py +17 -0
  15. deltacat/compute/compactor/model/round_completion_info.py +16 -6
  16. deltacat/compute/compactor/repartition_session.py +8 -21
  17. deltacat/compute/compactor/steps/hash_bucket.py +5 -5
  18. deltacat/compute/compactor/steps/materialize.py +9 -7
  19. deltacat/compute/compactor/steps/repartition.py +12 -11
  20. deltacat/compute/compactor/utils/io.py +6 -5
  21. deltacat/compute/compactor/utils/round_completion_reader.py +117 -0
  22. deltacat/compute/compactor/utils/system_columns.py +3 -1
  23. deltacat/compute/compactor_v2/compaction_session.py +17 -14
  24. deltacat/compute/compactor_v2/constants.py +30 -1
  25. deltacat/compute/compactor_v2/model/evaluate_compaction_result.py +0 -1
  26. deltacat/compute/compactor_v2/model/hash_bucket_input.py +9 -3
  27. deltacat/compute/compactor_v2/model/merge_file_group.py +5 -2
  28. deltacat/compute/compactor_v2/model/merge_input.py +33 -8
  29. deltacat/compute/compactor_v2/private/compaction_utils.py +167 -68
  30. deltacat/compute/compactor_v2/steps/hash_bucket.py +5 -2
  31. deltacat/compute/compactor_v2/steps/merge.py +267 -55
  32. deltacat/compute/compactor_v2/utils/content_type_params.py +34 -6
  33. deltacat/compute/compactor_v2/utils/dedupe.py +1 -1
  34. deltacat/compute/compactor_v2/utils/delta.py +5 -3
  35. deltacat/compute/compactor_v2/utils/io.py +11 -4
  36. deltacat/compute/compactor_v2/utils/merge.py +15 -2
  37. deltacat/compute/compactor_v2/utils/primary_key_index.py +28 -4
  38. deltacat/compute/compactor_v2/utils/task_options.py +45 -33
  39. deltacat/compute/converter/converter_session.py +145 -32
  40. deltacat/compute/converter/model/convert_input.py +26 -19
  41. deltacat/compute/converter/model/convert_input_files.py +33 -16
  42. deltacat/compute/converter/model/convert_result.py +35 -16
  43. deltacat/compute/converter/model/converter_session_params.py +24 -21
  44. deltacat/compute/converter/pyiceberg/catalog.py +21 -18
  45. deltacat/compute/converter/pyiceberg/overrides.py +18 -9
  46. deltacat/compute/converter/pyiceberg/update_snapshot_overrides.py +148 -100
  47. deltacat/compute/converter/steps/convert.py +157 -50
  48. deltacat/compute/converter/steps/dedupe.py +24 -11
  49. deltacat/compute/converter/utils/convert_task_options.py +27 -12
  50. deltacat/compute/converter/utils/converter_session_utils.py +126 -60
  51. deltacat/compute/converter/utils/iceberg_columns.py +8 -8
  52. deltacat/compute/converter/utils/io.py +101 -12
  53. deltacat/compute/converter/utils/s3u.py +33 -27
  54. deltacat/compute/janitor.py +205 -0
  55. deltacat/compute/jobs/client.py +19 -8
  56. deltacat/compute/resource_estimation/delta.py +38 -6
  57. deltacat/compute/resource_estimation/model.py +8 -0
  58. deltacat/constants.py +44 -0
  59. deltacat/docs/autogen/schema/__init__.py +0 -0
  60. deltacat/docs/autogen/schema/inference/__init__.py +0 -0
  61. deltacat/docs/autogen/schema/inference/generate_type_mappings.py +687 -0
  62. deltacat/docs/autogen/schema/inference/parse_json_type_mappings.py +673 -0
  63. deltacat/examples/compactor/__init__.py +0 -0
  64. deltacat/examples/compactor/aws/__init__.py +1 -0
  65. deltacat/examples/compactor/bootstrap.py +863 -0
  66. deltacat/examples/compactor/compactor.py +373 -0
  67. deltacat/examples/compactor/explorer.py +473 -0
  68. deltacat/examples/compactor/gcp/__init__.py +1 -0
  69. deltacat/examples/compactor/job_runner.py +439 -0
  70. deltacat/examples/compactor/utils/__init__.py +1 -0
  71. deltacat/examples/compactor/utils/common.py +261 -0
  72. deltacat/examples/experimental/iceberg/converter/__init__.py +0 -0
  73. deltacat/examples/experimental/iceberg/converter/beam/__init__.py +0 -0
  74. deltacat/examples/experimental/iceberg/converter/beam/app.py +226 -0
  75. deltacat/examples/experimental/iceberg/converter/beam/main.py +133 -0
  76. deltacat/examples/experimental/iceberg/converter/beam/test_workflow.py +113 -0
  77. deltacat/examples/experimental/iceberg/converter/beam/utils/__init__.py +3 -0
  78. deltacat/examples/experimental/iceberg/converter/beam/utils/common.py +174 -0
  79. deltacat/examples/experimental/iceberg/converter/beam/utils/spark.py +263 -0
  80. deltacat/exceptions.py +66 -4
  81. deltacat/experimental/catalog/iceberg/impl.py +2 -2
  82. deltacat/experimental/compatibility/__init__.py +0 -0
  83. deltacat/experimental/compatibility/backfill_locator_to_id_mappings.py +201 -0
  84. deltacat/experimental/converter_agent/__init__.py +0 -0
  85. deltacat/experimental/converter_agent/beam/__init__.py +0 -0
  86. deltacat/experimental/converter_agent/beam/managed.py +173 -0
  87. deltacat/experimental/converter_agent/table_monitor.py +479 -0
  88. deltacat/experimental/storage/iceberg/iceberg_scan_planner.py +105 -4
  89. deltacat/experimental/storage/iceberg/impl.py +5 -3
  90. deltacat/experimental/storage/iceberg/model.py +7 -3
  91. deltacat/experimental/storage/iceberg/visitor.py +119 -0
  92. deltacat/experimental/storage/rivulet/dataset.py +0 -3
  93. deltacat/experimental/storage/rivulet/metastore/delta.py +0 -2
  94. deltacat/experimental/storage/rivulet/reader/dataset_metastore.py +3 -2
  95. deltacat/io/datasource/deltacat_datasource.py +0 -1
  96. deltacat/storage/__init__.py +20 -2
  97. deltacat/storage/interface.py +54 -32
  98. deltacat/storage/main/impl.py +1494 -541
  99. deltacat/storage/model/delta.py +27 -3
  100. deltacat/storage/model/locator.py +6 -12
  101. deltacat/storage/model/manifest.py +182 -6
  102. deltacat/storage/model/metafile.py +151 -78
  103. deltacat/storage/model/namespace.py +8 -1
  104. deltacat/storage/model/partition.py +117 -42
  105. deltacat/storage/model/schema.py +2427 -159
  106. deltacat/storage/model/sort_key.py +40 -0
  107. deltacat/storage/model/stream.py +9 -2
  108. deltacat/storage/model/table.py +12 -1
  109. deltacat/storage/model/table_version.py +11 -0
  110. deltacat/storage/model/transaction.py +1184 -208
  111. deltacat/storage/model/transform.py +81 -2
  112. deltacat/storage/model/types.py +48 -26
  113. deltacat/tests/_io/test_cloudpickle_bug_fix.py +8 -4
  114. deltacat/tests/aws/test_s3u.py +2 -31
  115. deltacat/tests/catalog/main/test_catalog_impl_table_operations.py +1606 -70
  116. deltacat/tests/catalog/test_catalogs.py +54 -11
  117. deltacat/tests/catalog/test_default_catalog_impl.py +12152 -71
  118. deltacat/tests/compute/compact_partition_test_cases.py +35 -8
  119. deltacat/tests/compute/compactor/steps/test_repartition.py +12 -12
  120. deltacat/tests/compute/compactor/utils/test_io.py +124 -120
  121. deltacat/tests/compute/compactor/utils/test_round_completion_reader.py +254 -0
  122. deltacat/tests/compute/compactor_v2/test_compaction_session.py +423 -312
  123. deltacat/tests/compute/compactor_v2/utils/test_content_type_params.py +266 -0
  124. deltacat/tests/compute/compactor_v2/utils/test_primary_key_index.py +45 -0
  125. deltacat/tests/compute/compactor_v2/utils/test_task_options.py +270 -1
  126. deltacat/tests/compute/conftest.py +8 -44
  127. deltacat/tests/compute/converter/test_convert_session.py +675 -490
  128. deltacat/tests/compute/converter/utils.py +15 -6
  129. deltacat/tests/compute/resource_estimation/test_delta.py +145 -79
  130. deltacat/tests/compute/test_compact_partition_incremental.py +103 -70
  131. deltacat/tests/compute/test_compact_partition_multiple_rounds.py +89 -66
  132. deltacat/tests/compute/test_compact_partition_params.py +13 -8
  133. deltacat/tests/compute/test_compact_partition_rebase.py +77 -62
  134. deltacat/tests/compute/test_compact_partition_rebase_then_incremental.py +263 -193
  135. deltacat/tests/compute/test_janitor.py +236 -0
  136. deltacat/tests/compute/test_util_common.py +716 -43
  137. deltacat/tests/compute/test_util_constant.py +0 -1
  138. deltacat/tests/{storage/conftest.py → conftest.py} +1 -1
  139. deltacat/tests/experimental/__init__.py +1 -0
  140. deltacat/tests/experimental/compatibility/__init__.py +1 -0
  141. deltacat/tests/experimental/compatibility/test_backfill_locator_to_id_mappings.py +582 -0
  142. deltacat/tests/storage/main/test_main_storage.py +6900 -95
  143. deltacat/tests/storage/model/test_metafile_io.py +78 -173
  144. deltacat/tests/storage/model/test_partition_scheme.py +85 -0
  145. deltacat/tests/storage/model/test_schema.py +171 -0
  146. deltacat/tests/storage/model/test_schema_update.py +1925 -0
  147. deltacat/tests/storage/model/test_sort_scheme.py +90 -0
  148. deltacat/tests/storage/model/test_transaction.py +393 -48
  149. deltacat/tests/storage/model/test_transaction_history.py +886 -0
  150. deltacat/tests/test_deltacat_api.py +988 -4
  151. deltacat/tests/test_exceptions.py +9 -5
  152. deltacat/tests/test_utils/pyarrow.py +52 -21
  153. deltacat/tests/test_utils/storage.py +23 -34
  154. deltacat/tests/types/__init__.py +0 -0
  155. deltacat/tests/types/test_tables.py +104 -0
  156. deltacat/tests/utils/exceptions.py +22 -0
  157. deltacat/tests/utils/main_deltacat_storage_mock.py +31 -0
  158. deltacat/tests/utils/ray_utils/test_dataset.py +123 -5
  159. deltacat/tests/utils/test_daft.py +121 -31
  160. deltacat/tests/utils/test_numpy.py +1193 -0
  161. deltacat/tests/utils/test_pandas.py +1106 -0
  162. deltacat/tests/utils/test_polars.py +1040 -0
  163. deltacat/tests/utils/test_pyarrow.py +1370 -89
  164. deltacat/types/media.py +221 -11
  165. deltacat/types/tables.py +2329 -59
  166. deltacat/utils/arguments.py +33 -1
  167. deltacat/utils/daft.py +411 -150
  168. deltacat/utils/filesystem.py +100 -0
  169. deltacat/utils/metafile_locator.py +2 -1
  170. deltacat/utils/numpy.py +118 -26
  171. deltacat/utils/pandas.py +577 -48
  172. deltacat/utils/polars.py +658 -27
  173. deltacat/utils/pyarrow.py +1258 -213
  174. deltacat/utils/ray_utils/dataset.py +101 -10
  175. deltacat/utils/reader_compatibility_mapping.py +3083 -0
  176. deltacat/utils/url.py +56 -15
  177. deltacat-2.0.0b12.dist-info/METADATA +1163 -0
  178. {deltacat-2.0.0b11.dist-info → deltacat-2.0.0b12.dist-info}/RECORD +183 -145
  179. {deltacat-2.0.0b11.dist-info → deltacat-2.0.0b12.dist-info}/WHEEL +1 -1
  180. deltacat/compute/compactor/utils/round_completion_file.py +0 -97
  181. deltacat/compute/merge_on_read/__init__.py +0 -4
  182. deltacat/compute/merge_on_read/daft.py +0 -40
  183. deltacat/compute/merge_on_read/model/merge_on_read_params.py +0 -66
  184. deltacat/compute/merge_on_read/utils/delta.py +0 -42
  185. deltacat/tests/compute/compactor/utils/test_round_completion_file.py +0 -231
  186. deltacat/tests/compute/test_util_create_table_deltas_repo.py +0 -388
  187. deltacat/tests/local_deltacat_storage/__init__.py +0 -1236
  188. deltacat/tests/local_deltacat_storage/exceptions.py +0 -10
  189. deltacat/utils/s3fs.py +0 -21
  190. deltacat-2.0.0b11.dist-info/METADATA +0 -67
  191. /deltacat/{compute/merge_on_read/model → docs}/__init__.py +0 -0
  192. /deltacat/{compute/merge_on_read/utils → docs/autogen}/__init__.py +0 -0
  193. {deltacat-2.0.0b11.dist-info → deltacat-2.0.0b12.dist-info/licenses}/LICENSE +0 -0
  194. {deltacat-2.0.0b11.dist-info → deltacat-2.0.0b12.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,3083 @@
1
+ """
2
+ Reader compatibility mapping generated from test results.
3
+
4
+ This mapping shows which DatasetType readers can successfully read data
5
+ written by each (arrow_type, writer_dataset_type, content_type) combination.
6
+
7
+ Keys: (arrow_type, writer_dataset_type, content_type)
8
+ Values: List of compatible DatasetType enum values
9
+ """
10
+
11
+ from deltacat.types.tables import DatasetType
12
+
13
+ # Mapping of (arrow_type, writer_dataset_type, content_type) -> list of compatible readers
14
+ READER_COMPATIBILITY_MAPPING = {
15
+ ("binary", "daft", "application/parquet"): [
16
+ DatasetType.DAFT,
17
+ DatasetType.PANDAS,
18
+ DatasetType.POLARS,
19
+ DatasetType.PYARROW,
20
+ DatasetType.RAY_DATASET,
21
+ ],
22
+ ("binary", "pandas", "application/avro"): [
23
+ DatasetType.PANDAS,
24
+ DatasetType.POLARS,
25
+ DatasetType.PYARROW,
26
+ DatasetType.RAY_DATASET,
27
+ ],
28
+ ("binary", "pandas", "application/feather"): [
29
+ DatasetType.PANDAS,
30
+ DatasetType.POLARS,
31
+ DatasetType.PYARROW,
32
+ DatasetType.RAY_DATASET,
33
+ ],
34
+ ("binary", "pandas", "application/orc"): [
35
+ DatasetType.PANDAS,
36
+ DatasetType.POLARS,
37
+ DatasetType.PYARROW,
38
+ DatasetType.RAY_DATASET,
39
+ ],
40
+ ("binary", "pandas", "application/parquet"): [
41
+ DatasetType.DAFT,
42
+ DatasetType.PANDAS,
43
+ DatasetType.POLARS,
44
+ DatasetType.PYARROW,
45
+ DatasetType.RAY_DATASET,
46
+ ],
47
+ ("binary", "polars", "application/avro"): [
48
+ DatasetType.PANDAS,
49
+ DatasetType.POLARS,
50
+ DatasetType.PYARROW,
51
+ DatasetType.RAY_DATASET,
52
+ ],
53
+ ("binary", "polars", "application/feather"): [
54
+ DatasetType.PANDAS,
55
+ DatasetType.POLARS,
56
+ ],
57
+ ("binary", "polars", "application/orc"): [
58
+ DatasetType.PANDAS,
59
+ DatasetType.POLARS,
60
+ DatasetType.PYARROW,
61
+ DatasetType.RAY_DATASET,
62
+ ],
63
+ ("binary", "polars", "application/parquet"): [
64
+ DatasetType.DAFT,
65
+ DatasetType.PANDAS,
66
+ DatasetType.POLARS,
67
+ DatasetType.PYARROW,
68
+ DatasetType.RAY_DATASET,
69
+ ],
70
+ ("binary", "pyarrow", "application/avro"): [
71
+ DatasetType.PANDAS,
72
+ DatasetType.POLARS,
73
+ DatasetType.PYARROW,
74
+ DatasetType.RAY_DATASET,
75
+ ],
76
+ ("binary", "pyarrow", "application/feather"): [
77
+ DatasetType.PANDAS,
78
+ DatasetType.POLARS,
79
+ DatasetType.PYARROW,
80
+ DatasetType.RAY_DATASET,
81
+ ],
82
+ ("binary", "pyarrow", "application/orc"): [
83
+ DatasetType.PANDAS,
84
+ DatasetType.POLARS,
85
+ DatasetType.PYARROW,
86
+ DatasetType.RAY_DATASET,
87
+ ],
88
+ ("binary", "pyarrow", "application/parquet"): [
89
+ DatasetType.DAFT,
90
+ DatasetType.PANDAS,
91
+ DatasetType.POLARS,
92
+ DatasetType.PYARROW,
93
+ DatasetType.RAY_DATASET,
94
+ ],
95
+ ("binary", "ray_dataset", "application/parquet"): [
96
+ DatasetType.DAFT,
97
+ DatasetType.PANDAS,
98
+ DatasetType.POLARS,
99
+ DatasetType.PYARROW,
100
+ DatasetType.RAY_DATASET,
101
+ ],
102
+ ("bool", "daft", "application/parquet"): [
103
+ DatasetType.DAFT,
104
+ DatasetType.PANDAS,
105
+ DatasetType.POLARS,
106
+ DatasetType.PYARROW,
107
+ DatasetType.RAY_DATASET,
108
+ ],
109
+ ("bool", "pandas", "application/avro"): [
110
+ DatasetType.PANDAS,
111
+ DatasetType.POLARS,
112
+ DatasetType.PYARROW,
113
+ DatasetType.RAY_DATASET,
114
+ ],
115
+ ("bool", "pandas", "application/feather"): [
116
+ DatasetType.PANDAS,
117
+ DatasetType.POLARS,
118
+ DatasetType.PYARROW,
119
+ DatasetType.RAY_DATASET,
120
+ ],
121
+ ("bool", "pandas", "application/orc"): [
122
+ DatasetType.PANDAS,
123
+ DatasetType.POLARS,
124
+ DatasetType.PYARROW,
125
+ DatasetType.RAY_DATASET,
126
+ ],
127
+ ("bool", "pandas", "application/parquet"): [
128
+ DatasetType.DAFT,
129
+ DatasetType.PANDAS,
130
+ DatasetType.POLARS,
131
+ DatasetType.PYARROW,
132
+ DatasetType.RAY_DATASET,
133
+ ],
134
+ ("bool", "polars", "application/avro"): [
135
+ DatasetType.PANDAS,
136
+ DatasetType.POLARS,
137
+ DatasetType.PYARROW,
138
+ DatasetType.RAY_DATASET,
139
+ ],
140
+ ("bool", "polars", "application/feather"): [
141
+ DatasetType.PANDAS,
142
+ DatasetType.POLARS,
143
+ DatasetType.PYARROW,
144
+ DatasetType.RAY_DATASET,
145
+ ],
146
+ ("bool", "polars", "application/orc"): [
147
+ DatasetType.PANDAS,
148
+ DatasetType.POLARS,
149
+ DatasetType.PYARROW,
150
+ DatasetType.RAY_DATASET,
151
+ ],
152
+ ("bool", "polars", "application/parquet"): [
153
+ DatasetType.DAFT,
154
+ DatasetType.PANDAS,
155
+ DatasetType.POLARS,
156
+ DatasetType.PYARROW,
157
+ DatasetType.RAY_DATASET,
158
+ ],
159
+ ("bool", "pyarrow", "application/avro"): [
160
+ DatasetType.PANDAS,
161
+ DatasetType.POLARS,
162
+ DatasetType.PYARROW,
163
+ DatasetType.RAY_DATASET,
164
+ ],
165
+ ("bool", "pyarrow", "application/feather"): [
166
+ DatasetType.PANDAS,
167
+ DatasetType.POLARS,
168
+ DatasetType.PYARROW,
169
+ DatasetType.RAY_DATASET,
170
+ ],
171
+ ("bool", "pyarrow", "application/orc"): [
172
+ DatasetType.PANDAS,
173
+ DatasetType.POLARS,
174
+ DatasetType.PYARROW,
175
+ DatasetType.RAY_DATASET,
176
+ ],
177
+ ("bool", "pyarrow", "application/parquet"): [
178
+ DatasetType.DAFT,
179
+ DatasetType.PANDAS,
180
+ DatasetType.POLARS,
181
+ DatasetType.PYARROW,
182
+ DatasetType.RAY_DATASET,
183
+ ],
184
+ ("bool", "ray_dataset", "application/parquet"): [
185
+ DatasetType.DAFT,
186
+ DatasetType.PANDAS,
187
+ DatasetType.POLARS,
188
+ DatasetType.PYARROW,
189
+ DatasetType.RAY_DATASET,
190
+ ],
191
+ ("date32[day]", "daft", "application/parquet"): [
192
+ DatasetType.DAFT,
193
+ DatasetType.PANDAS,
194
+ DatasetType.POLARS,
195
+ DatasetType.PYARROW,
196
+ DatasetType.RAY_DATASET,
197
+ ],
198
+ ("date32[day]", "pandas", "application/avro"): [
199
+ DatasetType.PANDAS,
200
+ DatasetType.POLARS,
201
+ DatasetType.PYARROW,
202
+ DatasetType.RAY_DATASET,
203
+ ],
204
+ ("date32[day]", "pandas", "application/feather"): [
205
+ DatasetType.PANDAS,
206
+ DatasetType.POLARS,
207
+ DatasetType.PYARROW,
208
+ DatasetType.RAY_DATASET,
209
+ ],
210
+ ("date32[day]", "pandas", "application/orc"): [
211
+ DatasetType.PANDAS,
212
+ DatasetType.POLARS,
213
+ DatasetType.PYARROW,
214
+ DatasetType.RAY_DATASET,
215
+ ],
216
+ ("date32[day]", "pandas", "application/parquet"): [
217
+ DatasetType.DAFT,
218
+ DatasetType.PANDAS,
219
+ DatasetType.POLARS,
220
+ DatasetType.PYARROW,
221
+ DatasetType.RAY_DATASET,
222
+ ],
223
+ ("date32[day]", "polars", "application/avro"): [
224
+ DatasetType.PANDAS,
225
+ DatasetType.POLARS,
226
+ DatasetType.PYARROW,
227
+ DatasetType.RAY_DATASET,
228
+ ],
229
+ ("date32[day]", "polars", "application/feather"): [
230
+ DatasetType.PANDAS,
231
+ DatasetType.POLARS,
232
+ DatasetType.PYARROW,
233
+ DatasetType.RAY_DATASET,
234
+ ],
235
+ ("date32[day]", "polars", "application/orc"): [
236
+ DatasetType.PANDAS,
237
+ DatasetType.POLARS,
238
+ DatasetType.PYARROW,
239
+ DatasetType.RAY_DATASET,
240
+ ],
241
+ ("date32[day]", "polars", "application/parquet"): [
242
+ DatasetType.DAFT,
243
+ DatasetType.PANDAS,
244
+ DatasetType.POLARS,
245
+ DatasetType.PYARROW,
246
+ DatasetType.RAY_DATASET,
247
+ ],
248
+ ("date32[day]", "pyarrow", "application/avro"): [
249
+ DatasetType.PANDAS,
250
+ DatasetType.POLARS,
251
+ DatasetType.PYARROW,
252
+ DatasetType.RAY_DATASET,
253
+ ],
254
+ ("date32[day]", "pyarrow", "application/feather"): [
255
+ DatasetType.PANDAS,
256
+ DatasetType.POLARS,
257
+ DatasetType.PYARROW,
258
+ DatasetType.RAY_DATASET,
259
+ ],
260
+ ("date32[day]", "pyarrow", "application/orc"): [
261
+ DatasetType.PANDAS,
262
+ DatasetType.POLARS,
263
+ DatasetType.PYARROW,
264
+ DatasetType.RAY_DATASET,
265
+ ],
266
+ ("date32[day]", "pyarrow", "application/parquet"): [
267
+ DatasetType.DAFT,
268
+ DatasetType.PANDAS,
269
+ DatasetType.POLARS,
270
+ DatasetType.PYARROW,
271
+ DatasetType.RAY_DATASET,
272
+ ],
273
+ ("date32[day]", "ray_dataset", "application/parquet"): [
274
+ DatasetType.DAFT,
275
+ DatasetType.PANDAS,
276
+ DatasetType.POLARS,
277
+ DatasetType.PYARROW,
278
+ DatasetType.RAY_DATASET,
279
+ ],
280
+ ("date64[ms]", "daft", "application/parquet"): [
281
+ DatasetType.DAFT,
282
+ DatasetType.PANDAS,
283
+ DatasetType.POLARS,
284
+ DatasetType.PYARROW,
285
+ DatasetType.RAY_DATASET,
286
+ ],
287
+ ("date64[ms]", "pandas", "application/avro"): [
288
+ DatasetType.PANDAS,
289
+ DatasetType.POLARS,
290
+ DatasetType.PYARROW,
291
+ DatasetType.RAY_DATASET,
292
+ ],
293
+ ("date64[ms]", "pandas", "application/feather"): [
294
+ DatasetType.PANDAS,
295
+ DatasetType.POLARS,
296
+ DatasetType.PYARROW,
297
+ DatasetType.RAY_DATASET,
298
+ ],
299
+ ("date64[ms]", "pandas", "application/orc"): [
300
+ DatasetType.PANDAS,
301
+ DatasetType.POLARS,
302
+ DatasetType.PYARROW,
303
+ DatasetType.RAY_DATASET,
304
+ ],
305
+ ("date64[ms]", "pandas", "application/parquet"): [
306
+ DatasetType.DAFT,
307
+ DatasetType.PANDAS,
308
+ DatasetType.POLARS,
309
+ DatasetType.PYARROW,
310
+ DatasetType.RAY_DATASET,
311
+ ],
312
+ ("date64[ms]", "polars", "application/avro"): [
313
+ DatasetType.PANDAS,
314
+ DatasetType.POLARS,
315
+ DatasetType.PYARROW,
316
+ DatasetType.RAY_DATASET,
317
+ ],
318
+ ("date64[ms]", "polars", "application/feather"): [
319
+ DatasetType.PANDAS,
320
+ DatasetType.POLARS,
321
+ DatasetType.PYARROW,
322
+ DatasetType.RAY_DATASET,
323
+ ],
324
+ ("date64[ms]", "polars", "application/orc"): [
325
+ DatasetType.PANDAS,
326
+ DatasetType.POLARS,
327
+ DatasetType.PYARROW,
328
+ DatasetType.RAY_DATASET,
329
+ ],
330
+ ("date64[ms]", "polars", "application/parquet"): [
331
+ DatasetType.DAFT,
332
+ DatasetType.PANDAS,
333
+ DatasetType.POLARS,
334
+ DatasetType.PYARROW,
335
+ DatasetType.RAY_DATASET,
336
+ ],
337
+ ("date64[ms]", "pyarrow", "application/avro"): [
338
+ DatasetType.PANDAS,
339
+ DatasetType.RAY_DATASET,
340
+ ],
341
+ ("date64[ms]", "pyarrow", "application/feather"): [
342
+ DatasetType.PANDAS,
343
+ DatasetType.PYARROW,
344
+ DatasetType.RAY_DATASET,
345
+ ],
346
+ ("date64[ms]", "pyarrow", "application/orc"): [
347
+ DatasetType.PANDAS,
348
+ DatasetType.RAY_DATASET,
349
+ ],
350
+ ("date64[ms]", "pyarrow", "application/parquet"): [
351
+ DatasetType.DAFT,
352
+ DatasetType.PANDAS,
353
+ DatasetType.PYARROW,
354
+ DatasetType.RAY_DATASET,
355
+ ],
356
+ ("decimal128", "daft", "application/parquet"): [
357
+ DatasetType.DAFT,
358
+ DatasetType.PANDAS,
359
+ DatasetType.POLARS,
360
+ DatasetType.PYARROW,
361
+ DatasetType.RAY_DATASET,
362
+ ],
363
+ ("decimal128", "pandas", "application/avro"): [
364
+ DatasetType.PANDAS,
365
+ DatasetType.POLARS,
366
+ DatasetType.PYARROW,
367
+ DatasetType.RAY_DATASET,
368
+ ],
369
+ ("decimal128", "pandas", "application/feather"): [
370
+ DatasetType.PANDAS,
371
+ DatasetType.POLARS,
372
+ DatasetType.PYARROW,
373
+ DatasetType.RAY_DATASET,
374
+ ],
375
+ ("decimal128", "pandas", "application/orc"): [
376
+ DatasetType.PANDAS,
377
+ DatasetType.POLARS,
378
+ DatasetType.PYARROW,
379
+ DatasetType.RAY_DATASET,
380
+ ],
381
+ ("decimal128", "pandas", "application/parquet"): [
382
+ DatasetType.DAFT,
383
+ DatasetType.PANDAS,
384
+ DatasetType.POLARS,
385
+ DatasetType.PYARROW,
386
+ DatasetType.RAY_DATASET,
387
+ ],
388
+ ("decimal128", "polars", "application/avro"): [
389
+ DatasetType.PANDAS,
390
+ DatasetType.POLARS,
391
+ DatasetType.PYARROW,
392
+ DatasetType.RAY_DATASET,
393
+ ],
394
+ ("decimal128", "polars", "application/feather"): [
395
+ DatasetType.PANDAS,
396
+ DatasetType.POLARS,
397
+ DatasetType.PYARROW,
398
+ DatasetType.RAY_DATASET,
399
+ ],
400
+ ("decimal128", "polars", "application/orc"): [
401
+ DatasetType.PANDAS,
402
+ DatasetType.POLARS,
403
+ DatasetType.PYARROW,
404
+ DatasetType.RAY_DATASET,
405
+ ],
406
+ ("decimal128", "polars", "application/parquet"): [
407
+ DatasetType.DAFT,
408
+ DatasetType.PANDAS,
409
+ DatasetType.POLARS,
410
+ DatasetType.PYARROW,
411
+ DatasetType.RAY_DATASET,
412
+ ],
413
+ ("decimal128", "pyarrow", "application/avro"): [
414
+ DatasetType.PANDAS,
415
+ DatasetType.POLARS,
416
+ DatasetType.PYARROW,
417
+ DatasetType.RAY_DATASET,
418
+ ],
419
+ ("decimal128", "pyarrow", "application/feather"): [
420
+ DatasetType.PANDAS,
421
+ DatasetType.POLARS,
422
+ DatasetType.PYARROW,
423
+ DatasetType.RAY_DATASET,
424
+ ],
425
+ ("decimal128", "pyarrow", "application/orc"): [
426
+ DatasetType.PANDAS,
427
+ DatasetType.POLARS,
428
+ DatasetType.PYARROW,
429
+ DatasetType.RAY_DATASET,
430
+ ],
431
+ ("decimal128", "pyarrow", "application/parquet"): [
432
+ DatasetType.DAFT,
433
+ DatasetType.PANDAS,
434
+ DatasetType.POLARS,
435
+ DatasetType.PYARROW,
436
+ DatasetType.RAY_DATASET,
437
+ ],
438
+ ("decimal128", "ray_dataset", "application/parquet"): [
439
+ DatasetType.DAFT,
440
+ DatasetType.PANDAS,
441
+ DatasetType.POLARS,
442
+ DatasetType.PYARROW,
443
+ DatasetType.RAY_DATASET,
444
+ ],
445
+ ("decimal256", "pandas", "application/avro"): [
446
+ DatasetType.PANDAS,
447
+ DatasetType.POLARS,
448
+ DatasetType.PYARROW,
449
+ DatasetType.RAY_DATASET,
450
+ ],
451
+ ("decimal256", "pandas", "application/feather"): [
452
+ DatasetType.PANDAS,
453
+ DatasetType.POLARS,
454
+ DatasetType.PYARROW,
455
+ DatasetType.RAY_DATASET,
456
+ ],
457
+ ("decimal256", "pandas", "application/orc"): [
458
+ DatasetType.PANDAS,
459
+ DatasetType.POLARS,
460
+ DatasetType.PYARROW,
461
+ DatasetType.RAY_DATASET,
462
+ ],
463
+ ("decimal256", "pandas", "application/parquet"): [
464
+ DatasetType.DAFT,
465
+ DatasetType.PANDAS,
466
+ DatasetType.POLARS,
467
+ DatasetType.PYARROW,
468
+ DatasetType.RAY_DATASET,
469
+ ],
470
+ ("decimal256", "pyarrow", "application/feather"): [
471
+ DatasetType.PANDAS,
472
+ DatasetType.PYARROW,
473
+ DatasetType.RAY_DATASET,
474
+ ],
475
+ ("decimal256", "pyarrow", "application/parquet"): [
476
+ DatasetType.DAFT,
477
+ DatasetType.PANDAS,
478
+ DatasetType.PYARROW,
479
+ DatasetType.RAY_DATASET,
480
+ ],
481
+ ("dictionary", "pandas", "application/feather"): [
482
+ DatasetType.PANDAS,
483
+ DatasetType.POLARS,
484
+ DatasetType.PYARROW,
485
+ DatasetType.RAY_DATASET,
486
+ ],
487
+ ("dictionary", "pandas", "application/parquet"): [
488
+ DatasetType.DAFT,
489
+ DatasetType.PANDAS,
490
+ DatasetType.POLARS,
491
+ DatasetType.PYARROW,
492
+ DatasetType.RAY_DATASET,
493
+ ],
494
+ ("dictionary", "polars", "application/feather"): [DatasetType.POLARS],
495
+ ("dictionary", "polars", "application/parquet"): [
496
+ DatasetType.DAFT,
497
+ DatasetType.POLARS,
498
+ DatasetType.PYARROW,
499
+ DatasetType.RAY_DATASET,
500
+ ],
501
+ ("dictionary", "pyarrow", "application/feather"): [
502
+ DatasetType.PANDAS,
503
+ DatasetType.POLARS,
504
+ DatasetType.PYARROW,
505
+ DatasetType.RAY_DATASET,
506
+ ],
507
+ ("dictionary", "pyarrow", "application/parquet"): [
508
+ DatasetType.DAFT,
509
+ DatasetType.PANDAS,
510
+ DatasetType.POLARS,
511
+ DatasetType.PYARROW,
512
+ DatasetType.RAY_DATASET,
513
+ ],
514
+ ("double", "daft", "application/parquet"): [
515
+ DatasetType.DAFT,
516
+ DatasetType.PANDAS,
517
+ DatasetType.POLARS,
518
+ DatasetType.PYARROW,
519
+ DatasetType.RAY_DATASET,
520
+ ],
521
+ ("double", "pandas", "application/avro"): [
522
+ DatasetType.PANDAS,
523
+ DatasetType.POLARS,
524
+ DatasetType.PYARROW,
525
+ DatasetType.RAY_DATASET,
526
+ ],
527
+ ("double", "pandas", "application/feather"): [
528
+ DatasetType.PANDAS,
529
+ DatasetType.POLARS,
530
+ DatasetType.PYARROW,
531
+ DatasetType.RAY_DATASET,
532
+ ],
533
+ ("double", "pandas", "application/orc"): [
534
+ DatasetType.PANDAS,
535
+ DatasetType.POLARS,
536
+ DatasetType.PYARROW,
537
+ DatasetType.RAY_DATASET,
538
+ ],
539
+ ("double", "pandas", "application/parquet"): [
540
+ DatasetType.DAFT,
541
+ DatasetType.PANDAS,
542
+ DatasetType.POLARS,
543
+ DatasetType.PYARROW,
544
+ DatasetType.RAY_DATASET,
545
+ ],
546
+ ("double", "polars", "application/avro"): [
547
+ DatasetType.PANDAS,
548
+ DatasetType.POLARS,
549
+ DatasetType.PYARROW,
550
+ DatasetType.RAY_DATASET,
551
+ ],
552
+ ("double", "polars", "application/feather"): [
553
+ DatasetType.PANDAS,
554
+ DatasetType.POLARS,
555
+ DatasetType.PYARROW,
556
+ DatasetType.RAY_DATASET,
557
+ ],
558
+ ("double", "polars", "application/orc"): [
559
+ DatasetType.PANDAS,
560
+ DatasetType.POLARS,
561
+ DatasetType.PYARROW,
562
+ DatasetType.RAY_DATASET,
563
+ ],
564
+ ("double", "polars", "application/parquet"): [
565
+ DatasetType.DAFT,
566
+ DatasetType.PANDAS,
567
+ DatasetType.POLARS,
568
+ DatasetType.PYARROW,
569
+ DatasetType.RAY_DATASET,
570
+ ],
571
+ ("double", "pyarrow", "application/avro"): [
572
+ DatasetType.PANDAS,
573
+ DatasetType.POLARS,
574
+ DatasetType.PYARROW,
575
+ DatasetType.RAY_DATASET,
576
+ ],
577
+ ("double", "pyarrow", "application/feather"): [
578
+ DatasetType.PANDAS,
579
+ DatasetType.POLARS,
580
+ DatasetType.PYARROW,
581
+ DatasetType.RAY_DATASET,
582
+ ],
583
+ ("double", "pyarrow", "application/orc"): [
584
+ DatasetType.PANDAS,
585
+ DatasetType.POLARS,
586
+ DatasetType.PYARROW,
587
+ DatasetType.RAY_DATASET,
588
+ ],
589
+ ("double", "pyarrow", "application/parquet"): [
590
+ DatasetType.DAFT,
591
+ DatasetType.PANDAS,
592
+ DatasetType.POLARS,
593
+ DatasetType.PYARROW,
594
+ DatasetType.RAY_DATASET,
595
+ ],
596
+ ("double", "ray_dataset", "application/parquet"): [
597
+ DatasetType.DAFT,
598
+ DatasetType.PANDAS,
599
+ DatasetType.POLARS,
600
+ DatasetType.PYARROW,
601
+ DatasetType.RAY_DATASET,
602
+ ],
603
+ ("duration[ms]", "daft", "application/parquet"): [
604
+ DatasetType.DAFT,
605
+ DatasetType.PANDAS,
606
+ DatasetType.POLARS,
607
+ DatasetType.PYARROW,
608
+ DatasetType.RAY_DATASET,
609
+ ],
610
+ ("duration[ms]", "pandas", "application/feather"): [
611
+ DatasetType.PANDAS,
612
+ DatasetType.POLARS,
613
+ DatasetType.PYARROW,
614
+ DatasetType.RAY_DATASET,
615
+ ],
616
+ ("duration[ms]", "pandas", "application/parquet"): [
617
+ DatasetType.DAFT,
618
+ DatasetType.PANDAS,
619
+ DatasetType.POLARS,
620
+ DatasetType.PYARROW,
621
+ DatasetType.RAY_DATASET,
622
+ ],
623
+ ("duration[ms]", "polars", "application/feather"): [
624
+ DatasetType.PANDAS,
625
+ DatasetType.POLARS,
626
+ DatasetType.PYARROW,
627
+ DatasetType.RAY_DATASET,
628
+ ],
629
+ ("duration[ms]", "polars", "application/parquet"): [
630
+ DatasetType.DAFT,
631
+ DatasetType.PANDAS,
632
+ DatasetType.POLARS,
633
+ DatasetType.PYARROW,
634
+ DatasetType.RAY_DATASET,
635
+ ],
636
+ ("duration[ms]", "pyarrow", "application/feather"): [
637
+ DatasetType.PANDAS,
638
+ DatasetType.POLARS,
639
+ DatasetType.PYARROW,
640
+ DatasetType.RAY_DATASET,
641
+ ],
642
+ ("duration[ms]", "pyarrow", "application/parquet"): [
643
+ DatasetType.DAFT,
644
+ DatasetType.PANDAS,
645
+ DatasetType.POLARS,
646
+ DatasetType.PYARROW,
647
+ DatasetType.RAY_DATASET,
648
+ ],
649
+ ("duration[ms]", "ray_dataset", "application/parquet"): [
650
+ DatasetType.DAFT,
651
+ DatasetType.PANDAS,
652
+ DatasetType.POLARS,
653
+ DatasetType.PYARROW,
654
+ DatasetType.RAY_DATASET,
655
+ ],
656
+ ("duration[ns]", "daft", "application/parquet"): [
657
+ DatasetType.DAFT,
658
+ DatasetType.PANDAS,
659
+ DatasetType.POLARS,
660
+ DatasetType.PYARROW,
661
+ DatasetType.RAY_DATASET,
662
+ ],
663
+ ("duration[ns]", "pandas", "application/feather"): [
664
+ DatasetType.PANDAS,
665
+ DatasetType.POLARS,
666
+ DatasetType.PYARROW,
667
+ DatasetType.RAY_DATASET,
668
+ ],
669
+ ("duration[ns]", "pandas", "application/parquet"): [
670
+ DatasetType.DAFT,
671
+ DatasetType.PANDAS,
672
+ DatasetType.POLARS,
673
+ DatasetType.PYARROW,
674
+ DatasetType.RAY_DATASET,
675
+ ],
676
+ ("duration[ns]", "polars", "application/feather"): [
677
+ DatasetType.PANDAS,
678
+ DatasetType.POLARS,
679
+ DatasetType.PYARROW,
680
+ DatasetType.RAY_DATASET,
681
+ ],
682
+ ("duration[ns]", "polars", "application/parquet"): [
683
+ DatasetType.DAFT,
684
+ DatasetType.PANDAS,
685
+ DatasetType.POLARS,
686
+ DatasetType.PYARROW,
687
+ DatasetType.RAY_DATASET,
688
+ ],
689
+ ("duration[ns]", "pyarrow", "application/feather"): [
690
+ DatasetType.PANDAS,
691
+ DatasetType.POLARS,
692
+ DatasetType.PYARROW,
693
+ DatasetType.RAY_DATASET,
694
+ ],
695
+ ("duration[ns]", "pyarrow", "application/parquet"): [
696
+ DatasetType.DAFT,
697
+ DatasetType.PANDAS,
698
+ DatasetType.POLARS,
699
+ DatasetType.PYARROW,
700
+ DatasetType.RAY_DATASET,
701
+ ],
702
+ ("duration[ns]", "ray_dataset", "application/parquet"): [
703
+ DatasetType.DAFT,
704
+ DatasetType.PANDAS,
705
+ DatasetType.POLARS,
706
+ DatasetType.PYARROW,
707
+ DatasetType.RAY_DATASET,
708
+ ],
709
+ ("duration[s]", "daft", "application/parquet"): [
710
+ DatasetType.DAFT,
711
+ DatasetType.PANDAS,
712
+ DatasetType.POLARS,
713
+ DatasetType.PYARROW,
714
+ DatasetType.RAY_DATASET,
715
+ ],
716
+ ("duration[s]", "pandas", "application/feather"): [
717
+ DatasetType.PANDAS,
718
+ DatasetType.POLARS,
719
+ DatasetType.PYARROW,
720
+ DatasetType.RAY_DATASET,
721
+ ],
722
+ ("duration[s]", "pandas", "application/parquet"): [
723
+ DatasetType.DAFT,
724
+ DatasetType.PANDAS,
725
+ DatasetType.POLARS,
726
+ DatasetType.PYARROW,
727
+ DatasetType.RAY_DATASET,
728
+ ],
729
+ ("duration[s]", "polars", "application/feather"): [
730
+ DatasetType.PANDAS,
731
+ DatasetType.POLARS,
732
+ DatasetType.PYARROW,
733
+ DatasetType.RAY_DATASET,
734
+ ],
735
+ ("duration[s]", "polars", "application/parquet"): [
736
+ DatasetType.DAFT,
737
+ DatasetType.PANDAS,
738
+ DatasetType.POLARS,
739
+ DatasetType.PYARROW,
740
+ DatasetType.RAY_DATASET,
741
+ ],
742
+ ("duration[s]", "pyarrow", "application/feather"): [
743
+ DatasetType.PANDAS,
744
+ DatasetType.POLARS,
745
+ DatasetType.PYARROW,
746
+ DatasetType.RAY_DATASET,
747
+ ],
748
+ ("duration[s]", "pyarrow", "application/parquet"): [
749
+ DatasetType.DAFT,
750
+ DatasetType.PANDAS,
751
+ DatasetType.POLARS,
752
+ DatasetType.PYARROW,
753
+ DatasetType.RAY_DATASET,
754
+ ],
755
+ ("duration[s]", "ray_dataset", "application/parquet"): [
756
+ DatasetType.DAFT,
757
+ DatasetType.PANDAS,
758
+ DatasetType.POLARS,
759
+ DatasetType.PYARROW,
760
+ DatasetType.RAY_DATASET,
761
+ ],
762
+ ("duration[us]", "daft", "application/parquet"): [
763
+ DatasetType.DAFT,
764
+ DatasetType.PANDAS,
765
+ DatasetType.POLARS,
766
+ DatasetType.PYARROW,
767
+ DatasetType.RAY_DATASET,
768
+ ],
769
+ ("duration[us]", "pandas", "application/feather"): [
770
+ DatasetType.PANDAS,
771
+ DatasetType.POLARS,
772
+ DatasetType.PYARROW,
773
+ DatasetType.RAY_DATASET,
774
+ ],
775
+ ("duration[us]", "pandas", "application/parquet"): [
776
+ DatasetType.DAFT,
777
+ DatasetType.PANDAS,
778
+ DatasetType.POLARS,
779
+ DatasetType.PYARROW,
780
+ DatasetType.RAY_DATASET,
781
+ ],
782
+ ("duration[us]", "polars", "application/feather"): [
783
+ DatasetType.PANDAS,
784
+ DatasetType.POLARS,
785
+ DatasetType.PYARROW,
786
+ DatasetType.RAY_DATASET,
787
+ ],
788
+ ("duration[us]", "polars", "application/parquet"): [
789
+ DatasetType.DAFT,
790
+ DatasetType.PANDAS,
791
+ DatasetType.POLARS,
792
+ DatasetType.PYARROW,
793
+ DatasetType.RAY_DATASET,
794
+ ],
795
+ ("duration[us]", "pyarrow", "application/feather"): [
796
+ DatasetType.PANDAS,
797
+ DatasetType.POLARS,
798
+ DatasetType.PYARROW,
799
+ DatasetType.RAY_DATASET,
800
+ ],
801
+ ("duration[us]", "pyarrow", "application/parquet"): [
802
+ DatasetType.DAFT,
803
+ DatasetType.PANDAS,
804
+ DatasetType.POLARS,
805
+ DatasetType.PYARROW,
806
+ DatasetType.RAY_DATASET,
807
+ ],
808
+ ("duration[us]", "ray_dataset", "application/parquet"): [
809
+ DatasetType.DAFT,
810
+ DatasetType.PANDAS,
811
+ DatasetType.POLARS,
812
+ DatasetType.PYARROW,
813
+ DatasetType.RAY_DATASET,
814
+ ],
815
+ ("fixed_shape_tensor", "daft", "application/parquet"): [
816
+ DatasetType.DAFT,
817
+ DatasetType.RAY_DATASET,
818
+ ],
819
+ ("fixed_shape_tensor", "pandas", "application/avro"): [
820
+ DatasetType.PANDAS,
821
+ DatasetType.POLARS,
822
+ DatasetType.PYARROW,
823
+ DatasetType.RAY_DATASET,
824
+ ],
825
+ ("fixed_shape_tensor", "pandas", "application/feather"): [
826
+ DatasetType.PANDAS,
827
+ DatasetType.POLARS,
828
+ DatasetType.PYARROW,
829
+ DatasetType.RAY_DATASET,
830
+ ],
831
+ ("fixed_shape_tensor", "pandas", "application/orc"): [
832
+ DatasetType.PANDAS,
833
+ DatasetType.POLARS,
834
+ DatasetType.PYARROW,
835
+ DatasetType.RAY_DATASET,
836
+ ],
837
+ ("fixed_shape_tensor", "pandas", "application/parquet"): [
838
+ DatasetType.DAFT,
839
+ DatasetType.PANDAS,
840
+ DatasetType.POLARS,
841
+ DatasetType.PYARROW,
842
+ DatasetType.RAY_DATASET,
843
+ ],
844
+ ("fixed_shape_tensor", "pyarrow", "application/feather"): [
845
+ DatasetType.PANDAS,
846
+ DatasetType.PYARROW,
847
+ DatasetType.RAY_DATASET,
848
+ ],
849
+ ("fixed_shape_tensor", "pyarrow", "application/parquet"): [
850
+ DatasetType.DAFT,
851
+ DatasetType.PANDAS,
852
+ DatasetType.PYARROW,
853
+ DatasetType.RAY_DATASET,
854
+ ],
855
+ ("fixed_shape_tensor", "ray_dataset", "application/parquet"): [
856
+ DatasetType.DAFT,
857
+ DatasetType.RAY_DATASET,
858
+ ],
859
+ ("fixed_size_list", "daft", "application/parquet"): [
860
+ DatasetType.DAFT,
861
+ DatasetType.PANDAS,
862
+ DatasetType.POLARS,
863
+ DatasetType.PYARROW,
864
+ DatasetType.RAY_DATASET,
865
+ ],
866
+ ("fixed_size_list", "pandas", "application/avro"): [
867
+ DatasetType.PANDAS,
868
+ DatasetType.POLARS,
869
+ DatasetType.PYARROW,
870
+ DatasetType.RAY_DATASET,
871
+ ],
872
+ ("fixed_size_list", "pandas", "application/feather"): [
873
+ DatasetType.PANDAS,
874
+ DatasetType.POLARS,
875
+ DatasetType.PYARROW,
876
+ DatasetType.RAY_DATASET,
877
+ ],
878
+ ("fixed_size_list", "pandas", "application/orc"): [
879
+ DatasetType.PANDAS,
880
+ DatasetType.POLARS,
881
+ DatasetType.PYARROW,
882
+ DatasetType.RAY_DATASET,
883
+ ],
884
+ ("fixed_size_list", "pandas", "application/parquet"): [
885
+ DatasetType.DAFT,
886
+ DatasetType.PANDAS,
887
+ DatasetType.POLARS,
888
+ DatasetType.PYARROW,
889
+ DatasetType.RAY_DATASET,
890
+ ],
891
+ ("fixed_size_list", "polars", "application/feather"): [
892
+ DatasetType.PANDAS,
893
+ DatasetType.POLARS,
894
+ DatasetType.PYARROW,
895
+ DatasetType.RAY_DATASET,
896
+ ],
897
+ ("fixed_size_list", "polars", "application/orc"): [
898
+ DatasetType.PANDAS,
899
+ DatasetType.POLARS,
900
+ DatasetType.PYARROW,
901
+ DatasetType.RAY_DATASET,
902
+ ],
903
+ ("fixed_size_list", "polars", "application/parquet"): [
904
+ DatasetType.DAFT,
905
+ DatasetType.PANDAS,
906
+ DatasetType.POLARS,
907
+ DatasetType.PYARROW,
908
+ DatasetType.RAY_DATASET,
909
+ ],
910
+ ("fixed_size_list", "pyarrow", "application/feather"): [
911
+ DatasetType.PANDAS,
912
+ DatasetType.POLARS,
913
+ DatasetType.PYARROW,
914
+ DatasetType.RAY_DATASET,
915
+ ],
916
+ ("fixed_size_list", "pyarrow", "application/orc"): [
917
+ DatasetType.PANDAS,
918
+ DatasetType.POLARS,
919
+ DatasetType.PYARROW,
920
+ DatasetType.RAY_DATASET,
921
+ ],
922
+ ("fixed_size_list", "pyarrow", "application/parquet"): [
923
+ DatasetType.DAFT,
924
+ DatasetType.PANDAS,
925
+ DatasetType.POLARS,
926
+ DatasetType.PYARROW,
927
+ DatasetType.RAY_DATASET,
928
+ ],
929
+ ("fixed_size_list", "ray_dataset", "application/parquet"): [
930
+ DatasetType.DAFT,
931
+ DatasetType.PANDAS,
932
+ DatasetType.POLARS,
933
+ DatasetType.PYARROW,
934
+ DatasetType.RAY_DATASET,
935
+ ],
936
+ ("float", "daft", "application/parquet"): [
937
+ DatasetType.DAFT,
938
+ DatasetType.PANDAS,
939
+ DatasetType.POLARS,
940
+ DatasetType.PYARROW,
941
+ DatasetType.RAY_DATASET,
942
+ ],
943
+ ("float", "pandas", "application/avro"): [
944
+ DatasetType.PANDAS,
945
+ DatasetType.POLARS,
946
+ DatasetType.PYARROW,
947
+ DatasetType.RAY_DATASET,
948
+ ],
949
+ ("float", "pandas", "application/feather"): [
950
+ DatasetType.PANDAS,
951
+ DatasetType.POLARS,
952
+ DatasetType.PYARROW,
953
+ DatasetType.RAY_DATASET,
954
+ ],
955
+ ("float", "pandas", "application/orc"): [
956
+ DatasetType.PANDAS,
957
+ DatasetType.POLARS,
958
+ DatasetType.PYARROW,
959
+ DatasetType.RAY_DATASET,
960
+ ],
961
+ ("float", "pandas", "application/parquet"): [
962
+ DatasetType.DAFT,
963
+ DatasetType.PANDAS,
964
+ DatasetType.POLARS,
965
+ DatasetType.PYARROW,
966
+ DatasetType.RAY_DATASET,
967
+ ],
968
+ ("float", "polars", "application/avro"): [
969
+ DatasetType.PANDAS,
970
+ DatasetType.POLARS,
971
+ DatasetType.PYARROW,
972
+ DatasetType.RAY_DATASET,
973
+ ],
974
+ ("float", "polars", "application/feather"): [
975
+ DatasetType.PANDAS,
976
+ DatasetType.POLARS,
977
+ DatasetType.PYARROW,
978
+ DatasetType.RAY_DATASET,
979
+ ],
980
+ ("float", "polars", "application/orc"): [
981
+ DatasetType.PANDAS,
982
+ DatasetType.POLARS,
983
+ DatasetType.PYARROW,
984
+ DatasetType.RAY_DATASET,
985
+ ],
986
+ ("float", "polars", "application/parquet"): [
987
+ DatasetType.DAFT,
988
+ DatasetType.PANDAS,
989
+ DatasetType.POLARS,
990
+ DatasetType.PYARROW,
991
+ DatasetType.RAY_DATASET,
992
+ ],
993
+ ("float", "pyarrow", "application/avro"): [
994
+ DatasetType.PANDAS,
995
+ DatasetType.POLARS,
996
+ DatasetType.PYARROW,
997
+ DatasetType.RAY_DATASET,
998
+ ],
999
+ ("float", "pyarrow", "application/feather"): [
1000
+ DatasetType.PANDAS,
1001
+ DatasetType.POLARS,
1002
+ DatasetType.PYARROW,
1003
+ DatasetType.RAY_DATASET,
1004
+ ],
1005
+ ("float", "pyarrow", "application/orc"): [
1006
+ DatasetType.PANDAS,
1007
+ DatasetType.POLARS,
1008
+ DatasetType.PYARROW,
1009
+ DatasetType.RAY_DATASET,
1010
+ ],
1011
+ ("float", "pyarrow", "application/parquet"): [
1012
+ DatasetType.DAFT,
1013
+ DatasetType.PANDAS,
1014
+ DatasetType.POLARS,
1015
+ DatasetType.PYARROW,
1016
+ DatasetType.RAY_DATASET,
1017
+ ],
1018
+ ("float", "ray_dataset", "application/parquet"): [
1019
+ DatasetType.DAFT,
1020
+ DatasetType.PANDAS,
1021
+ DatasetType.POLARS,
1022
+ DatasetType.PYARROW,
1023
+ DatasetType.RAY_DATASET,
1024
+ ],
1025
+ ("halffloat", "pandas", "application/avro"): [
1026
+ DatasetType.PANDAS,
1027
+ DatasetType.POLARS,
1028
+ DatasetType.PYARROW,
1029
+ DatasetType.RAY_DATASET,
1030
+ ],
1031
+ ("halffloat", "pandas", "application/feather"): [
1032
+ DatasetType.PANDAS,
1033
+ DatasetType.POLARS,
1034
+ DatasetType.PYARROW,
1035
+ DatasetType.RAY_DATASET,
1036
+ ],
1037
+ ("halffloat", "pandas", "application/parquet"): [
1038
+ DatasetType.DAFT,
1039
+ DatasetType.PANDAS,
1040
+ DatasetType.POLARS,
1041
+ DatasetType.PYARROW,
1042
+ DatasetType.RAY_DATASET,
1043
+ ],
1044
+ ("halffloat", "polars", "application/avro"): [
1045
+ DatasetType.PANDAS,
1046
+ DatasetType.POLARS,
1047
+ DatasetType.PYARROW,
1048
+ DatasetType.RAY_DATASET,
1049
+ ],
1050
+ ("halffloat", "polars", "application/feather"): [
1051
+ DatasetType.PANDAS,
1052
+ DatasetType.POLARS,
1053
+ DatasetType.PYARROW,
1054
+ DatasetType.RAY_DATASET,
1055
+ ],
1056
+ ("halffloat", "polars", "application/orc"): [
1057
+ DatasetType.PANDAS,
1058
+ DatasetType.POLARS,
1059
+ DatasetType.PYARROW,
1060
+ DatasetType.RAY_DATASET,
1061
+ ],
1062
+ ("halffloat", "polars", "application/parquet"): [
1063
+ DatasetType.DAFT,
1064
+ DatasetType.PANDAS,
1065
+ DatasetType.POLARS,
1066
+ DatasetType.PYARROW,
1067
+ DatasetType.RAY_DATASET,
1068
+ ],
1069
+ ("halffloat", "pyarrow", "application/avro"): [
1070
+ DatasetType.PANDAS,
1071
+ DatasetType.POLARS,
1072
+ DatasetType.PYARROW,
1073
+ DatasetType.RAY_DATASET,
1074
+ ],
1075
+ ("halffloat", "pyarrow", "application/feather"): [
1076
+ DatasetType.PANDAS,
1077
+ DatasetType.POLARS,
1078
+ DatasetType.PYARROW,
1079
+ DatasetType.RAY_DATASET,
1080
+ ],
1081
+ ("halffloat", "pyarrow", "application/parquet"): [
1082
+ DatasetType.DAFT,
1083
+ DatasetType.PANDAS,
1084
+ DatasetType.POLARS,
1085
+ DatasetType.PYARROW,
1086
+ DatasetType.RAY_DATASET,
1087
+ ],
1088
+ ("int16", "daft", "application/parquet"): [
1089
+ DatasetType.DAFT,
1090
+ DatasetType.PANDAS,
1091
+ DatasetType.POLARS,
1092
+ DatasetType.PYARROW,
1093
+ DatasetType.RAY_DATASET,
1094
+ ],
1095
+ ("int16", "pandas", "application/feather"): [
1096
+ DatasetType.PANDAS,
1097
+ DatasetType.POLARS,
1098
+ DatasetType.PYARROW,
1099
+ DatasetType.RAY_DATASET,
1100
+ ],
1101
+ ("int16", "pandas", "application/orc"): [
1102
+ DatasetType.PANDAS,
1103
+ DatasetType.POLARS,
1104
+ DatasetType.PYARROW,
1105
+ DatasetType.RAY_DATASET,
1106
+ ],
1107
+ ("int16", "pandas", "application/parquet"): [
1108
+ DatasetType.DAFT,
1109
+ DatasetType.PANDAS,
1110
+ DatasetType.POLARS,
1111
+ DatasetType.PYARROW,
1112
+ DatasetType.RAY_DATASET,
1113
+ ],
1114
+ ("int16", "polars", "application/feather"): [
1115
+ DatasetType.PANDAS,
1116
+ DatasetType.POLARS,
1117
+ DatasetType.PYARROW,
1118
+ DatasetType.RAY_DATASET,
1119
+ ],
1120
+ ("int16", "polars", "application/orc"): [
1121
+ DatasetType.PANDAS,
1122
+ DatasetType.POLARS,
1123
+ DatasetType.PYARROW,
1124
+ DatasetType.RAY_DATASET,
1125
+ ],
1126
+ ("int16", "polars", "application/parquet"): [
1127
+ DatasetType.DAFT,
1128
+ DatasetType.PANDAS,
1129
+ DatasetType.POLARS,
1130
+ DatasetType.PYARROW,
1131
+ DatasetType.RAY_DATASET,
1132
+ ],
1133
+ ("int16", "pyarrow", "application/feather"): [
1134
+ DatasetType.PANDAS,
1135
+ DatasetType.POLARS,
1136
+ DatasetType.PYARROW,
1137
+ DatasetType.RAY_DATASET,
1138
+ ],
1139
+ ("int16", "pyarrow", "application/orc"): [
1140
+ DatasetType.PANDAS,
1141
+ DatasetType.POLARS,
1142
+ DatasetType.PYARROW,
1143
+ DatasetType.RAY_DATASET,
1144
+ ],
1145
+ ("int16", "pyarrow", "application/parquet"): [
1146
+ DatasetType.DAFT,
1147
+ DatasetType.PANDAS,
1148
+ DatasetType.POLARS,
1149
+ DatasetType.PYARROW,
1150
+ DatasetType.RAY_DATASET,
1151
+ ],
1152
+ ("int16", "ray_dataset", "application/parquet"): [
1153
+ DatasetType.DAFT,
1154
+ DatasetType.PANDAS,
1155
+ DatasetType.POLARS,
1156
+ DatasetType.PYARROW,
1157
+ DatasetType.RAY_DATASET,
1158
+ ],
1159
+ ("int32", "daft", "application/parquet"): [
1160
+ DatasetType.DAFT,
1161
+ DatasetType.PANDAS,
1162
+ DatasetType.POLARS,
1163
+ DatasetType.PYARROW,
1164
+ DatasetType.RAY_DATASET,
1165
+ ],
1166
+ ("int32", "pandas", "application/avro"): [
1167
+ DatasetType.PANDAS,
1168
+ DatasetType.POLARS,
1169
+ DatasetType.PYARROW,
1170
+ DatasetType.RAY_DATASET,
1171
+ ],
1172
+ ("int32", "pandas", "application/feather"): [
1173
+ DatasetType.PANDAS,
1174
+ DatasetType.POLARS,
1175
+ DatasetType.PYARROW,
1176
+ DatasetType.RAY_DATASET,
1177
+ ],
1178
+ ("int32", "pandas", "application/orc"): [
1179
+ DatasetType.PANDAS,
1180
+ DatasetType.POLARS,
1181
+ DatasetType.PYARROW,
1182
+ DatasetType.RAY_DATASET,
1183
+ ],
1184
+ ("int32", "pandas", "application/parquet"): [
1185
+ DatasetType.DAFT,
1186
+ DatasetType.PANDAS,
1187
+ DatasetType.POLARS,
1188
+ DatasetType.PYARROW,
1189
+ DatasetType.RAY_DATASET,
1190
+ ],
1191
+ ("int32", "polars", "application/avro"): [
1192
+ DatasetType.PANDAS,
1193
+ DatasetType.POLARS,
1194
+ DatasetType.PYARROW,
1195
+ DatasetType.RAY_DATASET,
1196
+ ],
1197
+ ("int32", "polars", "application/feather"): [
1198
+ DatasetType.PANDAS,
1199
+ DatasetType.POLARS,
1200
+ DatasetType.PYARROW,
1201
+ DatasetType.RAY_DATASET,
1202
+ ],
1203
+ ("int32", "polars", "application/orc"): [
1204
+ DatasetType.PANDAS,
1205
+ DatasetType.POLARS,
1206
+ DatasetType.PYARROW,
1207
+ DatasetType.RAY_DATASET,
1208
+ ],
1209
+ ("int32", "polars", "application/parquet"): [
1210
+ DatasetType.DAFT,
1211
+ DatasetType.PANDAS,
1212
+ DatasetType.POLARS,
1213
+ DatasetType.PYARROW,
1214
+ DatasetType.RAY_DATASET,
1215
+ ],
1216
+ ("int32", "pyarrow", "application/avro"): [
1217
+ DatasetType.PANDAS,
1218
+ DatasetType.POLARS,
1219
+ DatasetType.PYARROW,
1220
+ DatasetType.RAY_DATASET,
1221
+ ],
1222
+ ("int32", "pyarrow", "application/feather"): [
1223
+ DatasetType.PANDAS,
1224
+ DatasetType.POLARS,
1225
+ DatasetType.PYARROW,
1226
+ DatasetType.RAY_DATASET,
1227
+ ],
1228
+ ("int32", "pyarrow", "application/orc"): [
1229
+ DatasetType.PANDAS,
1230
+ DatasetType.POLARS,
1231
+ DatasetType.PYARROW,
1232
+ DatasetType.RAY_DATASET,
1233
+ ],
1234
+ ("int32", "pyarrow", "application/parquet"): [
1235
+ DatasetType.DAFT,
1236
+ DatasetType.PANDAS,
1237
+ DatasetType.POLARS,
1238
+ DatasetType.PYARROW,
1239
+ DatasetType.RAY_DATASET,
1240
+ ],
1241
+ ("int32", "ray_dataset", "application/parquet"): [
1242
+ DatasetType.DAFT,
1243
+ DatasetType.PANDAS,
1244
+ DatasetType.POLARS,
1245
+ DatasetType.PYARROW,
1246
+ DatasetType.RAY_DATASET,
1247
+ ],
1248
+ ("int64", "daft", "application/parquet"): [
1249
+ DatasetType.DAFT,
1250
+ DatasetType.PANDAS,
1251
+ DatasetType.POLARS,
1252
+ DatasetType.PYARROW,
1253
+ DatasetType.RAY_DATASET,
1254
+ ],
1255
+ ("int64", "pandas", "application/avro"): [
1256
+ DatasetType.PANDAS,
1257
+ DatasetType.POLARS,
1258
+ DatasetType.PYARROW,
1259
+ DatasetType.RAY_DATASET,
1260
+ ],
1261
+ ("int64", "pandas", "application/feather"): [
1262
+ DatasetType.PANDAS,
1263
+ DatasetType.POLARS,
1264
+ DatasetType.PYARROW,
1265
+ DatasetType.RAY_DATASET,
1266
+ ],
1267
+ ("int64", "pandas", "application/orc"): [
1268
+ DatasetType.PANDAS,
1269
+ DatasetType.POLARS,
1270
+ DatasetType.PYARROW,
1271
+ DatasetType.RAY_DATASET,
1272
+ ],
1273
+ ("int64", "pandas", "application/parquet"): [
1274
+ DatasetType.DAFT,
1275
+ DatasetType.PANDAS,
1276
+ DatasetType.POLARS,
1277
+ DatasetType.PYARROW,
1278
+ DatasetType.RAY_DATASET,
1279
+ ],
1280
+ ("int64", "polars", "application/avro"): [
1281
+ DatasetType.PANDAS,
1282
+ DatasetType.POLARS,
1283
+ DatasetType.PYARROW,
1284
+ DatasetType.RAY_DATASET,
1285
+ ],
1286
+ ("int64", "polars", "application/feather"): [
1287
+ DatasetType.PANDAS,
1288
+ DatasetType.POLARS,
1289
+ DatasetType.PYARROW,
1290
+ DatasetType.RAY_DATASET,
1291
+ ],
1292
+ ("int64", "polars", "application/orc"): [
1293
+ DatasetType.PANDAS,
1294
+ DatasetType.POLARS,
1295
+ DatasetType.PYARROW,
1296
+ DatasetType.RAY_DATASET,
1297
+ ],
1298
+ ("int64", "polars", "application/parquet"): [
1299
+ DatasetType.DAFT,
1300
+ DatasetType.PANDAS,
1301
+ DatasetType.POLARS,
1302
+ DatasetType.PYARROW,
1303
+ DatasetType.RAY_DATASET,
1304
+ ],
1305
+ ("int64", "pyarrow", "application/avro"): [
1306
+ DatasetType.PANDAS,
1307
+ DatasetType.POLARS,
1308
+ DatasetType.PYARROW,
1309
+ DatasetType.RAY_DATASET,
1310
+ ],
1311
+ ("int64", "pyarrow", "application/feather"): [
1312
+ DatasetType.PANDAS,
1313
+ DatasetType.POLARS,
1314
+ DatasetType.PYARROW,
1315
+ DatasetType.RAY_DATASET,
1316
+ ],
1317
+ ("int64", "pyarrow", "application/orc"): [
1318
+ DatasetType.PANDAS,
1319
+ DatasetType.POLARS,
1320
+ DatasetType.PYARROW,
1321
+ DatasetType.RAY_DATASET,
1322
+ ],
1323
+ ("int64", "pyarrow", "application/parquet"): [
1324
+ DatasetType.DAFT,
1325
+ DatasetType.PANDAS,
1326
+ DatasetType.POLARS,
1327
+ DatasetType.PYARROW,
1328
+ DatasetType.RAY_DATASET,
1329
+ ],
1330
+ ("int64", "ray_dataset", "application/parquet"): [
1331
+ DatasetType.DAFT,
1332
+ DatasetType.PANDAS,
1333
+ DatasetType.POLARS,
1334
+ DatasetType.PYARROW,
1335
+ DatasetType.RAY_DATASET,
1336
+ ],
1337
+ ("int8", "daft", "application/parquet"): [
1338
+ DatasetType.DAFT,
1339
+ DatasetType.PANDAS,
1340
+ DatasetType.POLARS,
1341
+ DatasetType.PYARROW,
1342
+ DatasetType.RAY_DATASET,
1343
+ ],
1344
+ ("int8", "pandas", "application/feather"): [
1345
+ DatasetType.PANDAS,
1346
+ DatasetType.POLARS,
1347
+ DatasetType.PYARROW,
1348
+ DatasetType.RAY_DATASET,
1349
+ ],
1350
+ ("int8", "pandas", "application/orc"): [
1351
+ DatasetType.PANDAS,
1352
+ DatasetType.POLARS,
1353
+ DatasetType.PYARROW,
1354
+ DatasetType.RAY_DATASET,
1355
+ ],
1356
+ ("int8", "pandas", "application/parquet"): [
1357
+ DatasetType.DAFT,
1358
+ DatasetType.PANDAS,
1359
+ DatasetType.POLARS,
1360
+ DatasetType.PYARROW,
1361
+ DatasetType.RAY_DATASET,
1362
+ ],
1363
+ ("int8", "polars", "application/feather"): [
1364
+ DatasetType.PANDAS,
1365
+ DatasetType.POLARS,
1366
+ DatasetType.PYARROW,
1367
+ DatasetType.RAY_DATASET,
1368
+ ],
1369
+ ("int8", "polars", "application/orc"): [
1370
+ DatasetType.PANDAS,
1371
+ DatasetType.POLARS,
1372
+ DatasetType.PYARROW,
1373
+ DatasetType.RAY_DATASET,
1374
+ ],
1375
+ ("int8", "polars", "application/parquet"): [
1376
+ DatasetType.DAFT,
1377
+ DatasetType.PANDAS,
1378
+ DatasetType.POLARS,
1379
+ DatasetType.PYARROW,
1380
+ DatasetType.RAY_DATASET,
1381
+ ],
1382
+ ("int8", "pyarrow", "application/feather"): [
1383
+ DatasetType.PANDAS,
1384
+ DatasetType.POLARS,
1385
+ DatasetType.PYARROW,
1386
+ DatasetType.RAY_DATASET,
1387
+ ],
1388
+ ("int8", "pyarrow", "application/orc"): [
1389
+ DatasetType.PANDAS,
1390
+ DatasetType.POLARS,
1391
+ DatasetType.PYARROW,
1392
+ DatasetType.RAY_DATASET,
1393
+ ],
1394
+ ("int8", "pyarrow", "application/parquet"): [
1395
+ DatasetType.DAFT,
1396
+ DatasetType.PANDAS,
1397
+ DatasetType.POLARS,
1398
+ DatasetType.PYARROW,
1399
+ DatasetType.RAY_DATASET,
1400
+ ],
1401
+ ("int8", "ray_dataset", "application/parquet"): [
1402
+ DatasetType.DAFT,
1403
+ DatasetType.PANDAS,
1404
+ DatasetType.POLARS,
1405
+ DatasetType.PYARROW,
1406
+ DatasetType.RAY_DATASET,
1407
+ ],
1408
+ ("large_binary", "daft", "application/parquet"): [
1409
+ DatasetType.DAFT,
1410
+ DatasetType.PANDAS,
1411
+ DatasetType.POLARS,
1412
+ DatasetType.PYARROW,
1413
+ DatasetType.RAY_DATASET,
1414
+ ],
1415
+ ("large_binary", "pandas", "application/avro"): [
1416
+ DatasetType.PANDAS,
1417
+ DatasetType.POLARS,
1418
+ DatasetType.PYARROW,
1419
+ DatasetType.RAY_DATASET,
1420
+ ],
1421
+ ("large_binary", "pandas", "application/feather"): [
1422
+ DatasetType.PANDAS,
1423
+ DatasetType.POLARS,
1424
+ DatasetType.PYARROW,
1425
+ DatasetType.RAY_DATASET,
1426
+ ],
1427
+ ("large_binary", "pandas", "application/orc"): [
1428
+ DatasetType.PANDAS,
1429
+ DatasetType.POLARS,
1430
+ DatasetType.PYARROW,
1431
+ DatasetType.RAY_DATASET,
1432
+ ],
1433
+ ("large_binary", "pandas", "application/parquet"): [
1434
+ DatasetType.DAFT,
1435
+ DatasetType.PANDAS,
1436
+ DatasetType.POLARS,
1437
+ DatasetType.PYARROW,
1438
+ DatasetType.RAY_DATASET,
1439
+ ],
1440
+ ("large_binary", "polars", "application/avro"): [
1441
+ DatasetType.PANDAS,
1442
+ DatasetType.POLARS,
1443
+ DatasetType.PYARROW,
1444
+ DatasetType.RAY_DATASET,
1445
+ ],
1446
+ ("large_binary", "polars", "application/feather"): [
1447
+ DatasetType.PANDAS,
1448
+ DatasetType.POLARS,
1449
+ ],
1450
+ ("large_binary", "polars", "application/orc"): [
1451
+ DatasetType.PANDAS,
1452
+ DatasetType.POLARS,
1453
+ DatasetType.PYARROW,
1454
+ DatasetType.RAY_DATASET,
1455
+ ],
1456
+ ("large_binary", "polars", "application/parquet"): [
1457
+ DatasetType.DAFT,
1458
+ DatasetType.PANDAS,
1459
+ DatasetType.POLARS,
1460
+ DatasetType.PYARROW,
1461
+ DatasetType.RAY_DATASET,
1462
+ ],
1463
+ ("large_binary", "pyarrow", "application/avro"): [
1464
+ DatasetType.PANDAS,
1465
+ DatasetType.POLARS,
1466
+ DatasetType.PYARROW,
1467
+ DatasetType.RAY_DATASET,
1468
+ ],
1469
+ ("large_binary", "pyarrow", "application/feather"): [
1470
+ DatasetType.PANDAS,
1471
+ DatasetType.POLARS,
1472
+ DatasetType.PYARROW,
1473
+ DatasetType.RAY_DATASET,
1474
+ ],
1475
+ ("large_binary", "pyarrow", "application/orc"): [
1476
+ DatasetType.PANDAS,
1477
+ DatasetType.POLARS,
1478
+ DatasetType.PYARROW,
1479
+ DatasetType.RAY_DATASET,
1480
+ ],
1481
+ ("large_binary", "pyarrow", "application/parquet"): [
1482
+ DatasetType.DAFT,
1483
+ DatasetType.PANDAS,
1484
+ DatasetType.POLARS,
1485
+ DatasetType.PYARROW,
1486
+ DatasetType.RAY_DATASET,
1487
+ ],
1488
+ ("large_binary", "ray_dataset", "application/parquet"): [
1489
+ DatasetType.DAFT,
1490
+ DatasetType.PANDAS,
1491
+ DatasetType.POLARS,
1492
+ DatasetType.PYARROW,
1493
+ DatasetType.RAY_DATASET,
1494
+ ],
1495
+ ("large_list", "daft", "application/parquet"): [
1496
+ DatasetType.DAFT,
1497
+ DatasetType.PANDAS,
1498
+ DatasetType.POLARS,
1499
+ DatasetType.PYARROW,
1500
+ DatasetType.RAY_DATASET,
1501
+ ],
1502
+ ("large_list", "pandas", "application/avro"): [
1503
+ DatasetType.PANDAS,
1504
+ DatasetType.POLARS,
1505
+ DatasetType.PYARROW,
1506
+ DatasetType.RAY_DATASET,
1507
+ ],
1508
+ ("large_list", "pandas", "application/feather"): [
1509
+ DatasetType.PANDAS,
1510
+ DatasetType.POLARS,
1511
+ DatasetType.PYARROW,
1512
+ DatasetType.RAY_DATASET,
1513
+ ],
1514
+ ("large_list", "pandas", "application/orc"): [
1515
+ DatasetType.PANDAS,
1516
+ DatasetType.POLARS,
1517
+ DatasetType.PYARROW,
1518
+ DatasetType.RAY_DATASET,
1519
+ ],
1520
+ ("large_list", "pandas", "application/parquet"): [
1521
+ DatasetType.DAFT,
1522
+ DatasetType.PANDAS,
1523
+ DatasetType.POLARS,
1524
+ DatasetType.PYARROW,
1525
+ DatasetType.RAY_DATASET,
1526
+ ],
1527
+ ("large_list", "polars", "application/avro"): [
1528
+ DatasetType.PANDAS,
1529
+ DatasetType.POLARS,
1530
+ DatasetType.PYARROW,
1531
+ DatasetType.RAY_DATASET,
1532
+ ],
1533
+ ("large_list", "polars", "application/feather"): [
1534
+ DatasetType.PANDAS,
1535
+ DatasetType.POLARS,
1536
+ DatasetType.PYARROW,
1537
+ DatasetType.RAY_DATASET,
1538
+ ],
1539
+ ("large_list", "polars", "application/orc"): [
1540
+ DatasetType.PANDAS,
1541
+ DatasetType.POLARS,
1542
+ DatasetType.PYARROW,
1543
+ DatasetType.RAY_DATASET,
1544
+ ],
1545
+ ("large_list", "polars", "application/parquet"): [
1546
+ DatasetType.DAFT,
1547
+ DatasetType.PANDAS,
1548
+ DatasetType.POLARS,
1549
+ DatasetType.PYARROW,
1550
+ DatasetType.RAY_DATASET,
1551
+ ],
1552
+ ("large_list", "pyarrow", "application/avro"): [
1553
+ DatasetType.PANDAS,
1554
+ DatasetType.POLARS,
1555
+ DatasetType.PYARROW,
1556
+ DatasetType.RAY_DATASET,
1557
+ ],
1558
+ ("large_list", "pyarrow", "application/feather"): [
1559
+ DatasetType.PANDAS,
1560
+ DatasetType.POLARS,
1561
+ DatasetType.PYARROW,
1562
+ DatasetType.RAY_DATASET,
1563
+ ],
1564
+ ("large_list", "pyarrow", "application/orc"): [
1565
+ DatasetType.PANDAS,
1566
+ DatasetType.POLARS,
1567
+ DatasetType.PYARROW,
1568
+ DatasetType.RAY_DATASET,
1569
+ ],
1570
+ ("large_list", "pyarrow", "application/parquet"): [
1571
+ DatasetType.DAFT,
1572
+ DatasetType.PANDAS,
1573
+ DatasetType.POLARS,
1574
+ DatasetType.PYARROW,
1575
+ DatasetType.RAY_DATASET,
1576
+ ],
1577
+ ("large_list", "ray_dataset", "application/parquet"): [
1578
+ DatasetType.DAFT,
1579
+ DatasetType.PANDAS,
1580
+ DatasetType.POLARS,
1581
+ DatasetType.PYARROW,
1582
+ DatasetType.RAY_DATASET,
1583
+ ],
1584
+ ("large_list_view", "pandas", "application/avro"): [
1585
+ DatasetType.PANDAS,
1586
+ DatasetType.POLARS,
1587
+ DatasetType.PYARROW,
1588
+ DatasetType.RAY_DATASET,
1589
+ ],
1590
+ ("large_list_view", "pandas", "application/feather"): [
1591
+ DatasetType.PANDAS,
1592
+ DatasetType.POLARS,
1593
+ DatasetType.PYARROW,
1594
+ DatasetType.RAY_DATASET,
1595
+ ],
1596
+ ("large_list_view", "pandas", "application/orc"): [
1597
+ DatasetType.PANDAS,
1598
+ DatasetType.POLARS,
1599
+ DatasetType.PYARROW,
1600
+ DatasetType.RAY_DATASET,
1601
+ ],
1602
+ ("large_list_view", "pandas", "application/parquet"): [
1603
+ DatasetType.DAFT,
1604
+ DatasetType.PANDAS,
1605
+ DatasetType.POLARS,
1606
+ DatasetType.PYARROW,
1607
+ DatasetType.RAY_DATASET,
1608
+ ],
1609
+ ("large_string", "daft", "application/parquet"): [
1610
+ DatasetType.DAFT,
1611
+ DatasetType.PANDAS,
1612
+ DatasetType.POLARS,
1613
+ DatasetType.PYARROW,
1614
+ DatasetType.RAY_DATASET,
1615
+ ],
1616
+ ("large_string", "pandas", "application/avro"): [
1617
+ DatasetType.PANDAS,
1618
+ DatasetType.POLARS,
1619
+ DatasetType.PYARROW,
1620
+ DatasetType.RAY_DATASET,
1621
+ ],
1622
+ ("large_string", "pandas", "application/feather"): [
1623
+ DatasetType.PANDAS,
1624
+ DatasetType.POLARS,
1625
+ DatasetType.PYARROW,
1626
+ DatasetType.RAY_DATASET,
1627
+ ],
1628
+ ("large_string", "pandas", "application/orc"): [
1629
+ DatasetType.PANDAS,
1630
+ DatasetType.POLARS,
1631
+ DatasetType.PYARROW,
1632
+ DatasetType.RAY_DATASET,
1633
+ ],
1634
+ ("large_string", "pandas", "application/parquet"): [
1635
+ DatasetType.DAFT,
1636
+ DatasetType.PANDAS,
1637
+ DatasetType.POLARS,
1638
+ DatasetType.PYARROW,
1639
+ DatasetType.RAY_DATASET,
1640
+ ],
1641
+ ("large_string", "polars", "application/avro"): [
1642
+ DatasetType.PANDAS,
1643
+ DatasetType.POLARS,
1644
+ DatasetType.PYARROW,
1645
+ DatasetType.RAY_DATASET,
1646
+ ],
1647
+ ("large_string", "polars", "application/feather"): [
1648
+ DatasetType.PANDAS,
1649
+ DatasetType.POLARS,
1650
+ DatasetType.RAY_DATASET,
1651
+ ],
1652
+ ("large_string", "polars", "application/orc"): [
1653
+ DatasetType.PANDAS,
1654
+ DatasetType.POLARS,
1655
+ DatasetType.PYARROW,
1656
+ DatasetType.RAY_DATASET,
1657
+ ],
1658
+ ("large_string", "polars", "application/parquet"): [
1659
+ DatasetType.DAFT,
1660
+ DatasetType.PANDAS,
1661
+ DatasetType.POLARS,
1662
+ DatasetType.PYARROW,
1663
+ DatasetType.RAY_DATASET,
1664
+ ],
1665
+ ("large_string", "pyarrow", "application/avro"): [
1666
+ DatasetType.PANDAS,
1667
+ DatasetType.POLARS,
1668
+ DatasetType.PYARROW,
1669
+ DatasetType.RAY_DATASET,
1670
+ ],
1671
+ ("large_string", "pyarrow", "application/feather"): [
1672
+ DatasetType.PANDAS,
1673
+ DatasetType.POLARS,
1674
+ DatasetType.PYARROW,
1675
+ DatasetType.RAY_DATASET,
1676
+ ],
1677
+ ("large_string", "pyarrow", "application/orc"): [
1678
+ DatasetType.PANDAS,
1679
+ DatasetType.POLARS,
1680
+ DatasetType.PYARROW,
1681
+ DatasetType.RAY_DATASET,
1682
+ ],
1683
+ ("large_string", "pyarrow", "application/parquet"): [
1684
+ DatasetType.DAFT,
1685
+ DatasetType.PANDAS,
1686
+ DatasetType.POLARS,
1687
+ DatasetType.PYARROW,
1688
+ DatasetType.RAY_DATASET,
1689
+ ],
1690
+ ("large_string", "ray_dataset", "application/parquet"): [
1691
+ DatasetType.DAFT,
1692
+ DatasetType.PANDAS,
1693
+ DatasetType.POLARS,
1694
+ DatasetType.PYARROW,
1695
+ DatasetType.RAY_DATASET,
1696
+ ],
1697
+ ("list", "daft", "application/parquet"): [
1698
+ DatasetType.DAFT,
1699
+ DatasetType.PANDAS,
1700
+ DatasetType.POLARS,
1701
+ DatasetType.PYARROW,
1702
+ DatasetType.RAY_DATASET,
1703
+ ],
1704
+ ("list", "pandas", "application/avro"): [
1705
+ DatasetType.PANDAS,
1706
+ DatasetType.POLARS,
1707
+ DatasetType.PYARROW,
1708
+ DatasetType.RAY_DATASET,
1709
+ ],
1710
+ ("list", "pandas", "application/feather"): [
1711
+ DatasetType.PANDAS,
1712
+ DatasetType.POLARS,
1713
+ DatasetType.PYARROW,
1714
+ DatasetType.RAY_DATASET,
1715
+ ],
1716
+ ("list", "pandas", "application/orc"): [
1717
+ DatasetType.PANDAS,
1718
+ DatasetType.POLARS,
1719
+ DatasetType.PYARROW,
1720
+ DatasetType.RAY_DATASET,
1721
+ ],
1722
+ ("list", "pandas", "application/parquet"): [
1723
+ DatasetType.DAFT,
1724
+ DatasetType.PANDAS,
1725
+ DatasetType.POLARS,
1726
+ DatasetType.PYARROW,
1727
+ DatasetType.RAY_DATASET,
1728
+ ],
1729
+ ("list", "polars", "application/avro"): [
1730
+ DatasetType.PANDAS,
1731
+ DatasetType.POLARS,
1732
+ DatasetType.PYARROW,
1733
+ DatasetType.RAY_DATASET,
1734
+ ],
1735
+ ("list", "polars", "application/feather"): [
1736
+ DatasetType.PANDAS,
1737
+ DatasetType.POLARS,
1738
+ DatasetType.PYARROW,
1739
+ DatasetType.RAY_DATASET,
1740
+ ],
1741
+ ("list", "polars", "application/orc"): [
1742
+ DatasetType.PANDAS,
1743
+ DatasetType.POLARS,
1744
+ DatasetType.PYARROW,
1745
+ DatasetType.RAY_DATASET,
1746
+ ],
1747
+ ("list", "polars", "application/parquet"): [
1748
+ DatasetType.DAFT,
1749
+ DatasetType.PANDAS,
1750
+ DatasetType.POLARS,
1751
+ DatasetType.PYARROW,
1752
+ DatasetType.RAY_DATASET,
1753
+ ],
1754
+ ("list", "pyarrow", "application/avro"): [
1755
+ DatasetType.PANDAS,
1756
+ DatasetType.POLARS,
1757
+ DatasetType.PYARROW,
1758
+ DatasetType.RAY_DATASET,
1759
+ ],
1760
+ ("list", "pyarrow", "application/feather"): [
1761
+ DatasetType.PANDAS,
1762
+ DatasetType.POLARS,
1763
+ DatasetType.PYARROW,
1764
+ DatasetType.RAY_DATASET,
1765
+ ],
1766
+ ("list", "pyarrow", "application/orc"): [
1767
+ DatasetType.PANDAS,
1768
+ DatasetType.POLARS,
1769
+ DatasetType.PYARROW,
1770
+ DatasetType.RAY_DATASET,
1771
+ ],
1772
+ ("list", "pyarrow", "application/parquet"): [
1773
+ DatasetType.DAFT,
1774
+ DatasetType.PANDAS,
1775
+ DatasetType.POLARS,
1776
+ DatasetType.PYARROW,
1777
+ DatasetType.RAY_DATASET,
1778
+ ],
1779
+ ("list", "ray_dataset", "application/parquet"): [
1780
+ DatasetType.DAFT,
1781
+ DatasetType.PANDAS,
1782
+ DatasetType.POLARS,
1783
+ DatasetType.PYARROW,
1784
+ DatasetType.RAY_DATASET,
1785
+ ],
1786
+ ("list_view", "pandas", "application/avro"): [
1787
+ DatasetType.PANDAS,
1788
+ DatasetType.POLARS,
1789
+ DatasetType.PYARROW,
1790
+ DatasetType.RAY_DATASET,
1791
+ ],
1792
+ ("list_view", "pandas", "application/feather"): [
1793
+ DatasetType.PANDAS,
1794
+ DatasetType.POLARS,
1795
+ DatasetType.PYARROW,
1796
+ DatasetType.RAY_DATASET,
1797
+ ],
1798
+ ("list_view", "pandas", "application/orc"): [
1799
+ DatasetType.PANDAS,
1800
+ DatasetType.POLARS,
1801
+ DatasetType.PYARROW,
1802
+ DatasetType.RAY_DATASET,
1803
+ ],
1804
+ ("list_view", "pandas", "application/parquet"): [
1805
+ DatasetType.DAFT,
1806
+ DatasetType.PANDAS,
1807
+ DatasetType.POLARS,
1808
+ DatasetType.PYARROW,
1809
+ DatasetType.RAY_DATASET,
1810
+ ],
1811
+ ("map", "daft", "application/parquet"): [
1812
+ DatasetType.DAFT,
1813
+ DatasetType.PANDAS,
1814
+ DatasetType.PYARROW,
1815
+ DatasetType.RAY_DATASET,
1816
+ ],
1817
+ ("map", "polars", "application/avro"): [
1818
+ DatasetType.PANDAS,
1819
+ DatasetType.POLARS,
1820
+ DatasetType.PYARROW,
1821
+ DatasetType.RAY_DATASET,
1822
+ ],
1823
+ ("map", "polars", "application/feather"): [DatasetType.PANDAS, DatasetType.POLARS],
1824
+ ("map", "polars", "application/orc"): [
1825
+ DatasetType.PANDAS,
1826
+ DatasetType.POLARS,
1827
+ DatasetType.PYARROW,
1828
+ DatasetType.RAY_DATASET,
1829
+ ],
1830
+ ("map", "polars", "application/parquet"): [
1831
+ DatasetType.DAFT,
1832
+ DatasetType.PANDAS,
1833
+ DatasetType.POLARS,
1834
+ DatasetType.PYARROW,
1835
+ DatasetType.RAY_DATASET,
1836
+ ],
1837
+ ("map", "pyarrow", "application/avro"): [
1838
+ DatasetType.PANDAS,
1839
+ DatasetType.RAY_DATASET,
1840
+ ],
1841
+ ("map", "pyarrow", "application/feather"): [
1842
+ DatasetType.PANDAS,
1843
+ DatasetType.PYARROW,
1844
+ DatasetType.RAY_DATASET,
1845
+ ],
1846
+ ("map", "pyarrow", "application/orc"): [
1847
+ DatasetType.PANDAS,
1848
+ DatasetType.PYARROW,
1849
+ DatasetType.RAY_DATASET,
1850
+ ],
1851
+ ("map", "pyarrow", "application/parquet"): [
1852
+ DatasetType.DAFT,
1853
+ DatasetType.PANDAS,
1854
+ DatasetType.PYARROW,
1855
+ DatasetType.RAY_DATASET,
1856
+ ],
1857
+ ("map", "ray_dataset", "application/parquet"): [
1858
+ DatasetType.DAFT,
1859
+ DatasetType.PANDAS,
1860
+ DatasetType.PYARROW,
1861
+ DatasetType.RAY_DATASET,
1862
+ ],
1863
+ ("month_day_nano_interval", "pandas", "application/feather"): [
1864
+ DatasetType.PANDAS,
1865
+ DatasetType.PYARROW,
1866
+ DatasetType.RAY_DATASET,
1867
+ ],
1868
+ ("month_day_nano_interval", "pyarrow", "application/feather"): [
1869
+ DatasetType.PANDAS,
1870
+ DatasetType.PYARROW,
1871
+ DatasetType.RAY_DATASET,
1872
+ ],
1873
+ ("null", "daft", "application/parquet"): [
1874
+ DatasetType.DAFT,
1875
+ DatasetType.PANDAS,
1876
+ DatasetType.POLARS,
1877
+ DatasetType.PYARROW,
1878
+ DatasetType.RAY_DATASET,
1879
+ ],
1880
+ ("null", "pandas", "application/avro"): [
1881
+ DatasetType.PANDAS,
1882
+ DatasetType.RAY_DATASET,
1883
+ ],
1884
+ ("null", "pandas", "application/feather"): [
1885
+ DatasetType.PANDAS,
1886
+ DatasetType.POLARS,
1887
+ DatasetType.PYARROW,
1888
+ DatasetType.RAY_DATASET,
1889
+ ],
1890
+ ("null", "pandas", "application/parquet"): [
1891
+ DatasetType.DAFT,
1892
+ DatasetType.PANDAS,
1893
+ DatasetType.POLARS,
1894
+ DatasetType.PYARROW,
1895
+ DatasetType.RAY_DATASET,
1896
+ ],
1897
+ ("null", "polars", "application/feather"): [
1898
+ DatasetType.PANDAS,
1899
+ DatasetType.POLARS,
1900
+ DatasetType.PYARROW,
1901
+ DatasetType.RAY_DATASET,
1902
+ ],
1903
+ ("null", "polars", "application/parquet"): [
1904
+ DatasetType.DAFT,
1905
+ DatasetType.PANDAS,
1906
+ DatasetType.POLARS,
1907
+ DatasetType.PYARROW,
1908
+ DatasetType.RAY_DATASET,
1909
+ ],
1910
+ ("null", "pyarrow", "application/feather"): [
1911
+ DatasetType.PANDAS,
1912
+ DatasetType.POLARS,
1913
+ DatasetType.PYARROW,
1914
+ DatasetType.RAY_DATASET,
1915
+ ],
1916
+ ("null", "pyarrow", "application/parquet"): [
1917
+ DatasetType.DAFT,
1918
+ DatasetType.PANDAS,
1919
+ DatasetType.POLARS,
1920
+ DatasetType.PYARROW,
1921
+ DatasetType.RAY_DATASET,
1922
+ ],
1923
+ ("null", "ray_dataset", "application/parquet"): [
1924
+ DatasetType.DAFT,
1925
+ DatasetType.PANDAS,
1926
+ DatasetType.POLARS,
1927
+ DatasetType.PYARROW,
1928
+ DatasetType.RAY_DATASET,
1929
+ ],
1930
+ ("string", "daft", "application/parquet"): [
1931
+ DatasetType.DAFT,
1932
+ DatasetType.PANDAS,
1933
+ DatasetType.POLARS,
1934
+ DatasetType.PYARROW,
1935
+ DatasetType.RAY_DATASET,
1936
+ ],
1937
+ ("string", "pandas", "application/avro"): [
1938
+ DatasetType.PANDAS,
1939
+ DatasetType.POLARS,
1940
+ DatasetType.PYARROW,
1941
+ DatasetType.RAY_DATASET,
1942
+ ],
1943
+ ("string", "pandas", "application/feather"): [
1944
+ DatasetType.PANDAS,
1945
+ DatasetType.POLARS,
1946
+ DatasetType.PYARROW,
1947
+ DatasetType.RAY_DATASET,
1948
+ ],
1949
+ ("string", "pandas", "application/orc"): [
1950
+ DatasetType.PANDAS,
1951
+ DatasetType.POLARS,
1952
+ DatasetType.PYARROW,
1953
+ DatasetType.RAY_DATASET,
1954
+ ],
1955
+ ("string", "pandas", "application/parquet"): [
1956
+ DatasetType.DAFT,
1957
+ DatasetType.PANDAS,
1958
+ DatasetType.POLARS,
1959
+ DatasetType.PYARROW,
1960
+ DatasetType.RAY_DATASET,
1961
+ ],
1962
+ ("string", "polars", "application/avro"): [
1963
+ DatasetType.PANDAS,
1964
+ DatasetType.POLARS,
1965
+ DatasetType.PYARROW,
1966
+ DatasetType.RAY_DATASET,
1967
+ ],
1968
+ ("string", "polars", "application/feather"): [
1969
+ DatasetType.PANDAS,
1970
+ DatasetType.POLARS,
1971
+ DatasetType.RAY_DATASET,
1972
+ ],
1973
+ ("string", "polars", "application/orc"): [
1974
+ DatasetType.PANDAS,
1975
+ DatasetType.POLARS,
1976
+ DatasetType.PYARROW,
1977
+ DatasetType.RAY_DATASET,
1978
+ ],
1979
+ ("string", "polars", "application/parquet"): [
1980
+ DatasetType.DAFT,
1981
+ DatasetType.PANDAS,
1982
+ DatasetType.POLARS,
1983
+ DatasetType.PYARROW,
1984
+ DatasetType.RAY_DATASET,
1985
+ ],
1986
+ ("string", "pyarrow", "application/avro"): [
1987
+ DatasetType.PANDAS,
1988
+ DatasetType.POLARS,
1989
+ DatasetType.PYARROW,
1990
+ DatasetType.RAY_DATASET,
1991
+ ],
1992
+ ("string", "pyarrow", "application/feather"): [
1993
+ DatasetType.PANDAS,
1994
+ DatasetType.POLARS,
1995
+ DatasetType.PYARROW,
1996
+ DatasetType.RAY_DATASET,
1997
+ ],
1998
+ ("string", "pyarrow", "application/orc"): [
1999
+ DatasetType.PANDAS,
2000
+ DatasetType.POLARS,
2001
+ DatasetType.PYARROW,
2002
+ DatasetType.RAY_DATASET,
2003
+ ],
2004
+ ("string", "pyarrow", "application/parquet"): [
2005
+ DatasetType.DAFT,
2006
+ DatasetType.PANDAS,
2007
+ DatasetType.POLARS,
2008
+ DatasetType.PYARROW,
2009
+ DatasetType.RAY_DATASET,
2010
+ ],
2011
+ ("string", "ray_dataset", "application/parquet"): [
2012
+ DatasetType.DAFT,
2013
+ DatasetType.PANDAS,
2014
+ DatasetType.POLARS,
2015
+ DatasetType.PYARROW,
2016
+ DatasetType.RAY_DATASET,
2017
+ ],
2018
+ ("struct", "daft", "application/parquet"): [
2019
+ DatasetType.DAFT,
2020
+ DatasetType.PANDAS,
2021
+ DatasetType.POLARS,
2022
+ DatasetType.PYARROW,
2023
+ DatasetType.RAY_DATASET,
2024
+ ],
2025
+ ("struct", "pandas", "application/avro"): [
2026
+ DatasetType.PANDAS,
2027
+ DatasetType.POLARS,
2028
+ DatasetType.PYARROW,
2029
+ DatasetType.RAY_DATASET,
2030
+ ],
2031
+ ("struct", "pandas", "application/feather"): [
2032
+ DatasetType.PANDAS,
2033
+ DatasetType.POLARS,
2034
+ DatasetType.PYARROW,
2035
+ DatasetType.RAY_DATASET,
2036
+ ],
2037
+ ("struct", "pandas", "application/orc"): [
2038
+ DatasetType.PANDAS,
2039
+ DatasetType.POLARS,
2040
+ DatasetType.PYARROW,
2041
+ DatasetType.RAY_DATASET,
2042
+ ],
2043
+ ("struct", "pandas", "application/parquet"): [
2044
+ DatasetType.DAFT,
2045
+ DatasetType.PANDAS,
2046
+ DatasetType.POLARS,
2047
+ DatasetType.PYARROW,
2048
+ DatasetType.RAY_DATASET,
2049
+ ],
2050
+ ("struct", "polars", "application/avro"): [
2051
+ DatasetType.PANDAS,
2052
+ DatasetType.POLARS,
2053
+ DatasetType.PYARROW,
2054
+ DatasetType.RAY_DATASET,
2055
+ ],
2056
+ ("struct", "polars", "application/feather"): [
2057
+ DatasetType.PANDAS,
2058
+ DatasetType.POLARS,
2059
+ ],
2060
+ ("struct", "polars", "application/orc"): [
2061
+ DatasetType.PANDAS,
2062
+ DatasetType.PYARROW,
2063
+ DatasetType.RAY_DATASET,
2064
+ ],
2065
+ ("struct", "polars", "application/parquet"): [
2066
+ DatasetType.DAFT,
2067
+ DatasetType.PANDAS,
2068
+ DatasetType.POLARS,
2069
+ DatasetType.PYARROW,
2070
+ DatasetType.RAY_DATASET,
2071
+ ],
2072
+ ("struct", "pyarrow", "application/avro"): [
2073
+ DatasetType.PANDAS,
2074
+ DatasetType.POLARS,
2075
+ DatasetType.PYARROW,
2076
+ DatasetType.RAY_DATASET,
2077
+ ],
2078
+ ("struct", "pyarrow", "application/feather"): [
2079
+ DatasetType.PANDAS,
2080
+ DatasetType.POLARS,
2081
+ DatasetType.PYARROW,
2082
+ DatasetType.RAY_DATASET,
2083
+ ],
2084
+ ("struct", "pyarrow", "application/orc"): [
2085
+ DatasetType.PANDAS,
2086
+ DatasetType.PYARROW,
2087
+ DatasetType.RAY_DATASET,
2088
+ ],
2089
+ ("struct", "pyarrow", "application/parquet"): [
2090
+ DatasetType.DAFT,
2091
+ DatasetType.PANDAS,
2092
+ DatasetType.POLARS,
2093
+ DatasetType.PYARROW,
2094
+ DatasetType.RAY_DATASET,
2095
+ ],
2096
+ ("struct", "ray_dataset", "application/parquet"): [
2097
+ DatasetType.DAFT,
2098
+ DatasetType.PANDAS,
2099
+ DatasetType.POLARS,
2100
+ DatasetType.PYARROW,
2101
+ DatasetType.RAY_DATASET,
2102
+ ],
2103
+ ("time32[ms]", "polars", "application/feather"): [
2104
+ DatasetType.PANDAS,
2105
+ DatasetType.POLARS,
2106
+ DatasetType.PYARROW,
2107
+ DatasetType.RAY_DATASET,
2108
+ ],
2109
+ ("time32[ms]", "polars", "application/parquet"): [
2110
+ DatasetType.DAFT,
2111
+ DatasetType.PANDAS,
2112
+ DatasetType.POLARS,
2113
+ DatasetType.PYARROW,
2114
+ DatasetType.RAY_DATASET,
2115
+ ],
2116
+ ("time32[ms]", "pyarrow", "application/feather"): [
2117
+ DatasetType.POLARS,
2118
+ DatasetType.PYARROW,
2119
+ DatasetType.RAY_DATASET,
2120
+ ],
2121
+ ("time32[ms]", "pyarrow", "application/parquet"): [
2122
+ DatasetType.DAFT,
2123
+ DatasetType.POLARS,
2124
+ DatasetType.PYARROW,
2125
+ DatasetType.RAY_DATASET,
2126
+ ],
2127
+ ("time32[s]", "polars", "application/feather"): [
2128
+ DatasetType.PANDAS,
2129
+ DatasetType.POLARS,
2130
+ DatasetType.PYARROW,
2131
+ DatasetType.RAY_DATASET,
2132
+ ],
2133
+ ("time32[s]", "polars", "application/parquet"): [
2134
+ DatasetType.DAFT,
2135
+ DatasetType.PANDAS,
2136
+ DatasetType.POLARS,
2137
+ DatasetType.PYARROW,
2138
+ DatasetType.RAY_DATASET,
2139
+ ],
2140
+ ("time32[s]", "pyarrow", "application/feather"): [
2141
+ DatasetType.POLARS,
2142
+ DatasetType.PYARROW,
2143
+ DatasetType.RAY_DATASET,
2144
+ ],
2145
+ ("time32[s]", "pyarrow", "application/parquet"): [
2146
+ DatasetType.DAFT,
2147
+ DatasetType.POLARS,
2148
+ DatasetType.RAY_DATASET,
2149
+ ],
2150
+ ("time64[ns]", "daft", "application/parquet"): [
2151
+ DatasetType.DAFT,
2152
+ DatasetType.POLARS,
2153
+ DatasetType.PYARROW,
2154
+ DatasetType.RAY_DATASET,
2155
+ ],
2156
+ ("time64[ns]", "polars", "application/feather"): [
2157
+ DatasetType.PANDAS,
2158
+ DatasetType.POLARS,
2159
+ DatasetType.PYARROW,
2160
+ DatasetType.RAY_DATASET,
2161
+ ],
2162
+ ("time64[ns]", "polars", "application/parquet"): [
2163
+ DatasetType.DAFT,
2164
+ DatasetType.PANDAS,
2165
+ DatasetType.POLARS,
2166
+ DatasetType.PYARROW,
2167
+ DatasetType.RAY_DATASET,
2168
+ ],
2169
+ ("time64[ns]", "pyarrow", "application/feather"): [
2170
+ DatasetType.POLARS,
2171
+ DatasetType.PYARROW,
2172
+ DatasetType.RAY_DATASET,
2173
+ ],
2174
+ ("time64[ns]", "pyarrow", "application/parquet"): [
2175
+ DatasetType.DAFT,
2176
+ DatasetType.POLARS,
2177
+ DatasetType.PYARROW,
2178
+ DatasetType.RAY_DATASET,
2179
+ ],
2180
+ ("time64[ns]", "ray_dataset", "application/parquet"): [
2181
+ DatasetType.DAFT,
2182
+ DatasetType.POLARS,
2183
+ DatasetType.PYARROW,
2184
+ DatasetType.RAY_DATASET,
2185
+ ],
2186
+ ("time64[us]", "daft", "application/parquet"): [
2187
+ DatasetType.DAFT,
2188
+ DatasetType.POLARS,
2189
+ DatasetType.PYARROW,
2190
+ DatasetType.RAY_DATASET,
2191
+ ],
2192
+ ("time64[us]", "polars", "application/feather"): [
2193
+ DatasetType.PANDAS,
2194
+ DatasetType.POLARS,
2195
+ DatasetType.PYARROW,
2196
+ DatasetType.RAY_DATASET,
2197
+ ],
2198
+ ("time64[us]", "polars", "application/parquet"): [
2199
+ DatasetType.DAFT,
2200
+ DatasetType.PANDAS,
2201
+ DatasetType.POLARS,
2202
+ DatasetType.PYARROW,
2203
+ DatasetType.RAY_DATASET,
2204
+ ],
2205
+ ("time64[us]", "pyarrow", "application/feather"): [
2206
+ DatasetType.POLARS,
2207
+ DatasetType.PYARROW,
2208
+ DatasetType.RAY_DATASET,
2209
+ ],
2210
+ ("time64[us]", "pyarrow", "application/parquet"): [
2211
+ DatasetType.DAFT,
2212
+ DatasetType.POLARS,
2213
+ DatasetType.PYARROW,
2214
+ DatasetType.RAY_DATASET,
2215
+ ],
2216
+ ("time64[us]", "ray_dataset", "application/parquet"): [
2217
+ DatasetType.DAFT,
2218
+ DatasetType.POLARS,
2219
+ DatasetType.PYARROW,
2220
+ DatasetType.RAY_DATASET,
2221
+ ],
2222
+ ("timestamp[ms]", "daft", "application/parquet"): [
2223
+ DatasetType.DAFT,
2224
+ DatasetType.PANDAS,
2225
+ DatasetType.POLARS,
2226
+ DatasetType.PYARROW,
2227
+ DatasetType.RAY_DATASET,
2228
+ ],
2229
+ ("timestamp[ms]", "pandas", "application/avro"): [
2230
+ DatasetType.PANDAS,
2231
+ DatasetType.POLARS,
2232
+ DatasetType.PYARROW,
2233
+ DatasetType.RAY_DATASET,
2234
+ ],
2235
+ ("timestamp[ms]", "pandas", "application/feather"): [
2236
+ DatasetType.PANDAS,
2237
+ DatasetType.POLARS,
2238
+ DatasetType.PYARROW,
2239
+ DatasetType.RAY_DATASET,
2240
+ ],
2241
+ ("timestamp[ms]", "pandas", "application/orc"): [
2242
+ DatasetType.PANDAS,
2243
+ DatasetType.POLARS,
2244
+ DatasetType.PYARROW,
2245
+ DatasetType.RAY_DATASET,
2246
+ ],
2247
+ ("timestamp[ms]", "pandas", "application/parquet"): [
2248
+ DatasetType.DAFT,
2249
+ DatasetType.PANDAS,
2250
+ DatasetType.POLARS,
2251
+ DatasetType.PYARROW,
2252
+ DatasetType.RAY_DATASET,
2253
+ ],
2254
+ ("timestamp[ms]", "polars", "application/avro"): [
2255
+ DatasetType.PANDAS,
2256
+ DatasetType.POLARS,
2257
+ DatasetType.PYARROW,
2258
+ DatasetType.RAY_DATASET,
2259
+ ],
2260
+ ("timestamp[ms]", "polars", "application/feather"): [
2261
+ DatasetType.PANDAS,
2262
+ DatasetType.POLARS,
2263
+ DatasetType.PYARROW,
2264
+ DatasetType.RAY_DATASET,
2265
+ ],
2266
+ ("timestamp[ms]", "polars", "application/orc"): [
2267
+ DatasetType.PANDAS,
2268
+ DatasetType.POLARS,
2269
+ DatasetType.PYARROW,
2270
+ DatasetType.RAY_DATASET,
2271
+ ],
2272
+ ("timestamp[ms]", "polars", "application/parquet"): [
2273
+ DatasetType.DAFT,
2274
+ DatasetType.PANDAS,
2275
+ DatasetType.POLARS,
2276
+ DatasetType.PYARROW,
2277
+ DatasetType.RAY_DATASET,
2278
+ ],
2279
+ ("timestamp[ms]", "pyarrow", "application/avro"): [
2280
+ DatasetType.PANDAS,
2281
+ DatasetType.POLARS,
2282
+ DatasetType.PYARROW,
2283
+ DatasetType.RAY_DATASET,
2284
+ ],
2285
+ ("timestamp[ms]", "pyarrow", "application/feather"): [
2286
+ DatasetType.PANDAS,
2287
+ DatasetType.POLARS,
2288
+ DatasetType.PYARROW,
2289
+ DatasetType.RAY_DATASET,
2290
+ ],
2291
+ ("timestamp[ms]", "pyarrow", "application/orc"): [
2292
+ DatasetType.PANDAS,
2293
+ DatasetType.POLARS,
2294
+ DatasetType.PYARROW,
2295
+ DatasetType.RAY_DATASET,
2296
+ ],
2297
+ ("timestamp[ms]", "pyarrow", "application/parquet"): [
2298
+ DatasetType.DAFT,
2299
+ DatasetType.PANDAS,
2300
+ DatasetType.POLARS,
2301
+ DatasetType.PYARROW,
2302
+ DatasetType.RAY_DATASET,
2303
+ ],
2304
+ ("timestamp[ms]", "ray_dataset", "application/parquet"): [
2305
+ DatasetType.DAFT,
2306
+ DatasetType.PANDAS,
2307
+ DatasetType.POLARS,
2308
+ DatasetType.PYARROW,
2309
+ DatasetType.RAY_DATASET,
2310
+ ],
2311
+ ("timestamp[ns]", "daft", "application/parquet"): [
2312
+ DatasetType.DAFT,
2313
+ DatasetType.PANDAS,
2314
+ DatasetType.POLARS,
2315
+ DatasetType.PYARROW,
2316
+ DatasetType.RAY_DATASET,
2317
+ ],
2318
+ ("timestamp[ns]", "pandas", "application/feather"): [
2319
+ DatasetType.PANDAS,
2320
+ DatasetType.POLARS,
2321
+ DatasetType.PYARROW,
2322
+ DatasetType.RAY_DATASET,
2323
+ ],
2324
+ ("timestamp[ns]", "pandas", "application/orc"): [
2325
+ DatasetType.PANDAS,
2326
+ DatasetType.POLARS,
2327
+ DatasetType.PYARROW,
2328
+ DatasetType.RAY_DATASET,
2329
+ ],
2330
+ ("timestamp[ns]", "pandas", "application/parquet"): [
2331
+ DatasetType.DAFT,
2332
+ DatasetType.PANDAS,
2333
+ DatasetType.POLARS,
2334
+ DatasetType.PYARROW,
2335
+ DatasetType.RAY_DATASET,
2336
+ ],
2337
+ ("timestamp[ns]", "polars", "application/feather"): [
2338
+ DatasetType.PANDAS,
2339
+ DatasetType.POLARS,
2340
+ DatasetType.PYARROW,
2341
+ DatasetType.RAY_DATASET,
2342
+ ],
2343
+ ("timestamp[ns]", "polars", "application/orc"): [
2344
+ DatasetType.PANDAS,
2345
+ DatasetType.POLARS,
2346
+ DatasetType.PYARROW,
2347
+ DatasetType.RAY_DATASET,
2348
+ ],
2349
+ ("timestamp[ns]", "polars", "application/parquet"): [
2350
+ DatasetType.DAFT,
2351
+ DatasetType.PANDAS,
2352
+ DatasetType.POLARS,
2353
+ DatasetType.PYARROW,
2354
+ DatasetType.RAY_DATASET,
2355
+ ],
2356
+ ("timestamp[ns]", "pyarrow", "application/feather"): [
2357
+ DatasetType.PANDAS,
2358
+ DatasetType.POLARS,
2359
+ DatasetType.PYARROW,
2360
+ DatasetType.RAY_DATASET,
2361
+ ],
2362
+ ("timestamp[ns]", "pyarrow", "application/orc"): [
2363
+ DatasetType.PANDAS,
2364
+ DatasetType.POLARS,
2365
+ DatasetType.PYARROW,
2366
+ DatasetType.RAY_DATASET,
2367
+ ],
2368
+ ("timestamp[ns]", "pyarrow", "application/parquet"): [
2369
+ DatasetType.DAFT,
2370
+ DatasetType.PANDAS,
2371
+ DatasetType.POLARS,
2372
+ DatasetType.PYARROW,
2373
+ DatasetType.RAY_DATASET,
2374
+ ],
2375
+ ("timestamp[ns]", "ray_dataset", "application/parquet"): [
2376
+ DatasetType.DAFT,
2377
+ DatasetType.PANDAS,
2378
+ DatasetType.POLARS,
2379
+ DatasetType.PYARROW,
2380
+ DatasetType.RAY_DATASET,
2381
+ ],
2382
+ ("timestamp[s]", "daft", "application/parquet"): [
2383
+ DatasetType.DAFT,
2384
+ DatasetType.PANDAS,
2385
+ DatasetType.POLARS,
2386
+ DatasetType.PYARROW,
2387
+ DatasetType.RAY_DATASET,
2388
+ ],
2389
+ ("timestamp[s]", "pandas", "application/avro"): [
2390
+ DatasetType.PANDAS,
2391
+ DatasetType.POLARS,
2392
+ DatasetType.PYARROW,
2393
+ DatasetType.RAY_DATASET,
2394
+ ],
2395
+ ("timestamp[s]", "pandas", "application/feather"): [
2396
+ DatasetType.PANDAS,
2397
+ DatasetType.POLARS,
2398
+ DatasetType.PYARROW,
2399
+ DatasetType.RAY_DATASET,
2400
+ ],
2401
+ ("timestamp[s]", "pandas", "application/orc"): [
2402
+ DatasetType.PANDAS,
2403
+ DatasetType.POLARS,
2404
+ DatasetType.PYARROW,
2405
+ DatasetType.RAY_DATASET,
2406
+ ],
2407
+ ("timestamp[s]", "pandas", "application/parquet"): [
2408
+ DatasetType.DAFT,
2409
+ DatasetType.PANDAS,
2410
+ DatasetType.POLARS,
2411
+ DatasetType.PYARROW,
2412
+ DatasetType.RAY_DATASET,
2413
+ ],
2414
+ ("timestamp[s]", "polars", "application/avro"): [
2415
+ DatasetType.PANDAS,
2416
+ DatasetType.POLARS,
2417
+ DatasetType.PYARROW,
2418
+ DatasetType.RAY_DATASET,
2419
+ ],
2420
+ ("timestamp[s]", "polars", "application/feather"): [
2421
+ DatasetType.PANDAS,
2422
+ DatasetType.POLARS,
2423
+ DatasetType.PYARROW,
2424
+ DatasetType.RAY_DATASET,
2425
+ ],
2426
+ ("timestamp[s]", "polars", "application/orc"): [
2427
+ DatasetType.PANDAS,
2428
+ DatasetType.POLARS,
2429
+ DatasetType.PYARROW,
2430
+ DatasetType.RAY_DATASET,
2431
+ ],
2432
+ ("timestamp[s]", "polars", "application/parquet"): [
2433
+ DatasetType.DAFT,
2434
+ DatasetType.PANDAS,
2435
+ DatasetType.POLARS,
2436
+ DatasetType.PYARROW,
2437
+ DatasetType.RAY_DATASET,
2438
+ ],
2439
+ ("timestamp[s]", "pyarrow", "application/avro"): [
2440
+ DatasetType.PANDAS,
2441
+ DatasetType.POLARS,
2442
+ DatasetType.PYARROW,
2443
+ DatasetType.RAY_DATASET,
2444
+ ],
2445
+ ("timestamp[s]", "pyarrow", "application/feather"): [
2446
+ DatasetType.PANDAS,
2447
+ DatasetType.POLARS,
2448
+ DatasetType.PYARROW,
2449
+ DatasetType.RAY_DATASET,
2450
+ ],
2451
+ ("timestamp[s]", "pyarrow", "application/orc"): [
2452
+ DatasetType.PANDAS,
2453
+ DatasetType.POLARS,
2454
+ DatasetType.PYARROW,
2455
+ DatasetType.RAY_DATASET,
2456
+ ],
2457
+ ("timestamp[s]", "pyarrow", "application/parquet"): [
2458
+ DatasetType.DAFT,
2459
+ DatasetType.PANDAS,
2460
+ DatasetType.POLARS,
2461
+ DatasetType.PYARROW,
2462
+ DatasetType.RAY_DATASET,
2463
+ ],
2464
+ ("timestamp[s]", "ray_dataset", "application/parquet"): [
2465
+ DatasetType.DAFT,
2466
+ DatasetType.PANDAS,
2467
+ DatasetType.POLARS,
2468
+ DatasetType.PYARROW,
2469
+ DatasetType.RAY_DATASET,
2470
+ ],
2471
+ ("timestamp[us]", "daft", "application/parquet"): [
2472
+ DatasetType.DAFT,
2473
+ DatasetType.PANDAS,
2474
+ DatasetType.POLARS,
2475
+ DatasetType.PYARROW,
2476
+ DatasetType.RAY_DATASET,
2477
+ ],
2478
+ ("timestamp[us]", "pandas", "application/avro"): [
2479
+ DatasetType.PANDAS,
2480
+ DatasetType.POLARS,
2481
+ DatasetType.PYARROW,
2482
+ DatasetType.RAY_DATASET,
2483
+ ],
2484
+ ("timestamp[us]", "pandas", "application/feather"): [
2485
+ DatasetType.PANDAS,
2486
+ DatasetType.POLARS,
2487
+ DatasetType.PYARROW,
2488
+ DatasetType.RAY_DATASET,
2489
+ ],
2490
+ ("timestamp[us]", "pandas", "application/orc"): [
2491
+ DatasetType.PANDAS,
2492
+ DatasetType.POLARS,
2493
+ DatasetType.PYARROW,
2494
+ DatasetType.RAY_DATASET,
2495
+ ],
2496
+ ("timestamp[us]", "pandas", "application/parquet"): [
2497
+ DatasetType.DAFT,
2498
+ DatasetType.PANDAS,
2499
+ DatasetType.POLARS,
2500
+ DatasetType.PYARROW,
2501
+ DatasetType.RAY_DATASET,
2502
+ ],
2503
+ ("timestamp[us]", "polars", "application/avro"): [
2504
+ DatasetType.PANDAS,
2505
+ DatasetType.POLARS,
2506
+ DatasetType.PYARROW,
2507
+ DatasetType.RAY_DATASET,
2508
+ ],
2509
+ ("timestamp[us]", "polars", "application/feather"): [
2510
+ DatasetType.PANDAS,
2511
+ DatasetType.POLARS,
2512
+ DatasetType.PYARROW,
2513
+ DatasetType.RAY_DATASET,
2514
+ ],
2515
+ ("timestamp[us]", "polars", "application/orc"): [
2516
+ DatasetType.PANDAS,
2517
+ DatasetType.POLARS,
2518
+ DatasetType.PYARROW,
2519
+ DatasetType.RAY_DATASET,
2520
+ ],
2521
+ ("timestamp[us]", "polars", "application/parquet"): [
2522
+ DatasetType.DAFT,
2523
+ DatasetType.PANDAS,
2524
+ DatasetType.POLARS,
2525
+ DatasetType.PYARROW,
2526
+ DatasetType.RAY_DATASET,
2527
+ ],
2528
+ ("timestamp[us]", "pyarrow", "application/avro"): [
2529
+ DatasetType.PANDAS,
2530
+ DatasetType.POLARS,
2531
+ DatasetType.PYARROW,
2532
+ DatasetType.RAY_DATASET,
2533
+ ],
2534
+ ("timestamp[us]", "pyarrow", "application/feather"): [
2535
+ DatasetType.PANDAS,
2536
+ DatasetType.POLARS,
2537
+ DatasetType.PYARROW,
2538
+ DatasetType.RAY_DATASET,
2539
+ ],
2540
+ ("timestamp[us]", "pyarrow", "application/orc"): [
2541
+ DatasetType.PANDAS,
2542
+ DatasetType.POLARS,
2543
+ DatasetType.PYARROW,
2544
+ DatasetType.RAY_DATASET,
2545
+ ],
2546
+ ("timestamp[us]", "pyarrow", "application/parquet"): [
2547
+ DatasetType.DAFT,
2548
+ DatasetType.PANDAS,
2549
+ DatasetType.POLARS,
2550
+ DatasetType.PYARROW,
2551
+ DatasetType.RAY_DATASET,
2552
+ ],
2553
+ ("timestamp[us]", "ray_dataset", "application/parquet"): [
2554
+ DatasetType.DAFT,
2555
+ DatasetType.PANDAS,
2556
+ DatasetType.POLARS,
2557
+ DatasetType.PYARROW,
2558
+ DatasetType.RAY_DATASET,
2559
+ ],
2560
+ ("timestamp_tz[ms]", "daft", "application/parquet"): [
2561
+ DatasetType.DAFT,
2562
+ DatasetType.PANDAS,
2563
+ DatasetType.POLARS,
2564
+ DatasetType.PYARROW,
2565
+ DatasetType.RAY_DATASET,
2566
+ ],
2567
+ ("timestamp_tz[ms]", "pandas", "application/feather"): [
2568
+ DatasetType.PANDAS,
2569
+ DatasetType.POLARS,
2570
+ DatasetType.PYARROW,
2571
+ DatasetType.RAY_DATASET,
2572
+ ],
2573
+ ("timestamp_tz[ms]", "pandas", "application/orc"): [
2574
+ DatasetType.PANDAS,
2575
+ DatasetType.POLARS,
2576
+ DatasetType.PYARROW,
2577
+ DatasetType.RAY_DATASET,
2578
+ ],
2579
+ ("timestamp_tz[ms]", "pandas", "application/parquet"): [
2580
+ DatasetType.DAFT,
2581
+ DatasetType.PANDAS,
2582
+ DatasetType.POLARS,
2583
+ DatasetType.PYARROW,
2584
+ DatasetType.RAY_DATASET,
2585
+ ],
2586
+ ("timestamp_tz[ms]", "polars", "application/feather"): [
2587
+ DatasetType.PANDAS,
2588
+ DatasetType.POLARS,
2589
+ DatasetType.PYARROW,
2590
+ DatasetType.RAY_DATASET,
2591
+ ],
2592
+ ("timestamp_tz[ms]", "polars", "application/orc"): [
2593
+ DatasetType.PANDAS,
2594
+ DatasetType.POLARS,
2595
+ DatasetType.PYARROW,
2596
+ DatasetType.RAY_DATASET,
2597
+ ],
2598
+ ("timestamp_tz[ms]", "polars", "application/parquet"): [
2599
+ DatasetType.DAFT,
2600
+ DatasetType.PANDAS,
2601
+ DatasetType.POLARS,
2602
+ DatasetType.PYARROW,
2603
+ DatasetType.RAY_DATASET,
2604
+ ],
2605
+ ("timestamp_tz[ms]", "pyarrow", "application/feather"): [
2606
+ DatasetType.PANDAS,
2607
+ DatasetType.POLARS,
2608
+ DatasetType.PYARROW,
2609
+ DatasetType.RAY_DATASET,
2610
+ ],
2611
+ ("timestamp_tz[ms]", "pyarrow", "application/orc"): [
2612
+ DatasetType.PANDAS,
2613
+ DatasetType.POLARS,
2614
+ DatasetType.PYARROW,
2615
+ DatasetType.RAY_DATASET,
2616
+ ],
2617
+ ("timestamp_tz[ms]", "pyarrow", "application/parquet"): [
2618
+ DatasetType.DAFT,
2619
+ DatasetType.PANDAS,
2620
+ DatasetType.POLARS,
2621
+ DatasetType.PYARROW,
2622
+ DatasetType.RAY_DATASET,
2623
+ ],
2624
+ ("timestamp_tz[ms]", "ray_dataset", "application/parquet"): [
2625
+ DatasetType.DAFT,
2626
+ DatasetType.PANDAS,
2627
+ DatasetType.POLARS,
2628
+ DatasetType.PYARROW,
2629
+ DatasetType.RAY_DATASET,
2630
+ ],
2631
+ ("timestamp_tz[ns]", "daft", "application/parquet"): [
2632
+ DatasetType.DAFT,
2633
+ DatasetType.PANDAS,
2634
+ DatasetType.POLARS,
2635
+ DatasetType.PYARROW,
2636
+ DatasetType.RAY_DATASET,
2637
+ ],
2638
+ ("timestamp_tz[ns]", "pandas", "application/feather"): [
2639
+ DatasetType.PANDAS,
2640
+ DatasetType.POLARS,
2641
+ DatasetType.PYARROW,
2642
+ DatasetType.RAY_DATASET,
2643
+ ],
2644
+ ("timestamp_tz[ns]", "pandas", "application/orc"): [
2645
+ DatasetType.PANDAS,
2646
+ DatasetType.POLARS,
2647
+ DatasetType.PYARROW,
2648
+ DatasetType.RAY_DATASET,
2649
+ ],
2650
+ ("timestamp_tz[ns]", "pandas", "application/parquet"): [
2651
+ DatasetType.DAFT,
2652
+ DatasetType.PANDAS,
2653
+ DatasetType.POLARS,
2654
+ DatasetType.PYARROW,
2655
+ DatasetType.RAY_DATASET,
2656
+ ],
2657
+ ("timestamp_tz[ns]", "polars", "application/feather"): [
2658
+ DatasetType.PANDAS,
2659
+ DatasetType.POLARS,
2660
+ DatasetType.PYARROW,
2661
+ DatasetType.RAY_DATASET,
2662
+ ],
2663
+ ("timestamp_tz[ns]", "polars", "application/orc"): [
2664
+ DatasetType.PANDAS,
2665
+ DatasetType.POLARS,
2666
+ DatasetType.PYARROW,
2667
+ DatasetType.RAY_DATASET,
2668
+ ],
2669
+ ("timestamp_tz[ns]", "polars", "application/parquet"): [
2670
+ DatasetType.DAFT,
2671
+ DatasetType.PANDAS,
2672
+ DatasetType.POLARS,
2673
+ DatasetType.PYARROW,
2674
+ DatasetType.RAY_DATASET,
2675
+ ],
2676
+ ("timestamp_tz[ns]", "pyarrow", "application/feather"): [
2677
+ DatasetType.PANDAS,
2678
+ DatasetType.POLARS,
2679
+ DatasetType.PYARROW,
2680
+ DatasetType.RAY_DATASET,
2681
+ ],
2682
+ ("timestamp_tz[ns]", "pyarrow", "application/orc"): [
2683
+ DatasetType.PANDAS,
2684
+ DatasetType.POLARS,
2685
+ DatasetType.PYARROW,
2686
+ DatasetType.RAY_DATASET,
2687
+ ],
2688
+ ("timestamp_tz[ns]", "pyarrow", "application/parquet"): [
2689
+ DatasetType.DAFT,
2690
+ DatasetType.PANDAS,
2691
+ DatasetType.POLARS,
2692
+ DatasetType.PYARROW,
2693
+ DatasetType.RAY_DATASET,
2694
+ ],
2695
+ ("timestamp_tz[ns]", "ray_dataset", "application/parquet"): [
2696
+ DatasetType.DAFT,
2697
+ DatasetType.PANDAS,
2698
+ DatasetType.POLARS,
2699
+ DatasetType.PYARROW,
2700
+ DatasetType.RAY_DATASET,
2701
+ ],
2702
+ ("timestamp_tz[s]", "daft", "application/parquet"): [
2703
+ DatasetType.DAFT,
2704
+ DatasetType.PANDAS,
2705
+ DatasetType.POLARS,
2706
+ DatasetType.PYARROW,
2707
+ DatasetType.RAY_DATASET,
2708
+ ],
2709
+ ("timestamp_tz[s]", "pandas", "application/feather"): [
2710
+ DatasetType.PANDAS,
2711
+ DatasetType.POLARS,
2712
+ DatasetType.PYARROW,
2713
+ DatasetType.RAY_DATASET,
2714
+ ],
2715
+ ("timestamp_tz[s]", "pandas", "application/orc"): [
2716
+ DatasetType.PANDAS,
2717
+ DatasetType.POLARS,
2718
+ DatasetType.PYARROW,
2719
+ DatasetType.RAY_DATASET,
2720
+ ],
2721
+ ("timestamp_tz[s]", "pandas", "application/parquet"): [
2722
+ DatasetType.DAFT,
2723
+ DatasetType.PANDAS,
2724
+ DatasetType.POLARS,
2725
+ DatasetType.PYARROW,
2726
+ DatasetType.RAY_DATASET,
2727
+ ],
2728
+ ("timestamp_tz[s]", "polars", "application/feather"): [
2729
+ DatasetType.PANDAS,
2730
+ DatasetType.POLARS,
2731
+ DatasetType.PYARROW,
2732
+ DatasetType.RAY_DATASET,
2733
+ ],
2734
+ ("timestamp_tz[s]", "polars", "application/orc"): [
2735
+ DatasetType.PANDAS,
2736
+ DatasetType.POLARS,
2737
+ DatasetType.PYARROW,
2738
+ DatasetType.RAY_DATASET,
2739
+ ],
2740
+ ("timestamp_tz[s]", "polars", "application/parquet"): [
2741
+ DatasetType.DAFT,
2742
+ DatasetType.PANDAS,
2743
+ DatasetType.POLARS,
2744
+ DatasetType.PYARROW,
2745
+ DatasetType.RAY_DATASET,
2746
+ ],
2747
+ ("timestamp_tz[s]", "pyarrow", "application/feather"): [
2748
+ DatasetType.PANDAS,
2749
+ DatasetType.POLARS,
2750
+ DatasetType.PYARROW,
2751
+ DatasetType.RAY_DATASET,
2752
+ ],
2753
+ ("timestamp_tz[s]", "pyarrow", "application/orc"): [
2754
+ DatasetType.PANDAS,
2755
+ DatasetType.POLARS,
2756
+ DatasetType.PYARROW,
2757
+ DatasetType.RAY_DATASET,
2758
+ ],
2759
+ ("timestamp_tz[s]", "pyarrow", "application/parquet"): [
2760
+ DatasetType.DAFT,
2761
+ DatasetType.PANDAS,
2762
+ DatasetType.POLARS,
2763
+ DatasetType.PYARROW,
2764
+ DatasetType.RAY_DATASET,
2765
+ ],
2766
+ ("timestamp_tz[s]", "ray_dataset", "application/parquet"): [
2767
+ DatasetType.DAFT,
2768
+ DatasetType.PANDAS,
2769
+ DatasetType.POLARS,
2770
+ DatasetType.PYARROW,
2771
+ DatasetType.RAY_DATASET,
2772
+ ],
2773
+ ("timestamp_tz[us]", "daft", "application/parquet"): [
2774
+ DatasetType.DAFT,
2775
+ DatasetType.PANDAS,
2776
+ DatasetType.POLARS,
2777
+ DatasetType.PYARROW,
2778
+ DatasetType.RAY_DATASET,
2779
+ ],
2780
+ ("timestamp_tz[us]", "pandas", "application/feather"): [
2781
+ DatasetType.PANDAS,
2782
+ DatasetType.POLARS,
2783
+ DatasetType.PYARROW,
2784
+ DatasetType.RAY_DATASET,
2785
+ ],
2786
+ ("timestamp_tz[us]", "pandas", "application/orc"): [
2787
+ DatasetType.PANDAS,
2788
+ DatasetType.POLARS,
2789
+ DatasetType.PYARROW,
2790
+ DatasetType.RAY_DATASET,
2791
+ ],
2792
+ ("timestamp_tz[us]", "pandas", "application/parquet"): [
2793
+ DatasetType.DAFT,
2794
+ DatasetType.PANDAS,
2795
+ DatasetType.POLARS,
2796
+ DatasetType.PYARROW,
2797
+ DatasetType.RAY_DATASET,
2798
+ ],
2799
+ ("timestamp_tz[us]", "polars", "application/feather"): [
2800
+ DatasetType.PANDAS,
2801
+ DatasetType.POLARS,
2802
+ DatasetType.PYARROW,
2803
+ DatasetType.RAY_DATASET,
2804
+ ],
2805
+ ("timestamp_tz[us]", "polars", "application/orc"): [
2806
+ DatasetType.PANDAS,
2807
+ DatasetType.POLARS,
2808
+ DatasetType.PYARROW,
2809
+ DatasetType.RAY_DATASET,
2810
+ ],
2811
+ ("timestamp_tz[us]", "polars", "application/parquet"): [
2812
+ DatasetType.DAFT,
2813
+ DatasetType.PANDAS,
2814
+ DatasetType.POLARS,
2815
+ DatasetType.PYARROW,
2816
+ DatasetType.RAY_DATASET,
2817
+ ],
2818
+ ("timestamp_tz[us]", "pyarrow", "application/feather"): [
2819
+ DatasetType.PANDAS,
2820
+ DatasetType.POLARS,
2821
+ DatasetType.PYARROW,
2822
+ DatasetType.RAY_DATASET,
2823
+ ],
2824
+ ("timestamp_tz[us]", "pyarrow", "application/orc"): [
2825
+ DatasetType.PANDAS,
2826
+ DatasetType.POLARS,
2827
+ DatasetType.PYARROW,
2828
+ DatasetType.RAY_DATASET,
2829
+ ],
2830
+ ("timestamp_tz[us]", "pyarrow", "application/parquet"): [
2831
+ DatasetType.DAFT,
2832
+ DatasetType.PANDAS,
2833
+ DatasetType.POLARS,
2834
+ DatasetType.PYARROW,
2835
+ DatasetType.RAY_DATASET,
2836
+ ],
2837
+ ("timestamp_tz[us]", "ray_dataset", "application/parquet"): [
2838
+ DatasetType.DAFT,
2839
+ DatasetType.PANDAS,
2840
+ DatasetType.POLARS,
2841
+ DatasetType.PYARROW,
2842
+ DatasetType.RAY_DATASET,
2843
+ ],
2844
+ ("uint16", "daft", "application/parquet"): [
2845
+ DatasetType.DAFT,
2846
+ DatasetType.PANDAS,
2847
+ DatasetType.POLARS,
2848
+ DatasetType.PYARROW,
2849
+ DatasetType.RAY_DATASET,
2850
+ ],
2851
+ ("uint16", "pandas", "application/feather"): [
2852
+ DatasetType.PANDAS,
2853
+ DatasetType.POLARS,
2854
+ DatasetType.PYARROW,
2855
+ DatasetType.RAY_DATASET,
2856
+ ],
2857
+ ("uint16", "pandas", "application/parquet"): [
2858
+ DatasetType.DAFT,
2859
+ DatasetType.PANDAS,
2860
+ DatasetType.POLARS,
2861
+ DatasetType.PYARROW,
2862
+ DatasetType.RAY_DATASET,
2863
+ ],
2864
+ ("uint16", "polars", "application/feather"): [
2865
+ DatasetType.PANDAS,
2866
+ DatasetType.POLARS,
2867
+ DatasetType.PYARROW,
2868
+ DatasetType.RAY_DATASET,
2869
+ ],
2870
+ ("uint16", "polars", "application/parquet"): [
2871
+ DatasetType.DAFT,
2872
+ DatasetType.PANDAS,
2873
+ DatasetType.POLARS,
2874
+ DatasetType.PYARROW,
2875
+ DatasetType.RAY_DATASET,
2876
+ ],
2877
+ ("uint16", "pyarrow", "application/feather"): [
2878
+ DatasetType.PANDAS,
2879
+ DatasetType.POLARS,
2880
+ DatasetType.PYARROW,
2881
+ DatasetType.RAY_DATASET,
2882
+ ],
2883
+ ("uint16", "pyarrow", "application/parquet"): [
2884
+ DatasetType.DAFT,
2885
+ DatasetType.PANDAS,
2886
+ DatasetType.POLARS,
2887
+ DatasetType.PYARROW,
2888
+ DatasetType.RAY_DATASET,
2889
+ ],
2890
+ ("uint16", "ray_dataset", "application/parquet"): [
2891
+ DatasetType.DAFT,
2892
+ DatasetType.PANDAS,
2893
+ DatasetType.POLARS,
2894
+ DatasetType.PYARROW,
2895
+ DatasetType.RAY_DATASET,
2896
+ ],
2897
+ ("uint32", "daft", "application/parquet"): [
2898
+ DatasetType.DAFT,
2899
+ DatasetType.PANDAS,
2900
+ DatasetType.POLARS,
2901
+ DatasetType.PYARROW,
2902
+ DatasetType.RAY_DATASET,
2903
+ ],
2904
+ ("uint32", "pandas", "application/feather"): [
2905
+ DatasetType.PANDAS,
2906
+ DatasetType.POLARS,
2907
+ DatasetType.PYARROW,
2908
+ DatasetType.RAY_DATASET,
2909
+ ],
2910
+ ("uint32", "pandas", "application/parquet"): [
2911
+ DatasetType.DAFT,
2912
+ DatasetType.PANDAS,
2913
+ DatasetType.POLARS,
2914
+ DatasetType.PYARROW,
2915
+ DatasetType.RAY_DATASET,
2916
+ ],
2917
+ ("uint32", "polars", "application/feather"): [
2918
+ DatasetType.PANDAS,
2919
+ DatasetType.POLARS,
2920
+ DatasetType.PYARROW,
2921
+ DatasetType.RAY_DATASET,
2922
+ ],
2923
+ ("uint32", "polars", "application/parquet"): [
2924
+ DatasetType.DAFT,
2925
+ DatasetType.PANDAS,
2926
+ DatasetType.POLARS,
2927
+ DatasetType.PYARROW,
2928
+ DatasetType.RAY_DATASET,
2929
+ ],
2930
+ ("uint32", "pyarrow", "application/feather"): [
2931
+ DatasetType.PANDAS,
2932
+ DatasetType.POLARS,
2933
+ DatasetType.PYARROW,
2934
+ DatasetType.RAY_DATASET,
2935
+ ],
2936
+ ("uint32", "pyarrow", "application/parquet"): [
2937
+ DatasetType.DAFT,
2938
+ DatasetType.PANDAS,
2939
+ DatasetType.POLARS,
2940
+ DatasetType.PYARROW,
2941
+ DatasetType.RAY_DATASET,
2942
+ ],
2943
+ ("uint32", "ray_dataset", "application/parquet"): [
2944
+ DatasetType.DAFT,
2945
+ DatasetType.PANDAS,
2946
+ DatasetType.POLARS,
2947
+ DatasetType.PYARROW,
2948
+ DatasetType.RAY_DATASET,
2949
+ ],
2950
+ ("uint64", "daft", "application/parquet"): [
2951
+ DatasetType.DAFT,
2952
+ DatasetType.PANDAS,
2953
+ DatasetType.POLARS,
2954
+ DatasetType.PYARROW,
2955
+ DatasetType.RAY_DATASET,
2956
+ ],
2957
+ ("uint64", "pandas", "application/feather"): [
2958
+ DatasetType.PANDAS,
2959
+ DatasetType.POLARS,
2960
+ DatasetType.PYARROW,
2961
+ DatasetType.RAY_DATASET,
2962
+ ],
2963
+ ("uint64", "pandas", "application/parquet"): [
2964
+ DatasetType.DAFT,
2965
+ DatasetType.PANDAS,
2966
+ DatasetType.POLARS,
2967
+ DatasetType.PYARROW,
2968
+ DatasetType.RAY_DATASET,
2969
+ ],
2970
+ ("uint64", "polars", "application/feather"): [
2971
+ DatasetType.PANDAS,
2972
+ DatasetType.POLARS,
2973
+ DatasetType.PYARROW,
2974
+ DatasetType.RAY_DATASET,
2975
+ ],
2976
+ ("uint64", "polars", "application/parquet"): [
2977
+ DatasetType.DAFT,
2978
+ DatasetType.PANDAS,
2979
+ DatasetType.POLARS,
2980
+ DatasetType.PYARROW,
2981
+ DatasetType.RAY_DATASET,
2982
+ ],
2983
+ ("uint64", "pyarrow", "application/feather"): [
2984
+ DatasetType.PANDAS,
2985
+ DatasetType.POLARS,
2986
+ DatasetType.PYARROW,
2987
+ DatasetType.RAY_DATASET,
2988
+ ],
2989
+ ("uint64", "pyarrow", "application/parquet"): [
2990
+ DatasetType.DAFT,
2991
+ DatasetType.PANDAS,
2992
+ DatasetType.POLARS,
2993
+ DatasetType.PYARROW,
2994
+ DatasetType.RAY_DATASET,
2995
+ ],
2996
+ ("uint64", "ray_dataset", "application/parquet"): [
2997
+ DatasetType.DAFT,
2998
+ DatasetType.PANDAS,
2999
+ DatasetType.POLARS,
3000
+ DatasetType.PYARROW,
3001
+ DatasetType.RAY_DATASET,
3002
+ ],
3003
+ ("uint8", "daft", "application/parquet"): [
3004
+ DatasetType.DAFT,
3005
+ DatasetType.PANDAS,
3006
+ DatasetType.POLARS,
3007
+ DatasetType.PYARROW,
3008
+ DatasetType.RAY_DATASET,
3009
+ ],
3010
+ ("uint8", "pandas", "application/feather"): [
3011
+ DatasetType.PANDAS,
3012
+ DatasetType.POLARS,
3013
+ DatasetType.PYARROW,
3014
+ DatasetType.RAY_DATASET,
3015
+ ],
3016
+ ("uint8", "pandas", "application/parquet"): [
3017
+ DatasetType.DAFT,
3018
+ DatasetType.PANDAS,
3019
+ DatasetType.POLARS,
3020
+ DatasetType.PYARROW,
3021
+ DatasetType.RAY_DATASET,
3022
+ ],
3023
+ ("uint8", "polars", "application/feather"): [
3024
+ DatasetType.PANDAS,
3025
+ DatasetType.POLARS,
3026
+ DatasetType.PYARROW,
3027
+ DatasetType.RAY_DATASET,
3028
+ ],
3029
+ ("uint8", "polars", "application/parquet"): [
3030
+ DatasetType.DAFT,
3031
+ DatasetType.PANDAS,
3032
+ DatasetType.POLARS,
3033
+ DatasetType.PYARROW,
3034
+ DatasetType.RAY_DATASET,
3035
+ ],
3036
+ ("uint8", "pyarrow", "application/feather"): [
3037
+ DatasetType.PANDAS,
3038
+ DatasetType.POLARS,
3039
+ DatasetType.PYARROW,
3040
+ DatasetType.RAY_DATASET,
3041
+ ],
3042
+ ("uint8", "pyarrow", "application/parquet"): [
3043
+ DatasetType.DAFT,
3044
+ DatasetType.PANDAS,
3045
+ DatasetType.POLARS,
3046
+ DatasetType.PYARROW,
3047
+ DatasetType.RAY_DATASET,
3048
+ ],
3049
+ ("uint8", "ray_dataset", "application/parquet"): [
3050
+ DatasetType.DAFT,
3051
+ DatasetType.PANDAS,
3052
+ DatasetType.POLARS,
3053
+ DatasetType.PYARROW,
3054
+ DatasetType.RAY_DATASET,
3055
+ ],
3056
+ }
3057
+
3058
+
3059
def get_compatible_readers(
    arrow_type: str, writer_dataset_type: str, content_type: str
):
    """Look up the reader DatasetTypes able to read a written combination.

    The combination is the tuple ``(arrow_type, writer_dataset_type,
    content_type)``, used as a key into ``READER_COMPATIBILITY_MAPPING``.

    Args:
        arrow_type: Arrow type name as spelled in the mapping keys
            (e.g. ``"uint8"``).
        writer_dataset_type: Name of the dataset type that wrote the data
            (e.g. ``"pandas"``).
        content_type: Content type of the written data
            (e.g. ``"application/parquet"``).

    Returns:
        A list of compatible reader DatasetTypes; empty when the combination
        has no mapping entry. ``DatasetType.NUMPY`` is appended whenever
        ``DatasetType.PANDAS`` is listed and NUMPY is not already present.
        When nothing is appended, the returned list is the mapping's own
        entry rather than a copy, so callers should not mutate it.
    """
    readers = READER_COMPATIBILITY_MAPPING.get(
        (arrow_type, writer_dataset_type, content_type), []
    )
    # Nothing to add unless PANDAS is supported and NUMPY is still missing.
    if DatasetType.PANDAS not in readers or DatasetType.NUMPY in readers:
        return readers
    # Concatenate into a new list so the shared mapping entry stays untouched.
    return readers + [DatasetType.NUMPY]
3071
+
3072
+
3073
def is_reader_compatible(
    arrow_type: str,
    writer_dataset_type: str,
    content_type: str,
    reader_dataset_type: DatasetType,
) -> bool:
    """Report whether one reader can read data written by a combination.

    Args:
        arrow_type: Arrow type name as spelled in the compatibility mapping.
        writer_dataset_type: Name of the dataset type that wrote the data.
        content_type: Content type of the written data.
        reader_dataset_type: The reader DatasetType to test.

    Returns:
        True when ``reader_dataset_type`` is among the readers returned by
        ``get_compatible_readers`` for the given combination, else False.
    """
    return reader_dataset_type in get_compatible_readers(
        arrow_type, writer_dataset_type, content_type
    )