@loaders.gl/parquet 3.1.3 → 4.0.0-alpha.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (438) hide show
  1. package/dist/bundle.js +2 -2
  2. package/dist/bundle.js.map +1 -0
  3. package/dist/constants.js +6 -18
  4. package/dist/constants.js.map +1 -0
  5. package/dist/dist.min.js +17 -8
  6. package/dist/dist.min.js.map +3 -3
  7. package/dist/index.js +14 -29
  8. package/dist/index.js.map +1 -0
  9. package/dist/lib/convert-schema.js +63 -62
  10. package/dist/lib/convert-schema.js.map +1 -0
  11. package/dist/lib/parse-parquet.js +25 -25
  12. package/dist/lib/parse-parquet.js.map +1 -0
  13. package/dist/lib/read-array-buffer.js +8 -28
  14. package/dist/lib/read-array-buffer.js.map +1 -0
  15. package/dist/parquet-loader.js +19 -24
  16. package/dist/parquet-loader.js.map +1 -0
  17. package/dist/parquet-worker.js +18 -9
  18. package/dist/parquet-worker.js.map +3 -3
  19. package/dist/parquet-writer.js +14 -17
  20. package/dist/parquet-writer.js.map +1 -0
  21. package/dist/{es5/parquetjs → parquetjs}/LICENSE +0 -0
  22. package/dist/parquetjs/codecs/declare.js +2 -2
  23. package/dist/{es5/parquetjs → parquetjs}/codecs/declare.js.map +0 -0
  24. package/dist/parquetjs/codecs/dictionary.js +10 -12
  25. package/dist/parquetjs/codecs/dictionary.js.map +1 -0
  26. package/dist/parquetjs/codecs/index.js +22 -50
  27. package/dist/parquetjs/codecs/index.js.map +1 -0
  28. package/dist/parquetjs/codecs/plain.js +232 -173
  29. package/dist/parquetjs/codecs/plain.js.map +1 -0
  30. package/dist/parquetjs/codecs/rle.js +140 -134
  31. package/dist/parquetjs/codecs/rle.js.map +1 -0
  32. package/dist/parquetjs/compression.js +48 -154
  33. package/dist/parquetjs/compression.js.map +1 -0
  34. package/dist/parquetjs/encoder/writer.js +383 -440
  35. package/dist/parquetjs/encoder/writer.js.map +1 -0
  36. package/dist/parquetjs/file.js +66 -85
  37. package/dist/parquetjs/file.js.map +1 -0
  38. package/dist/{es5/parquetjs → parquetjs}/modules.d.ts +0 -0
  39. package/dist/parquetjs/parquet-thrift/BoundaryOrder.js +7 -14
  40. package/dist/parquetjs/parquet-thrift/BoundaryOrder.js.map +1 -0
  41. package/dist/parquetjs/parquet-thrift/BsonType.js +37 -56
  42. package/dist/parquetjs/parquet-thrift/BsonType.js.map +1 -0
  43. package/dist/parquetjs/parquet-thrift/ColumnChunk.js +215 -205
  44. package/dist/parquetjs/parquet-thrift/ColumnChunk.js.map +1 -0
  45. package/dist/parquetjs/parquet-thrift/ColumnIndex.js +212 -207
  46. package/dist/parquetjs/parquet-thrift/ColumnIndex.js.map +1 -0
  47. package/dist/parquetjs/parquet-thrift/ColumnMetaData.js +422 -391
  48. package/dist/parquetjs/parquet-thrift/ColumnMetaData.js.map +1 -0
  49. package/dist/parquetjs/parquet-thrift/ColumnOrder.js +90 -99
  50. package/dist/parquetjs/parquet-thrift/ColumnOrder.js.map +1 -0
  51. package/dist/parquetjs/parquet-thrift/CompressionCodec.js +12 -19
  52. package/dist/parquetjs/parquet-thrift/CompressionCodec.js.map +1 -0
  53. package/dist/parquetjs/parquet-thrift/ConvertedType.js +26 -33
  54. package/dist/parquetjs/parquet-thrift/ConvertedType.js.map +1 -0
  55. package/dist/parquetjs/parquet-thrift/DataPageHeader.js +162 -162
  56. package/dist/parquetjs/parquet-thrift/DataPageHeader.js.map +1 -0
  57. package/dist/parquetjs/parquet-thrift/DataPageHeaderV2.js +234 -224
  58. package/dist/parquetjs/parquet-thrift/DataPageHeaderV2.js.map +1 -0
  59. package/dist/parquetjs/parquet-thrift/DateType.js +37 -56
  60. package/dist/parquetjs/parquet-thrift/DateType.js.map +1 -0
  61. package/dist/parquetjs/parquet-thrift/DecimalType.js +91 -101
  62. package/dist/parquetjs/parquet-thrift/DecimalType.js.map +1 -0
  63. package/dist/parquetjs/parquet-thrift/DictionaryPageHeader.js +113 -118
  64. package/dist/parquetjs/parquet-thrift/DictionaryPageHeader.js.map +1 -0
  65. package/dist/parquetjs/parquet-thrift/Encoding.js +12 -19
  66. package/dist/parquetjs/parquet-thrift/Encoding.js.map +1 -0
  67. package/dist/parquetjs/parquet-thrift/EnumType.js +37 -56
  68. package/dist/parquetjs/parquet-thrift/EnumType.js.map +1 -0
  69. package/dist/parquetjs/parquet-thrift/FieldRepetitionType.js +7 -14
  70. package/dist/parquetjs/parquet-thrift/FieldRepetitionType.js.map +1 -0
  71. package/dist/parquetjs/parquet-thrift/FileMetaData.js +264 -250
  72. package/dist/parquetjs/parquet-thrift/FileMetaData.js.map +1 -0
  73. package/dist/parquetjs/parquet-thrift/IndexPageHeader.js +37 -56
  74. package/dist/parquetjs/parquet-thrift/IndexPageHeader.js.map +1 -0
  75. package/dist/parquetjs/parquet-thrift/IntType.js +91 -101
  76. package/dist/parquetjs/parquet-thrift/IntType.js.map +1 -0
  77. package/dist/parquetjs/parquet-thrift/JsonType.js +37 -56
  78. package/dist/parquetjs/parquet-thrift/JsonType.js.map +1 -0
  79. package/dist/parquetjs/parquet-thrift/KeyValue.js +89 -98
  80. package/dist/parquetjs/parquet-thrift/KeyValue.js.map +1 -0
  81. package/dist/parquetjs/parquet-thrift/ListType.js +37 -56
  82. package/dist/parquetjs/parquet-thrift/ListType.js.map +1 -0
  83. package/dist/parquetjs/parquet-thrift/LogicalType.js +450 -363
  84. package/dist/parquetjs/parquet-thrift/LogicalType.js.map +1 -0
  85. package/dist/parquetjs/parquet-thrift/MapType.js +37 -56
  86. package/dist/parquetjs/parquet-thrift/MapType.js.map +1 -0
  87. package/dist/parquetjs/parquet-thrift/MicroSeconds.js +37 -56
  88. package/dist/parquetjs/parquet-thrift/MicroSeconds.js.map +1 -0
  89. package/dist/parquetjs/parquet-thrift/MilliSeconds.js +37 -56
  90. package/dist/parquetjs/parquet-thrift/MilliSeconds.js.map +1 -0
  91. package/dist/parquetjs/parquet-thrift/NullType.js +37 -56
  92. package/dist/parquetjs/parquet-thrift/NullType.js.map +1 -0
  93. package/dist/parquetjs/parquet-thrift/OffsetIndex.js +80 -92
  94. package/dist/parquetjs/parquet-thrift/OffsetIndex.js.map +1 -0
  95. package/dist/parquetjs/parquet-thrift/PageEncodingStats.js +115 -123
  96. package/dist/parquetjs/parquet-thrift/PageEncodingStats.js.map +1 -0
  97. package/dist/parquetjs/parquet-thrift/PageHeader.js +231 -214
  98. package/dist/parquetjs/parquet-thrift/PageHeader.js.map +1 -0
  99. package/dist/parquetjs/parquet-thrift/PageLocation.js +124 -137
  100. package/dist/parquetjs/parquet-thrift/PageLocation.js.map +1 -0
  101. package/dist/parquetjs/parquet-thrift/PageType.js +8 -15
  102. package/dist/parquetjs/parquet-thrift/PageType.js.map +1 -0
  103. package/dist/parquetjs/parquet-thrift/RowGroup.js +172 -176
  104. package/dist/parquetjs/parquet-thrift/RowGroup.js.map +1 -0
  105. package/dist/parquetjs/parquet-thrift/SchemaElement.js +268 -237
  106. package/dist/parquetjs/parquet-thrift/SchemaElement.js.map +1 -0
  107. package/dist/parquetjs/parquet-thrift/SortingColumn.js +115 -123
  108. package/dist/parquetjs/parquet-thrift/SortingColumn.js.map +1 -0
  109. package/dist/parquetjs/parquet-thrift/Statistics.js +179 -172
  110. package/dist/parquetjs/parquet-thrift/Statistics.js.map +1 -0
  111. package/dist/parquetjs/parquet-thrift/StringType.js +37 -56
  112. package/dist/parquetjs/parquet-thrift/StringType.js.map +1 -0
  113. package/dist/parquetjs/parquet-thrift/TimeType.js +92 -102
  114. package/dist/parquetjs/parquet-thrift/TimeType.js.map +1 -0
  115. package/dist/parquetjs/parquet-thrift/TimeUnit.js +120 -121
  116. package/dist/parquetjs/parquet-thrift/TimeUnit.js.map +1 -0
  117. package/dist/parquetjs/parquet-thrift/TimestampType.js +92 -102
  118. package/dist/parquetjs/parquet-thrift/TimestampType.js.map +1 -0
  119. package/dist/parquetjs/parquet-thrift/Type.js +12 -19
  120. package/dist/parquetjs/parquet-thrift/Type.js.map +1 -0
  121. package/dist/parquetjs/parquet-thrift/TypeDefinedOrder.js +37 -56
  122. package/dist/parquetjs/parquet-thrift/TypeDefinedOrder.js.map +1 -0
  123. package/dist/parquetjs/parquet-thrift/UUIDType.js +37 -56
  124. package/dist/parquetjs/parquet-thrift/UUIDType.js.map +1 -0
  125. package/dist/parquetjs/parquet-thrift/index.js +44 -61
  126. package/dist/parquetjs/parquet-thrift/index.js.map +1 -0
  127. package/dist/parquetjs/parser/decoders.js +283 -301
  128. package/dist/{es5/parquetjs → parquetjs}/parser/decoders.js.map +1 -1
  129. package/dist/parquetjs/parser/parquet-cursor.js +85 -69
  130. package/dist/parquetjs/parser/parquet-cursor.js.map +1 -0
  131. package/dist/parquetjs/parser/parquet-envelope-reader.js +146 -127
  132. package/dist/parquetjs/parser/parquet-envelope-reader.js.map +1 -0
  133. package/dist/parquetjs/parser/parquet-reader.js +113 -127
  134. package/dist/parquetjs/parser/parquet-reader.js.map +1 -0
  135. package/dist/parquetjs/schema/declare.js +12 -9
  136. package/dist/parquetjs/schema/declare.js.map +1 -0
  137. package/dist/parquetjs/schema/schema.js +162 -148
  138. package/dist/{es5/parquetjs → parquetjs}/schema/schema.js.map +1 -1
  139. package/dist/parquetjs/schema/shred.js +151 -214
  140. package/dist/parquetjs/schema/shred.js.map +1 -0
  141. package/dist/parquetjs/schema/types.js +415 -357
  142. package/dist/parquetjs/schema/types.js.map +1 -0
  143. package/dist/parquetjs/utils/buffer-utils.js +10 -20
  144. package/dist/parquetjs/utils/buffer-utils.js.map +1 -0
  145. package/dist/parquetjs/utils/file-utils.js +28 -40
  146. package/dist/parquetjs/utils/file-utils.js.map +1 -0
  147. package/dist/parquetjs/utils/read-utils.js +95 -99
  148. package/dist/parquetjs/utils/read-utils.js.map +1 -0
  149. package/dist/workers/parquet-worker.js +4 -5
  150. package/dist/workers/parquet-worker.js.map +1 -0
  151. package/package.json +8 -8
  152. package/dist/es5/bundle.js +0 -7
  153. package/dist/es5/bundle.js.map +0 -1
  154. package/dist/es5/constants.js +0 -17
  155. package/dist/es5/constants.js.map +0 -1
  156. package/dist/es5/index.js +0 -82
  157. package/dist/es5/index.js.map +0 -1
  158. package/dist/es5/lib/convert-schema.js +0 -82
  159. package/dist/es5/lib/convert-schema.js.map +0 -1
  160. package/dist/es5/lib/parse-parquet.js +0 -173
  161. package/dist/es5/lib/parse-parquet.js.map +0 -1
  162. package/dist/es5/lib/read-array-buffer.js +0 -53
  163. package/dist/es5/lib/read-array-buffer.js.map +0 -1
  164. package/dist/es5/parquet-loader.js +0 -30
  165. package/dist/es5/parquet-loader.js.map +0 -1
  166. package/dist/es5/parquet-writer.js +0 -25
  167. package/dist/es5/parquet-writer.js.map +0 -1
  168. package/dist/es5/parquetjs/codecs/declare.js +0 -2
  169. package/dist/es5/parquetjs/codecs/dictionary.js +0 -30
  170. package/dist/es5/parquetjs/codecs/dictionary.js.map +0 -1
  171. package/dist/es5/parquetjs/codecs/index.js +0 -56
  172. package/dist/es5/parquetjs/codecs/index.js.map +0 -1
  173. package/dist/es5/parquetjs/codecs/plain.js +0 -287
  174. package/dist/es5/parquetjs/codecs/plain.js.map +0 -1
  175. package/dist/es5/parquetjs/codecs/rle.js +0 -174
  176. package/dist/es5/parquetjs/codecs/rle.js.map +0 -1
  177. package/dist/es5/parquetjs/compression.js +0 -167
  178. package/dist/es5/parquetjs/compression.js.map +0 -1
  179. package/dist/es5/parquetjs/encoder/writer.js +0 -875
  180. package/dist/es5/parquetjs/encoder/writer.js.map +0 -1
  181. package/dist/es5/parquetjs/file.js +0 -103
  182. package/dist/es5/parquetjs/file.js.map +0 -1
  183. package/dist/es5/parquetjs/parquet-thrift/BoundaryOrder.js +0 -15
  184. package/dist/es5/parquetjs/parquet-thrift/BoundaryOrder.js.map +0 -1
  185. package/dist/es5/parquetjs/parquet-thrift/BsonType.js +0 -67
  186. package/dist/es5/parquetjs/parquet-thrift/BsonType.js.map +0 -1
  187. package/dist/es5/parquetjs/parquet-thrift/ColumnChunk.js +0 -241
  188. package/dist/es5/parquetjs/parquet-thrift/ColumnChunk.js.map +0 -1
  189. package/dist/es5/parquetjs/parquet-thrift/ColumnIndex.js +0 -245
  190. package/dist/es5/parquetjs/parquet-thrift/ColumnIndex.js.map +0 -1
  191. package/dist/es5/parquetjs/parquet-thrift/ColumnMetaData.js +0 -449
  192. package/dist/es5/parquetjs/parquet-thrift/ColumnMetaData.js.map +0 -1
  193. package/dist/es5/parquetjs/parquet-thrift/ColumnOrder.js +0 -124
  194. package/dist/es5/parquetjs/parquet-thrift/ColumnOrder.js.map +0 -1
  195. package/dist/es5/parquetjs/parquet-thrift/CompressionCodec.js +0 -20
  196. package/dist/es5/parquetjs/parquet-thrift/CompressionCodec.js.map +0 -1
  197. package/dist/es5/parquetjs/parquet-thrift/ConvertedType.js +0 -34
  198. package/dist/es5/parquetjs/parquet-thrift/ConvertedType.js.map +0 -1
  199. package/dist/es5/parquetjs/parquet-thrift/DataPageHeader.js +0 -191
  200. package/dist/es5/parquetjs/parquet-thrift/DataPageHeader.js.map +0 -1
  201. package/dist/es5/parquetjs/parquet-thrift/DataPageHeaderV2.js +0 -258
  202. package/dist/es5/parquetjs/parquet-thrift/DataPageHeaderV2.js.map +0 -1
  203. package/dist/es5/parquetjs/parquet-thrift/DateType.js +0 -67
  204. package/dist/es5/parquetjs/parquet-thrift/DateType.js.map +0 -1
  205. package/dist/es5/parquetjs/parquet-thrift/DecimalType.js +0 -122
  206. package/dist/es5/parquetjs/parquet-thrift/DecimalType.js.map +0 -1
  207. package/dist/es5/parquetjs/parquet-thrift/DictionaryPageHeader.js +0 -143
  208. package/dist/es5/parquetjs/parquet-thrift/DictionaryPageHeader.js.map +0 -1
  209. package/dist/es5/parquetjs/parquet-thrift/Encoding.js +0 -20
  210. package/dist/es5/parquetjs/parquet-thrift/Encoding.js.map +0 -1
  211. package/dist/es5/parquetjs/parquet-thrift/EnumType.js +0 -67
  212. package/dist/es5/parquetjs/parquet-thrift/EnumType.js.map +0 -1
  213. package/dist/es5/parquetjs/parquet-thrift/FieldRepetitionType.js +0 -15
  214. package/dist/es5/parquetjs/parquet-thrift/FieldRepetitionType.js.map +0 -1
  215. package/dist/es5/parquetjs/parquet-thrift/FileMetaData.js +0 -298
  216. package/dist/es5/parquetjs/parquet-thrift/FileMetaData.js.map +0 -1
  217. package/dist/es5/parquetjs/parquet-thrift/IndexPageHeader.js +0 -67
  218. package/dist/es5/parquetjs/parquet-thrift/IndexPageHeader.js.map +0 -1
  219. package/dist/es5/parquetjs/parquet-thrift/IntType.js +0 -122
  220. package/dist/es5/parquetjs/parquet-thrift/IntType.js.map +0 -1
  221. package/dist/es5/parquetjs/parquet-thrift/JsonType.js +0 -67
  222. package/dist/es5/parquetjs/parquet-thrift/JsonType.js.map +0 -1
  223. package/dist/es5/parquetjs/parquet-thrift/KeyValue.js +0 -120
  224. package/dist/es5/parquetjs/parquet-thrift/KeyValue.js.map +0 -1
  225. package/dist/es5/parquetjs/parquet-thrift/ListType.js +0 -67
  226. package/dist/es5/parquetjs/parquet-thrift/ListType.js.map +0 -1
  227. package/dist/es5/parquetjs/parquet-thrift/LogicalType.js +0 -508
  228. package/dist/es5/parquetjs/parquet-thrift/LogicalType.js.map +0 -1
  229. package/dist/es5/parquetjs/parquet-thrift/MapType.js +0 -67
  230. package/dist/es5/parquetjs/parquet-thrift/MapType.js.map +0 -1
  231. package/dist/es5/parquetjs/parquet-thrift/MicroSeconds.js +0 -67
  232. package/dist/es5/parquetjs/parquet-thrift/MicroSeconds.js.map +0 -1
  233. package/dist/es5/parquetjs/parquet-thrift/MilliSeconds.js +0 -67
  234. package/dist/es5/parquetjs/parquet-thrift/MilliSeconds.js.map +0 -1
  235. package/dist/es5/parquetjs/parquet-thrift/NullType.js +0 -67
  236. package/dist/es5/parquetjs/parquet-thrift/NullType.js.map +0 -1
  237. package/dist/es5/parquetjs/parquet-thrift/OffsetIndex.js +0 -114
  238. package/dist/es5/parquetjs/parquet-thrift/OffsetIndex.js.map +0 -1
  239. package/dist/es5/parquetjs/parquet-thrift/PageEncodingStats.js +0 -145
  240. package/dist/es5/parquetjs/parquet-thrift/PageEncodingStats.js.map +0 -1
  241. package/dist/es5/parquetjs/parquet-thrift/PageHeader.js +0 -258
  242. package/dist/es5/parquetjs/parquet-thrift/PageHeader.js.map +0 -1
  243. package/dist/es5/parquetjs/parquet-thrift/PageLocation.js +0 -155
  244. package/dist/es5/parquetjs/parquet-thrift/PageLocation.js.map +0 -1
  245. package/dist/es5/parquetjs/parquet-thrift/PageType.js +0 -16
  246. package/dist/es5/parquetjs/parquet-thrift/PageType.js.map +0 -1
  247. package/dist/es5/parquetjs/parquet-thrift/RowGroup.js +0 -206
  248. package/dist/es5/parquetjs/parquet-thrift/RowGroup.js.map +0 -1
  249. package/dist/es5/parquetjs/parquet-thrift/SchemaElement.js +0 -290
  250. package/dist/es5/parquetjs/parquet-thrift/SchemaElement.js.map +0 -1
  251. package/dist/es5/parquetjs/parquet-thrift/SortingColumn.js +0 -145
  252. package/dist/es5/parquetjs/parquet-thrift/SortingColumn.js.map +0 -1
  253. package/dist/es5/parquetjs/parquet-thrift/Statistics.js +0 -207
  254. package/dist/es5/parquetjs/parquet-thrift/Statistics.js.map +0 -1
  255. package/dist/es5/parquetjs/parquet-thrift/StringType.js +0 -67
  256. package/dist/es5/parquetjs/parquet-thrift/StringType.js.map +0 -1
  257. package/dist/es5/parquetjs/parquet-thrift/TimeType.js +0 -124
  258. package/dist/es5/parquetjs/parquet-thrift/TimeType.js.map +0 -1
  259. package/dist/es5/parquetjs/parquet-thrift/TimeUnit.js +0 -156
  260. package/dist/es5/parquetjs/parquet-thrift/TimeUnit.js.map +0 -1
  261. package/dist/es5/parquetjs/parquet-thrift/TimestampType.js +0 -124
  262. package/dist/es5/parquetjs/parquet-thrift/TimestampType.js.map +0 -1
  263. package/dist/es5/parquetjs/parquet-thrift/Type.js +0 -20
  264. package/dist/es5/parquetjs/parquet-thrift/Type.js.map +0 -1
  265. package/dist/es5/parquetjs/parquet-thrift/TypeDefinedOrder.js +0 -67
  266. package/dist/es5/parquetjs/parquet-thrift/TypeDefinedOrder.js.map +0 -1
  267. package/dist/es5/parquetjs/parquet-thrift/UUIDType.js +0 -67
  268. package/dist/es5/parquetjs/parquet-thrift/UUIDType.js.map +0 -1
  269. package/dist/es5/parquetjs/parquet-thrift/index.js +0 -565
  270. package/dist/es5/parquetjs/parquet-thrift/index.js.map +0 -1
  271. package/dist/es5/parquetjs/parser/decoders.js +0 -489
  272. package/dist/es5/parquetjs/parser/parquet-cursor.js +0 -215
  273. package/dist/es5/parquetjs/parser/parquet-cursor.js.map +0 -1
  274. package/dist/es5/parquetjs/parser/parquet-envelope-reader.js +0 -413
  275. package/dist/es5/parquetjs/parser/parquet-envelope-reader.js.map +0 -1
  276. package/dist/es5/parquetjs/parser/parquet-reader.js +0 -364
  277. package/dist/es5/parquetjs/parser/parquet-reader.js.map +0 -1
  278. package/dist/es5/parquetjs/schema/declare.js +0 -25
  279. package/dist/es5/parquetjs/schema/declare.js.map +0 -1
  280. package/dist/es5/parquetjs/schema/schema.js +0 -203
  281. package/dist/es5/parquetjs/schema/shred.js +0 -223
  282. package/dist/es5/parquetjs/schema/shred.js.map +0 -1
  283. package/dist/es5/parquetjs/schema/types.js +0 -492
  284. package/dist/es5/parquetjs/schema/types.js.map +0 -1
  285. package/dist/es5/parquetjs/utils/buffer-utils.js +0 -21
  286. package/dist/es5/parquetjs/utils/buffer-utils.js.map +0 -1
  287. package/dist/es5/parquetjs/utils/file-utils.js +0 -55
  288. package/dist/es5/parquetjs/utils/file-utils.js.map +0 -1
  289. package/dist/es5/parquetjs/utils/read-utils.js +0 -159
  290. package/dist/es5/parquetjs/utils/read-utils.js.map +0 -1
  291. package/dist/es5/workers/parquet-worker.js +0 -8
  292. package/dist/es5/workers/parquet-worker.js.map +0 -1
  293. package/dist/esm/bundle.js +0 -5
  294. package/dist/esm/bundle.js.map +0 -1
  295. package/dist/esm/constants.js +0 -6
  296. package/dist/esm/constants.js.map +0 -1
  297. package/dist/esm/index.js +0 -15
  298. package/dist/esm/index.js.map +0 -1
  299. package/dist/esm/lib/convert-schema.js +0 -71
  300. package/dist/esm/lib/convert-schema.js.map +0 -1
  301. package/dist/esm/lib/parse-parquet.js +0 -28
  302. package/dist/esm/lib/parse-parquet.js.map +0 -1
  303. package/dist/esm/lib/read-array-buffer.js +0 -9
  304. package/dist/esm/lib/read-array-buffer.js.map +0 -1
  305. package/dist/esm/parquet-loader.js +0 -22
  306. package/dist/esm/parquet-loader.js.map +0 -1
  307. package/dist/esm/parquet-writer.js +0 -18
  308. package/dist/esm/parquet-writer.js.map +0 -1
  309. package/dist/esm/parquetjs/LICENSE +0 -20
  310. package/dist/esm/parquetjs/codecs/declare.js +0 -2
  311. package/dist/esm/parquetjs/codecs/declare.js.map +0 -1
  312. package/dist/esm/parquetjs/codecs/dictionary.js +0 -12
  313. package/dist/esm/parquetjs/codecs/dictionary.js.map +0 -1
  314. package/dist/esm/parquetjs/codecs/index.js +0 -23
  315. package/dist/esm/parquetjs/codecs/index.js.map +0 -1
  316. package/dist/esm/parquetjs/codecs/plain.js +0 -270
  317. package/dist/esm/parquetjs/codecs/plain.js.map +0 -1
  318. package/dist/esm/parquetjs/codecs/rle.js +0 -151
  319. package/dist/esm/parquetjs/codecs/rle.js.map +0 -1
  320. package/dist/esm/parquetjs/compression.js +0 -62
  321. package/dist/esm/parquetjs/compression.js.map +0 -1
  322. package/dist/esm/parquetjs/encoder/writer.js +0 -421
  323. package/dist/esm/parquetjs/encoder/writer.js.map +0 -1
  324. package/dist/esm/parquetjs/file.js +0 -80
  325. package/dist/esm/parquetjs/file.js.map +0 -1
  326. package/dist/esm/parquetjs/modules.d.ts +0 -21
  327. package/dist/esm/parquetjs/parquet-thrift/BoundaryOrder.js +0 -8
  328. package/dist/esm/parquetjs/parquet-thrift/BoundaryOrder.js.map +0 -1
  329. package/dist/esm/parquetjs/parquet-thrift/BsonType.js +0 -39
  330. package/dist/esm/parquetjs/parquet-thrift/BsonType.js.map +0 -1
  331. package/dist/esm/parquetjs/parquet-thrift/ColumnChunk.js +0 -217
  332. package/dist/esm/parquetjs/parquet-thrift/ColumnChunk.js.map +0 -1
  333. package/dist/esm/parquetjs/parquet-thrift/ColumnIndex.js +0 -218
  334. package/dist/esm/parquetjs/parquet-thrift/ColumnIndex.js.map +0 -1
  335. package/dist/esm/parquetjs/parquet-thrift/ColumnMetaData.js +0 -429
  336. package/dist/esm/parquetjs/parquet-thrift/ColumnMetaData.js.map +0 -1
  337. package/dist/esm/parquetjs/parquet-thrift/ColumnOrder.js +0 -95
  338. package/dist/esm/parquetjs/parquet-thrift/ColumnOrder.js.map +0 -1
  339. package/dist/esm/parquetjs/parquet-thrift/CompressionCodec.js +0 -13
  340. package/dist/esm/parquetjs/parquet-thrift/CompressionCodec.js.map +0 -1
  341. package/dist/esm/parquetjs/parquet-thrift/ConvertedType.js +0 -27
  342. package/dist/esm/parquetjs/parquet-thrift/ConvertedType.js.map +0 -1
  343. package/dist/esm/parquetjs/parquet-thrift/DataPageHeader.js +0 -166
  344. package/dist/esm/parquetjs/parquet-thrift/DataPageHeader.js.map +0 -1
  345. package/dist/esm/parquetjs/parquet-thrift/DataPageHeaderV2.js +0 -236
  346. package/dist/esm/parquetjs/parquet-thrift/DataPageHeaderV2.js.map +0 -1
  347. package/dist/esm/parquetjs/parquet-thrift/DateType.js +0 -39
  348. package/dist/esm/parquetjs/parquet-thrift/DateType.js.map +0 -1
  349. package/dist/esm/parquetjs/parquet-thrift/DecimalType.js +0 -95
  350. package/dist/esm/parquetjs/parquet-thrift/DecimalType.js.map +0 -1
  351. package/dist/esm/parquetjs/parquet-thrift/DictionaryPageHeader.js +0 -117
  352. package/dist/esm/parquetjs/parquet-thrift/DictionaryPageHeader.js.map +0 -1
  353. package/dist/esm/parquetjs/parquet-thrift/Encoding.js +0 -13
  354. package/dist/esm/parquetjs/parquet-thrift/Encoding.js.map +0 -1
  355. package/dist/esm/parquetjs/parquet-thrift/EnumType.js +0 -39
  356. package/dist/esm/parquetjs/parquet-thrift/EnumType.js.map +0 -1
  357. package/dist/esm/parquetjs/parquet-thrift/FieldRepetitionType.js +0 -8
  358. package/dist/esm/parquetjs/parquet-thrift/FieldRepetitionType.js.map +0 -1
  359. package/dist/esm/parquetjs/parquet-thrift/FileMetaData.js +0 -270
  360. package/dist/esm/parquetjs/parquet-thrift/FileMetaData.js.map +0 -1
  361. package/dist/esm/parquetjs/parquet-thrift/IndexPageHeader.js +0 -39
  362. package/dist/esm/parquetjs/parquet-thrift/IndexPageHeader.js.map +0 -1
  363. package/dist/esm/parquetjs/parquet-thrift/IntType.js +0 -95
  364. package/dist/esm/parquetjs/parquet-thrift/IntType.js.map +0 -1
  365. package/dist/esm/parquetjs/parquet-thrift/JsonType.js +0 -39
  366. package/dist/esm/parquetjs/parquet-thrift/JsonType.js.map +0 -1
  367. package/dist/esm/parquetjs/parquet-thrift/KeyValue.js +0 -93
  368. package/dist/esm/parquetjs/parquet-thrift/KeyValue.js.map +0 -1
  369. package/dist/esm/parquetjs/parquet-thrift/ListType.js +0 -39
  370. package/dist/esm/parquetjs/parquet-thrift/ListType.js.map +0 -1
  371. package/dist/esm/parquetjs/parquet-thrift/LogicalType.js +0 -467
  372. package/dist/esm/parquetjs/parquet-thrift/LogicalType.js.map +0 -1
  373. package/dist/esm/parquetjs/parquet-thrift/MapType.js +0 -39
  374. package/dist/esm/parquetjs/parquet-thrift/MapType.js.map +0 -1
  375. package/dist/esm/parquetjs/parquet-thrift/MicroSeconds.js +0 -39
  376. package/dist/esm/parquetjs/parquet-thrift/MicroSeconds.js.map +0 -1
  377. package/dist/esm/parquetjs/parquet-thrift/MilliSeconds.js +0 -39
  378. package/dist/esm/parquetjs/parquet-thrift/MilliSeconds.js.map +0 -1
  379. package/dist/esm/parquetjs/parquet-thrift/NullType.js +0 -39
  380. package/dist/esm/parquetjs/parquet-thrift/NullType.js.map +0 -1
  381. package/dist/esm/parquetjs/parquet-thrift/OffsetIndex.js +0 -85
  382. package/dist/esm/parquetjs/parquet-thrift/OffsetIndex.js.map +0 -1
  383. package/dist/esm/parquetjs/parquet-thrift/PageEncodingStats.js +0 -119
  384. package/dist/esm/parquetjs/parquet-thrift/PageEncodingStats.js.map +0 -1
  385. package/dist/esm/parquetjs/parquet-thrift/PageHeader.js +0 -233
  386. package/dist/esm/parquetjs/parquet-thrift/PageHeader.js.map +0 -1
  387. package/dist/esm/parquetjs/parquet-thrift/PageLocation.js +0 -128
  388. package/dist/esm/parquetjs/parquet-thrift/PageLocation.js.map +0 -1
  389. package/dist/esm/parquetjs/parquet-thrift/PageType.js +0 -9
  390. package/dist/esm/parquetjs/parquet-thrift/PageType.js.map +0 -1
  391. package/dist/esm/parquetjs/parquet-thrift/RowGroup.js +0 -178
  392. package/dist/esm/parquetjs/parquet-thrift/RowGroup.js.map +0 -1
  393. package/dist/esm/parquetjs/parquet-thrift/SchemaElement.js +0 -270
  394. package/dist/esm/parquetjs/parquet-thrift/SchemaElement.js.map +0 -1
  395. package/dist/esm/parquetjs/parquet-thrift/SortingColumn.js +0 -119
  396. package/dist/esm/parquetjs/parquet-thrift/SortingColumn.js.map +0 -1
  397. package/dist/esm/parquetjs/parquet-thrift/Statistics.js +0 -183
  398. package/dist/esm/parquetjs/parquet-thrift/Statistics.js.map +0 -1
  399. package/dist/esm/parquetjs/parquet-thrift/StringType.js +0 -39
  400. package/dist/esm/parquetjs/parquet-thrift/StringType.js.map +0 -1
  401. package/dist/esm/parquetjs/parquet-thrift/TimeType.js +0 -96
  402. package/dist/esm/parquetjs/parquet-thrift/TimeType.js.map +0 -1
  403. package/dist/esm/parquetjs/parquet-thrift/TimeUnit.js +0 -126
  404. package/dist/esm/parquetjs/parquet-thrift/TimeUnit.js.map +0 -1
  405. package/dist/esm/parquetjs/parquet-thrift/TimestampType.js +0 -96
  406. package/dist/esm/parquetjs/parquet-thrift/TimestampType.js.map +0 -1
  407. package/dist/esm/parquetjs/parquet-thrift/Type.js +0 -13
  408. package/dist/esm/parquetjs/parquet-thrift/Type.js.map +0 -1
  409. package/dist/esm/parquetjs/parquet-thrift/TypeDefinedOrder.js +0 -39
  410. package/dist/esm/parquetjs/parquet-thrift/TypeDefinedOrder.js.map +0 -1
  411. package/dist/esm/parquetjs/parquet-thrift/UUIDType.js +0 -39
  412. package/dist/esm/parquetjs/parquet-thrift/UUIDType.js.map +0 -1
  413. package/dist/esm/parquetjs/parquet-thrift/index.js +0 -44
  414. package/dist/esm/parquetjs/parquet-thrift/index.js.map +0 -1
  415. package/dist/esm/parquetjs/parser/decoders.js +0 -300
  416. package/dist/esm/parquetjs/parser/decoders.js.map +0 -1
  417. package/dist/esm/parquetjs/parser/parquet-cursor.js +0 -90
  418. package/dist/esm/parquetjs/parser/parquet-cursor.js.map +0 -1
  419. package/dist/esm/parquetjs/parser/parquet-envelope-reader.js +0 -155
  420. package/dist/esm/parquetjs/parser/parquet-envelope-reader.js.map +0 -1
  421. package/dist/esm/parquetjs/parser/parquet-reader.js +0 -120
  422. package/dist/esm/parquetjs/parser/parquet-reader.js.map +0 -1
  423. package/dist/esm/parquetjs/schema/declare.js +0 -13
  424. package/dist/esm/parquetjs/schema/declare.js.map +0 -1
  425. package/dist/esm/parquetjs/schema/schema.js +0 -176
  426. package/dist/esm/parquetjs/schema/schema.js.map +0 -1
  427. package/dist/esm/parquetjs/schema/shred.js +0 -162
  428. package/dist/esm/parquetjs/schema/shred.js.map +0 -1
  429. package/dist/esm/parquetjs/schema/types.js +0 -476
  430. package/dist/esm/parquetjs/schema/types.js.map +0 -1
  431. package/dist/esm/parquetjs/utils/buffer-utils.js +0 -12
  432. package/dist/esm/parquetjs/utils/buffer-utils.js.map +0 -1
  433. package/dist/esm/parquetjs/utils/file-utils.js +0 -34
  434. package/dist/esm/parquetjs/utils/file-utils.js.map +0 -1
  435. package/dist/esm/parquetjs/utils/read-utils.js +0 -105
  436. package/dist/esm/parquetjs/utils/read-utils.js.map +0 -1
  437. package/dist/esm/workers/parquet-worker.js +0 -4
  438. package/dist/esm/workers/parquet-worker.js.map +0 -1
@@ -1,875 +0,0 @@
1
- "use strict";
2
-
3
- var _interopRequireDefault = require("@babel/runtime/helpers/interopRequireDefault");
4
-
5
- var _typeof = require("@babel/runtime/helpers/typeof");
6
-
7
- Object.defineProperty(exports, "__esModule", {
8
- value: true
9
- });
10
- exports.ParquetTransformer = exports.ParquetEnvelopeWriter = exports.ParquetWriter = void 0;
11
-
12
- var _regenerator = _interopRequireDefault(require("@babel/runtime/regenerator"));
13
-
14
- var _assertThisInitialized2 = _interopRequireDefault(require("@babel/runtime/helpers/assertThisInitialized"));
15
-
16
- var _inherits2 = _interopRequireDefault(require("@babel/runtime/helpers/inherits"));
17
-
18
- var _possibleConstructorReturn2 = _interopRequireDefault(require("@babel/runtime/helpers/possibleConstructorReturn"));
19
-
20
- var _getPrototypeOf2 = _interopRequireDefault(require("@babel/runtime/helpers/getPrototypeOf"));
21
-
22
- var _asyncToGenerator2 = _interopRequireDefault(require("@babel/runtime/helpers/asyncToGenerator"));
23
-
24
- var _classCallCheck2 = _interopRequireDefault(require("@babel/runtime/helpers/classCallCheck"));
25
-
26
- var _createClass2 = _interopRequireDefault(require("@babel/runtime/helpers/createClass"));
27
-
28
- var _defineProperty2 = _interopRequireDefault(require("@babel/runtime/helpers/defineProperty"));
29
-
30
- var _stream = require("stream");
31
-
32
- var _codecs = require("../codecs");
33
-
34
- var Compression = _interopRequireWildcard(require("../compression"));
35
-
36
- var Shred = _interopRequireWildcard(require("../schema/shred"));
37
-
38
- var _parquetThrift = require("../parquet-thrift");
39
-
40
- var _fileUtils = require("../utils/file-utils");
41
-
42
- var _readUtils = require("../utils/read-utils");
43
-
44
- var _nodeInt = _interopRequireDefault(require("node-int64"));
45
-
46
- function _getRequireWildcardCache(nodeInterop) { if (typeof WeakMap !== "function") return null; var cacheBabelInterop = new WeakMap(); var cacheNodeInterop = new WeakMap(); return (_getRequireWildcardCache = function _getRequireWildcardCache(nodeInterop) { return nodeInterop ? cacheNodeInterop : cacheBabelInterop; })(nodeInterop); }
47
-
48
- function _interopRequireWildcard(obj, nodeInterop) { if (!nodeInterop && obj && obj.__esModule) { return obj; } if (obj === null || _typeof(obj) !== "object" && typeof obj !== "function") { return { default: obj }; } var cache = _getRequireWildcardCache(nodeInterop); if (cache && cache.has(obj)) { return cache.get(obj); } var newObj = {}; var hasPropertyDescriptor = Object.defineProperty && Object.getOwnPropertyDescriptor; for (var key in obj) { if (key !== "default" && Object.prototype.hasOwnProperty.call(obj, key)) { var desc = hasPropertyDescriptor ? Object.getOwnPropertyDescriptor(obj, key) : null; if (desc && (desc.get || desc.set)) { Object.defineProperty(newObj, key, desc); } else { newObj[key] = obj[key]; } } } newObj.default = obj; if (cache) { cache.set(obj, newObj); } return newObj; }
49
-
50
- function _createForOfIteratorHelper(o, allowArrayLike) { var it = typeof Symbol !== "undefined" && o[Symbol.iterator] || o["@@iterator"]; if (!it) { if (Array.isArray(o) || (it = _unsupportedIterableToArray(o)) || allowArrayLike && o && typeof o.length === "number") { if (it) o = it; var i = 0; var F = function F() {}; return { s: F, n: function n() { if (i >= o.length) return { done: true }; return { done: false, value: o[i++] }; }, e: function e(_e) { throw _e; }, f: F }; } throw new TypeError("Invalid attempt to iterate non-iterable instance.\nIn order to be iterable, non-array objects must have a [Symbol.iterator]() method."); } var normalCompletion = true, didErr = false, err; return { s: function s() { it = it.call(o); }, n: function n() { var step = it.next(); normalCompletion = step.done; return step; }, e: function e(_e2) { didErr = true; err = _e2; }, f: function f() { try { if (!normalCompletion && it.return != null) it.return(); } finally { if (didErr) throw err; } } }; }
51
-
52
- function _unsupportedIterableToArray(o, minLen) { if (!o) return; if (typeof o === "string") return _arrayLikeToArray(o, minLen); var n = Object.prototype.toString.call(o).slice(8, -1); if (n === "Object" && o.constructor) n = o.constructor.name; if (n === "Map" || n === "Set") return Array.from(o); if (n === "Arguments" || /^(?:Ui|I)nt(?:8|16|32)(?:Clamped)?Array$/.test(n)) return _arrayLikeToArray(o, minLen); }
53
-
54
- function _arrayLikeToArray(arr, len) { if (len == null || len > arr.length) len = arr.length; for (var i = 0, arr2 = new Array(len); i < len; i++) { arr2[i] = arr[i]; } return arr2; }
55
-
56
- function _createSuper(Derived) { var hasNativeReflectConstruct = _isNativeReflectConstruct(); return function _createSuperInternal() { var Super = (0, _getPrototypeOf2.default)(Derived), result; if (hasNativeReflectConstruct) { var NewTarget = (0, _getPrototypeOf2.default)(this).constructor; result = Reflect.construct(Super, arguments, NewTarget); } else { result = Super.apply(this, arguments); } return (0, _possibleConstructorReturn2.default)(this, result); }; }
57
-
58
- function _isNativeReflectConstruct() { if (typeof Reflect === "undefined" || !Reflect.construct) return false; if (Reflect.construct.sham) return false; if (typeof Proxy === "function") return true; try { Boolean.prototype.valueOf.call(Reflect.construct(Boolean, [], function () {})); return true; } catch (e) { return false; } }
59
-
60
- var PARQUET_MAGIC = 'PAR1';
61
- var PARQUET_VERSION = 1;
62
- var PARQUET_DEFAULT_PAGE_SIZE = 8192;
63
- var PARQUET_DEFAULT_ROW_GROUP_SIZE = 4096;
64
- var PARQUET_RDLVL_TYPE = 'INT32';
65
- var PARQUET_RDLVL_ENCODING = 'RLE';
66
-
67
- var ParquetWriter = function () {
68
- function ParquetWriter(schema, envelopeWriter, opts) {
69
- (0, _classCallCheck2.default)(this, ParquetWriter);
70
- (0, _defineProperty2.default)(this, "schema", void 0);
71
- (0, _defineProperty2.default)(this, "envelopeWriter", void 0);
72
- (0, _defineProperty2.default)(this, "rowBuffer", void 0);
73
- (0, _defineProperty2.default)(this, "rowGroupSize", void 0);
74
- (0, _defineProperty2.default)(this, "closed", void 0);
75
- (0, _defineProperty2.default)(this, "userMetadata", void 0);
76
- this.schema = schema;
77
- this.envelopeWriter = envelopeWriter;
78
- this.rowBuffer = {};
79
- this.rowGroupSize = opts.rowGroupSize || PARQUET_DEFAULT_ROW_GROUP_SIZE;
80
- this.closed = false;
81
- this.userMetadata = {};
82
- this.writeHeader();
83
- }
84
-
85
- (0, _createClass2.default)(ParquetWriter, [{
86
- key: "writeHeader",
87
- value: function () {
88
- var _writeHeader = (0, _asyncToGenerator2.default)(_regenerator.default.mark(function _callee() {
89
- return _regenerator.default.wrap(function _callee$(_context) {
90
- while (1) {
91
- switch (_context.prev = _context.next) {
92
- case 0:
93
- _context.prev = 0;
94
- _context.next = 3;
95
- return this.envelopeWriter.writeHeader();
96
-
97
- case 3:
98
- _context.next = 10;
99
- break;
100
-
101
- case 5:
102
- _context.prev = 5;
103
- _context.t0 = _context["catch"](0);
104
- _context.next = 9;
105
- return this.envelopeWriter.close();
106
-
107
- case 9:
108
- throw _context.t0;
109
-
110
- case 10:
111
- case "end":
112
- return _context.stop();
113
- }
114
- }
115
- }, _callee, this, [[0, 5]]);
116
- }));
117
-
118
- function writeHeader() {
119
- return _writeHeader.apply(this, arguments);
120
- }
121
-
122
- return writeHeader;
123
- }()
124
- }, {
125
- key: "appendRow",
126
- value: function () {
127
- var _appendRow = (0, _asyncToGenerator2.default)(_regenerator.default.mark(function _callee2(row) {
128
- return _regenerator.default.wrap(function _callee2$(_context2) {
129
- while (1) {
130
- switch (_context2.prev = _context2.next) {
131
- case 0:
132
- if (!this.closed) {
133
- _context2.next = 2;
134
- break;
135
- }
136
-
137
- throw new Error('writer was closed');
138
-
139
- case 2:
140
- Shred.shredRecord(this.schema, row, this.rowBuffer);
141
-
142
- if (this.rowBuffer.rowCount >= this.rowGroupSize) {
143
- this.rowBuffer = {};
144
- }
145
-
146
- case 4:
147
- case "end":
148
- return _context2.stop();
149
- }
150
- }
151
- }, _callee2, this);
152
- }));
153
-
154
- function appendRow(_x) {
155
- return _appendRow.apply(this, arguments);
156
- }
157
-
158
- return appendRow;
159
- }()
160
- }, {
161
- key: "close",
162
- value: function () {
163
- var _close = (0, _asyncToGenerator2.default)(_regenerator.default.mark(function _callee3(callback) {
164
- return _regenerator.default.wrap(function _callee3$(_context3) {
165
- while (1) {
166
- switch (_context3.prev = _context3.next) {
167
- case 0:
168
- if (!this.closed) {
169
- _context3.next = 2;
170
- break;
171
- }
172
-
173
- throw new Error('writer was closed');
174
-
175
- case 2:
176
- this.closed = true;
177
-
178
- if (this.rowBuffer.rowCount > 0 || this.rowBuffer.rowCount >= this.rowGroupSize) {
179
- this.rowBuffer = {};
180
- }
181
-
182
- _context3.next = 6;
183
- return this.envelopeWriter.writeFooter(this.userMetadata);
184
-
185
- case 6:
186
- _context3.next = 8;
187
- return this.envelopeWriter.close();
188
-
189
- case 8:
190
- if (callback) {
191
- callback();
192
- }
193
-
194
- case 9:
195
- case "end":
196
- return _context3.stop();
197
- }
198
- }
199
- }, _callee3, this);
200
- }));
201
-
202
- function close(_x2) {
203
- return _close.apply(this, arguments);
204
- }
205
-
206
- return close;
207
- }()
208
- }, {
209
- key: "setMetadata",
210
- value: function setMetadata(key, value) {
211
- this.userMetadata[String(key)] = String(value);
212
- }
213
- }, {
214
- key: "setRowGroupSize",
215
- value: function setRowGroupSize(cnt) {
216
- this.rowGroupSize = cnt;
217
- }
218
- }, {
219
- key: "setPageSize",
220
- value: function setPageSize(cnt) {
221
- this.envelopeWriter.setPageSize(cnt);
222
- }
223
- }], [{
224
- key: "openFile",
225
- value: function () {
226
- var _openFile = (0, _asyncToGenerator2.default)(_regenerator.default.mark(function _callee4(schema, path, opts) {
227
- var outputStream;
228
- return _regenerator.default.wrap(function _callee4$(_context4) {
229
- while (1) {
230
- switch (_context4.prev = _context4.next) {
231
- case 0:
232
- _context4.next = 2;
233
- return (0, _fileUtils.osopen)(path, opts);
234
-
235
- case 2:
236
- outputStream = _context4.sent;
237
- return _context4.abrupt("return", ParquetWriter.openStream(schema, outputStream, opts));
238
-
239
- case 4:
240
- case "end":
241
- return _context4.stop();
242
- }
243
- }
244
- }, _callee4);
245
- }));
246
-
247
- function openFile(_x3, _x4, _x5) {
248
- return _openFile.apply(this, arguments);
249
- }
250
-
251
- return openFile;
252
- }()
253
- }, {
254
- key: "openStream",
255
- value: function () {
256
- var _openStream = (0, _asyncToGenerator2.default)(_regenerator.default.mark(function _callee5(schema, outputStream, opts) {
257
- var envelopeWriter;
258
- return _regenerator.default.wrap(function _callee5$(_context5) {
259
- while (1) {
260
- switch (_context5.prev = _context5.next) {
261
- case 0:
262
- if (!opts) {
263
- opts = {};
264
- }
265
-
266
- _context5.next = 3;
267
- return ParquetEnvelopeWriter.openStream(schema, outputStream, opts);
268
-
269
- case 3:
270
- envelopeWriter = _context5.sent;
271
- return _context5.abrupt("return", new ParquetWriter(schema, envelopeWriter, opts));
272
-
273
- case 5:
274
- case "end":
275
- return _context5.stop();
276
- }
277
- }
278
- }, _callee5);
279
- }));
280
-
281
- function openStream(_x6, _x7, _x8) {
282
- return _openStream.apply(this, arguments);
283
- }
284
-
285
- return openStream;
286
- }()
287
- }]);
288
- return ParquetWriter;
289
- }();
290
-
291
- exports.ParquetWriter = ParquetWriter;
292
-
293
- var ParquetEnvelopeWriter = function () {
294
- function ParquetEnvelopeWriter(schema, writeFn, closeFn, fileOffset, opts) {
295
- (0, _classCallCheck2.default)(this, ParquetEnvelopeWriter);
296
- (0, _defineProperty2.default)(this, "schema", void 0);
297
- (0, _defineProperty2.default)(this, "write", void 0);
298
- (0, _defineProperty2.default)(this, "close", void 0);
299
- (0, _defineProperty2.default)(this, "offset", void 0);
300
- (0, _defineProperty2.default)(this, "rowCount", void 0);
301
- (0, _defineProperty2.default)(this, "rowGroups", void 0);
302
- (0, _defineProperty2.default)(this, "pageSize", void 0);
303
- (0, _defineProperty2.default)(this, "useDataPageV2", void 0);
304
- this.schema = schema;
305
- this.write = writeFn;
306
- this.close = closeFn;
307
- this.offset = fileOffset;
308
- this.rowCount = 0;
309
- this.rowGroups = [];
310
- this.pageSize = opts.pageSize || PARQUET_DEFAULT_PAGE_SIZE;
311
- this.useDataPageV2 = 'useDataPageV2' in opts ? Boolean(opts.useDataPageV2) : false;
312
- }
313
-
314
- (0, _createClass2.default)(ParquetEnvelopeWriter, [{
315
- key: "writeSection",
316
- value: function writeSection(buf) {
317
- this.offset += buf.length;
318
- return this.write(buf);
319
- }
320
- }, {
321
- key: "writeHeader",
322
- value: function writeHeader() {
323
- return this.writeSection(Buffer.from(PARQUET_MAGIC));
324
- }
325
- }, {
326
- key: "writeRowGroup",
327
- value: function () {
328
- var _writeRowGroup = (0, _asyncToGenerator2.default)(_regenerator.default.mark(function _callee6(records) {
329
- var rgroup;
330
- return _regenerator.default.wrap(function _callee6$(_context6) {
331
- while (1) {
332
- switch (_context6.prev = _context6.next) {
333
- case 0:
334
- _context6.next = 2;
335
- return encodeRowGroup(this.schema, records, {
336
- baseOffset: this.offset,
337
- pageSize: this.pageSize,
338
- useDataPageV2: this.useDataPageV2
339
- });
340
-
341
- case 2:
342
- rgroup = _context6.sent;
343
- this.rowCount += records.rowCount;
344
- this.rowGroups.push(rgroup.metadata);
345
- _context6.next = 7;
346
- return this.writeSection(rgroup.body);
347
-
348
- case 7:
349
- return _context6.abrupt("return", _context6.sent);
350
-
351
- case 8:
352
- case "end":
353
- return _context6.stop();
354
- }
355
- }
356
- }, _callee6, this);
357
- }));
358
-
359
- function writeRowGroup(_x9) {
360
- return _writeRowGroup.apply(this, arguments);
361
- }
362
-
363
- return writeRowGroup;
364
- }()
365
- }, {
366
- key: "writeFooter",
367
- value: function writeFooter(userMetadata) {
368
- if (!userMetadata) {
369
- userMetadata = {};
370
- }
371
-
372
- return this.writeSection(encodeFooter(this.schema, this.rowCount, this.rowGroups, userMetadata));
373
- }
374
- }, {
375
- key: "setPageSize",
376
- value: function setPageSize(cnt) {
377
- this.pageSize = cnt;
378
- }
379
- }], [{
380
- key: "openStream",
381
- value: function () {
382
- var _openStream2 = (0, _asyncToGenerator2.default)(_regenerator.default.mark(function _callee7(schema, outputStream, opts) {
383
- var writeFn, closeFn;
384
- return _regenerator.default.wrap(function _callee7$(_context7) {
385
- while (1) {
386
- switch (_context7.prev = _context7.next) {
387
- case 0:
388
- writeFn = _fileUtils.oswrite.bind(undefined, outputStream);
389
- closeFn = _fileUtils.osclose.bind(undefined, outputStream);
390
- return _context7.abrupt("return", new ParquetEnvelopeWriter(schema, writeFn, closeFn, 0, opts));
391
-
392
- case 3:
393
- case "end":
394
- return _context7.stop();
395
- }
396
- }
397
- }, _callee7);
398
- }));
399
-
400
- function openStream(_x10, _x11, _x12) {
401
- return _openStream2.apply(this, arguments);
402
- }
403
-
404
- return openStream;
405
- }()
406
- }]);
407
- return ParquetEnvelopeWriter;
408
- }();
409
-
410
- exports.ParquetEnvelopeWriter = ParquetEnvelopeWriter;
411
-
412
- var ParquetTransformer = function (_Transform) {
413
- (0, _inherits2.default)(ParquetTransformer, _Transform);
414
-
415
- var _super = _createSuper(ParquetTransformer);
416
-
417
- function ParquetTransformer(schema) {
418
- var _this;
419
-
420
- var opts = arguments.length > 1 && arguments[1] !== undefined ? arguments[1] : {};
421
- (0, _classCallCheck2.default)(this, ParquetTransformer);
422
- _this = _super.call(this, {
423
- objectMode: true
424
- });
425
- (0, _defineProperty2.default)((0, _assertThisInitialized2.default)(_this), "writer", void 0);
426
-
427
- var writeProxy = function (t) {
428
- return function () {
429
- var _ref = (0, _asyncToGenerator2.default)(_regenerator.default.mark(function _callee8(b) {
430
- return _regenerator.default.wrap(function _callee8$(_context8) {
431
- while (1) {
432
- switch (_context8.prev = _context8.next) {
433
- case 0:
434
- t.push(b);
435
-
436
- case 1:
437
- case "end":
438
- return _context8.stop();
439
- }
440
- }
441
- }, _callee8);
442
- }));
443
-
444
- return function (_x13) {
445
- return _ref.apply(this, arguments);
446
- };
447
- }();
448
- }((0, _assertThisInitialized2.default)(_this));
449
-
450
- _this.writer = new ParquetWriter(schema, new ParquetEnvelopeWriter(schema, writeProxy, (0, _asyncToGenerator2.default)(_regenerator.default.mark(function _callee9() {
451
- return _regenerator.default.wrap(function _callee9$(_context9) {
452
- while (1) {
453
- switch (_context9.prev = _context9.next) {
454
- case 0:
455
- case "end":
456
- return _context9.stop();
457
- }
458
- }
459
- }, _callee9);
460
- })), 0, opts), opts);
461
- return _this;
462
- }
463
-
464
- (0, _createClass2.default)(ParquetTransformer, [{
465
- key: "_transform",
466
- value: function _transform(row, encoding, callback) {
467
- if (row) {
468
- return this.writer.appendRow(row).then(callback);
469
- }
470
-
471
- callback();
472
- return Promise.resolve();
473
- }
474
- }, {
475
- key: "_flush",
476
- value: function () {
477
- var _flush2 = (0, _asyncToGenerator2.default)(_regenerator.default.mark(function _callee10(callback) {
478
- return _regenerator.default.wrap(function _callee10$(_context10) {
479
- while (1) {
480
- switch (_context10.prev = _context10.next) {
481
- case 0:
482
- _context10.next = 2;
483
- return this.writer.close(callback);
484
-
485
- case 2:
486
- case "end":
487
- return _context10.stop();
488
- }
489
- }
490
- }, _callee10, this);
491
- }));
492
-
493
- function _flush(_x14) {
494
- return _flush2.apply(this, arguments);
495
- }
496
-
497
- return _flush;
498
- }()
499
- }]);
500
- return ParquetTransformer;
501
- }(_stream.Transform);
502
-
503
- exports.ParquetTransformer = ParquetTransformer;
504
-
505
- function encodeValues(type, encoding, values, opts) {
506
- if (!(encoding in _codecs.PARQUET_CODECS)) {
507
- throw new Error("invalid encoding: ".concat(encoding));
508
- }
509
-
510
- return _codecs.PARQUET_CODECS[encoding].encodeValues(type, values, opts);
511
- }
512
-
513
- function encodeDataPage(_x15, _x16) {
514
- return _encodeDataPage.apply(this, arguments);
515
- }
516
-
517
- function _encodeDataPage() {
518
- _encodeDataPage = (0, _asyncToGenerator2.default)(_regenerator.default.mark(function _callee11(column, data) {
519
- var rLevelsBuf, dLevelsBuf, valuesBuf, dataBuf, compressedBuf, header, headerBuf, page;
520
- return _regenerator.default.wrap(function _callee11$(_context11) {
521
- while (1) {
522
- switch (_context11.prev = _context11.next) {
523
- case 0:
524
- rLevelsBuf = Buffer.alloc(0);
525
-
526
- if (column.rLevelMax > 0) {
527
- rLevelsBuf = encodeValues(PARQUET_RDLVL_TYPE, PARQUET_RDLVL_ENCODING, data.rlevels, {
528
- bitWidth: (0, _readUtils.getBitWidth)(column.rLevelMax)
529
- });
530
- }
531
-
532
- dLevelsBuf = Buffer.alloc(0);
533
-
534
- if (column.dLevelMax > 0) {
535
- dLevelsBuf = encodeValues(PARQUET_RDLVL_TYPE, PARQUET_RDLVL_ENCODING, data.dlevels, {
536
- bitWidth: (0, _readUtils.getBitWidth)(column.dLevelMax)
537
- });
538
- }
539
-
540
- valuesBuf = encodeValues(column.primitiveType, column.encoding, data.values, {
541
- typeLength: column.typeLength,
542
- bitWidth: column.typeLength
543
- });
544
- dataBuf = Buffer.concat([rLevelsBuf, dLevelsBuf, valuesBuf]);
545
- _context11.next = 8;
546
- return Compression.deflate(column.compression, dataBuf);
547
-
548
- case 8:
549
- compressedBuf = _context11.sent;
550
- header = new _parquetThrift.PageHeader({
551
- type: _parquetThrift.PageType.DATA_PAGE,
552
- data_page_header: new _parquetThrift.DataPageHeader({
553
- num_values: data.count,
554
- encoding: _parquetThrift.Encoding[column.encoding],
555
- definition_level_encoding: _parquetThrift.Encoding[PARQUET_RDLVL_ENCODING],
556
- repetition_level_encoding: _parquetThrift.Encoding[PARQUET_RDLVL_ENCODING]
557
- }),
558
- uncompressed_page_size: dataBuf.length,
559
- compressed_page_size: compressedBuf.length
560
- });
561
- headerBuf = (0, _readUtils.serializeThrift)(header);
562
- page = Buffer.concat([headerBuf, compressedBuf]);
563
- return _context11.abrupt("return", {
564
- header: header,
565
- headerSize: headerBuf.length,
566
- page: page
567
- });
568
-
569
- case 13:
570
- case "end":
571
- return _context11.stop();
572
- }
573
- }
574
- }, _callee11);
575
- }));
576
- return _encodeDataPage.apply(this, arguments);
577
- }
578
-
579
- function encodeDataPageV2(_x17, _x18, _x19) {
580
- return _encodeDataPageV.apply(this, arguments);
581
- }
582
-
583
- function _encodeDataPageV() {
584
- _encodeDataPageV = (0, _asyncToGenerator2.default)(_regenerator.default.mark(function _callee12(column, data, rowCount) {
585
- var valuesBuf, compressedBuf, rLevelsBuf, dLevelsBuf, header, headerBuf, page;
586
- return _regenerator.default.wrap(function _callee12$(_context12) {
587
- while (1) {
588
- switch (_context12.prev = _context12.next) {
589
- case 0:
590
- valuesBuf = encodeValues(column.primitiveType, column.encoding, data.values, {
591
- typeLength: column.typeLength,
592
- bitWidth: column.typeLength
593
- });
594
- _context12.next = 3;
595
- return Compression.deflate(column.compression, valuesBuf);
596
-
597
- case 3:
598
- compressedBuf = _context12.sent;
599
- rLevelsBuf = Buffer.alloc(0);
600
-
601
- if (column.rLevelMax > 0) {
602
- rLevelsBuf = encodeValues(PARQUET_RDLVL_TYPE, PARQUET_RDLVL_ENCODING, data.rlevels, {
603
- bitWidth: (0, _readUtils.getBitWidth)(column.rLevelMax),
604
- disableEnvelope: true
605
- });
606
- }
607
-
608
- dLevelsBuf = Buffer.alloc(0);
609
-
610
- if (column.dLevelMax > 0) {
611
- dLevelsBuf = encodeValues(PARQUET_RDLVL_TYPE, PARQUET_RDLVL_ENCODING, data.dlevels, {
612
- bitWidth: (0, _readUtils.getBitWidth)(column.dLevelMax),
613
- disableEnvelope: true
614
- });
615
- }
616
-
617
- header = new _parquetThrift.PageHeader({
618
- type: _parquetThrift.PageType.DATA_PAGE_V2,
619
- data_page_header_v2: new _parquetThrift.DataPageHeaderV2({
620
- num_values: data.count,
621
- num_nulls: data.count - data.values.length,
622
- num_rows: rowCount,
623
- encoding: _parquetThrift.Encoding[column.encoding],
624
- definition_levels_byte_length: dLevelsBuf.length,
625
- repetition_levels_byte_length: rLevelsBuf.length,
626
- is_compressed: column.compression !== 'UNCOMPRESSED'
627
- }),
628
- uncompressed_page_size: rLevelsBuf.length + dLevelsBuf.length + valuesBuf.length,
629
- compressed_page_size: rLevelsBuf.length + dLevelsBuf.length + compressedBuf.length
630
- });
631
- headerBuf = (0, _readUtils.serializeThrift)(header);
632
- page = Buffer.concat([headerBuf, rLevelsBuf, dLevelsBuf, compressedBuf]);
633
- return _context12.abrupt("return", {
634
- header: header,
635
- headerSize: headerBuf.length,
636
- page: page
637
- });
638
-
639
- case 12:
640
- case "end":
641
- return _context12.stop();
642
- }
643
- }
644
- }, _callee12);
645
- }));
646
- return _encodeDataPageV.apply(this, arguments);
647
- }
648
-
649
- function encodeColumnChunk(_x20, _x21, _x22, _x23) {
650
- return _encodeColumnChunk.apply(this, arguments);
651
- }
652
-
653
- function _encodeColumnChunk() {
654
- _encodeColumnChunk = (0, _asyncToGenerator2.default)(_regenerator.default.mark(function _callee13(column, buffer, offset, opts) {
655
- var data, baseOffset, pageBuf, total_uncompressed_size, total_compressed_size, result, metadata, metadataOffset, body;
656
- return _regenerator.default.wrap(function _callee13$(_context13) {
657
- while (1) {
658
- switch (_context13.prev = _context13.next) {
659
- case 0:
660
- data = buffer.columnData[column.path.join()];
661
- baseOffset = (opts.baseOffset || 0) + offset;
662
- total_uncompressed_size = 0;
663
- total_compressed_size = 0;
664
-
665
- if (!opts.useDataPageV2) {
666
- _context13.next = 10;
667
- break;
668
- }
669
-
670
- _context13.next = 7;
671
- return encodeDataPageV2(column, data, buffer.rowCount);
672
-
673
- case 7:
674
- _context13.t0 = _context13.sent;
675
- _context13.next = 13;
676
- break;
677
-
678
- case 10:
679
- _context13.next = 12;
680
- return encodeDataPage(column, data);
681
-
682
- case 12:
683
- _context13.t0 = _context13.sent;
684
-
685
- case 13:
686
- result = _context13.t0;
687
- pageBuf = result.page;
688
- total_uncompressed_size += result.header.uncompressed_page_size + result.headerSize;
689
- total_compressed_size += result.header.compressed_page_size + result.headerSize;
690
- metadata = new _parquetThrift.ColumnMetaData({
691
- path_in_schema: column.path,
692
- num_values: data.count,
693
- data_page_offset: baseOffset,
694
- encodings: [],
695
- total_uncompressed_size: total_uncompressed_size,
696
- total_compressed_size: total_compressed_size,
697
- type: _parquetThrift.Type[column.primitiveType],
698
- codec: _parquetThrift.CompressionCodec[column.compression]
699
- });
700
- metadata.encodings.push(_parquetThrift.Encoding[PARQUET_RDLVL_ENCODING]);
701
- metadata.encodings.push(_parquetThrift.Encoding[column.encoding]);
702
- metadataOffset = baseOffset + pageBuf.length;
703
- body = Buffer.concat([pageBuf, (0, _readUtils.serializeThrift)(metadata)]);
704
- return _context13.abrupt("return", {
705
- body: body,
706
- metadata: metadata,
707
- metadataOffset: metadataOffset
708
- });
709
-
710
- case 23:
711
- case "end":
712
- return _context13.stop();
713
- }
714
- }
715
- }, _callee13);
716
- }));
717
- return _encodeColumnChunk.apply(this, arguments);
718
- }
719
-
720
- function encodeRowGroup(_x24, _x25, _x26) {
721
- return _encodeRowGroup.apply(this, arguments);
722
- }
723
-
724
- function _encodeRowGroup() {
725
- _encodeRowGroup = (0, _asyncToGenerator2.default)(_regenerator.default.mark(function _callee14(schema, data, opts) {
726
- var metadata, body, _iterator2, _step2, field, cchunkData, cchunk;
727
-
728
- return _regenerator.default.wrap(function _callee14$(_context14) {
729
- while (1) {
730
- switch (_context14.prev = _context14.next) {
731
- case 0:
732
- metadata = new _parquetThrift.RowGroup({
733
- num_rows: data.rowCount,
734
- columns: [],
735
- total_byte_size: 0
736
- });
737
- body = Buffer.alloc(0);
738
- _iterator2 = _createForOfIteratorHelper(schema.fieldList);
739
- _context14.prev = 3;
740
-
741
- _iterator2.s();
742
-
743
- case 5:
744
- if ((_step2 = _iterator2.n()).done) {
745
- _context14.next = 18;
746
- break;
747
- }
748
-
749
- field = _step2.value;
750
-
751
- if (!field.isNested) {
752
- _context14.next = 9;
753
- break;
754
- }
755
-
756
- return _context14.abrupt("continue", 16);
757
-
758
- case 9:
759
- _context14.next = 11;
760
- return encodeColumnChunk(field, data, body.length, opts);
761
-
762
- case 11:
763
- cchunkData = _context14.sent;
764
- cchunk = new _parquetThrift.ColumnChunk({
765
- file_offset: cchunkData.metadataOffset,
766
- meta_data: cchunkData.metadata
767
- });
768
- metadata.columns.push(cchunk);
769
- metadata.total_byte_size = new _nodeInt.default(Number(metadata.total_byte_size) + cchunkData.body.length);
770
- body = Buffer.concat([body, cchunkData.body]);
771
-
772
- case 16:
773
- _context14.next = 5;
774
- break;
775
-
776
- case 18:
777
- _context14.next = 23;
778
- break;
779
-
780
- case 20:
781
- _context14.prev = 20;
782
- _context14.t0 = _context14["catch"](3);
783
-
784
- _iterator2.e(_context14.t0);
785
-
786
- case 23:
787
- _context14.prev = 23;
788
-
789
- _iterator2.f();
790
-
791
- return _context14.finish(23);
792
-
793
- case 26:
794
- return _context14.abrupt("return", {
795
- body: body,
796
- metadata: metadata
797
- });
798
-
799
- case 27:
800
- case "end":
801
- return _context14.stop();
802
- }
803
- }
804
- }, _callee14, null, [[3, 20, 23, 26]]);
805
- }));
806
- return _encodeRowGroup.apply(this, arguments);
807
- }
808
-
809
- function encodeFooter(schema, rowCount, rowGroups, userMetadata) {
810
- var metadata = new _parquetThrift.FileMetaData({
811
- version: PARQUET_VERSION,
812
- created_by: 'parquets',
813
- num_rows: rowCount,
814
- row_groups: rowGroups,
815
- schema: [],
816
- key_value_metadata: []
817
- });
818
-
819
- for (var key in userMetadata) {
820
- var _metadata$key_value_m, _metadata$key_value_m2;
821
-
822
- var kv = new _parquetThrift.KeyValue({
823
- key: key,
824
- value: userMetadata[key]
825
- });
826
- (_metadata$key_value_m = metadata.key_value_metadata) === null || _metadata$key_value_m === void 0 ? void 0 : (_metadata$key_value_m2 = _metadata$key_value_m.push) === null || _metadata$key_value_m2 === void 0 ? void 0 : _metadata$key_value_m2.call(_metadata$key_value_m, kv);
827
- }
828
-
829
- {
830
- var schemaRoot = new _parquetThrift.SchemaElement({
831
- name: 'root',
832
- num_children: Object.keys(schema.fields).length
833
- });
834
- metadata.schema.push(schemaRoot);
835
- }
836
-
837
- var _iterator = _createForOfIteratorHelper(schema.fieldList),
838
- _step;
839
-
840
- try {
841
- for (_iterator.s(); !(_step = _iterator.n()).done;) {
842
- var field = _step.value;
843
- var relt = _parquetThrift.FieldRepetitionType[field.repetitionType];
844
- var schemaElem = new _parquetThrift.SchemaElement({
845
- name: field.name,
846
- repetition_type: relt
847
- });
848
-
849
- if (field.isNested) {
850
- schemaElem.num_children = field.fieldCount;
851
- } else {
852
- schemaElem.type = _parquetThrift.Type[field.primitiveType];
853
- }
854
-
855
- if (field.originalType) {
856
- schemaElem.converted_type = _parquetThrift.ConvertedType[field.originalType];
857
- }
858
-
859
- schemaElem.type_length = field.typeLength;
860
- metadata.schema.push(schemaElem);
861
- }
862
- } catch (err) {
863
- _iterator.e(err);
864
- } finally {
865
- _iterator.f();
866
- }
867
-
868
- var metadataEncoded = (0, _readUtils.serializeThrift)(metadata);
869
- var footerEncoded = Buffer.alloc(metadataEncoded.length + 8);
870
- metadataEncoded.copy(footerEncoded);
871
- footerEncoded.writeUInt32LE(metadataEncoded.length, metadataEncoded.length);
872
- footerEncoded.write(PARQUET_MAGIC, metadataEncoded.length + 4);
873
- return footerEncoded;
874
- }
875
- //# sourceMappingURL=writer.js.map