zsv 1.3.1 → 1.4.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (229) hide show
  1. checksums.yaml +4 -4
  2. data/CHANGELOG.md +13 -0
  3. data/README.md +41 -3
  4. data/ext/zsv/extconf.rb +1 -1
  5. data/lib/zsv/version.rb +1 -1
  6. metadata +6 -226
  7. data/ext/zsv/vendor/zsv-1.3.0/app/2db.c +0 -756
  8. data/ext/zsv/vendor/zsv-1.3.0/app/2json.c +0 -381
  9. data/ext/zsv/vendor/zsv-1.3.0/app/2tsv.c +0 -228
  10. data/ext/zsv/vendor/zsv-1.3.0/app/builtin/help.c +0 -123
  11. data/ext/zsv/vendor/zsv-1.3.0/app/builtin/license.c +0 -39
  12. data/ext/zsv/vendor/zsv-1.3.0/app/builtin/register.c +0 -104
  13. data/ext/zsv/vendor/zsv-1.3.0/app/builtin/thirdparty.c +0 -41
  14. data/ext/zsv/vendor/zsv-1.3.0/app/builtin/unregister.c +0 -1
  15. data/ext/zsv/vendor/zsv-1.3.0/app/builtin/version.c +0 -14
  16. data/ext/zsv/vendor/zsv-1.3.0/app/check/simdutf_wrapper.h +0 -19
  17. data/ext/zsv/vendor/zsv-1.3.0/app/check/utf8.c +0 -116
  18. data/ext/zsv/vendor/zsv-1.3.0/app/check.c +0 -194
  19. data/ext/zsv/vendor/zsv-1.3.0/app/cli.c +0 -796
  20. data/ext/zsv/vendor/zsv-1.3.0/app/cli_const.h +0 -41
  21. data/ext/zsv/vendor/zsv-1.3.0/app/cli_export.h +0 -16
  22. data/ext/zsv/vendor/zsv-1.3.0/app/cli_ini.c +0 -280
  23. data/ext/zsv/vendor/zsv-1.3.0/app/cli_internal.h +0 -36
  24. data/ext/zsv/vendor/zsv-1.3.0/app/compare.c +0 -913
  25. data/ext/zsv/vendor/zsv-1.3.0/app/compare.h +0 -23
  26. data/ext/zsv/vendor/zsv-1.3.0/app/compare_added_column.c +0 -20
  27. data/ext/zsv/vendor/zsv-1.3.0/app/compare_internal.h +0 -140
  28. data/ext/zsv/vendor/zsv-1.3.0/app/compare_sort.c +0 -91
  29. data/ext/zsv/vendor/zsv-1.3.0/app/compare_unique_colname.c +0 -81
  30. data/ext/zsv/vendor/zsv-1.3.0/app/count-pull.c +0 -82
  31. data/ext/zsv/vendor/zsv-1.3.0/app/count.c +0 -404
  32. data/ext/zsv/vendor/zsv-1.3.0/app/desc.c +0 -569
  33. data/ext/zsv/vendor/zsv-1.3.0/app/echo.c +0 -365
  34. data/ext/zsv/vendor/zsv-1.3.0/app/ext_example/my_extension.c +0 -366
  35. data/ext/zsv/vendor/zsv-1.3.0/app/ext_example/mysheet_extension.c +0 -341
  36. data/ext/zsv/vendor/zsv-1.3.0/app/ext_template/YOUR_EXTENSION_zsvext.c +0 -263
  37. data/ext/zsv/vendor/zsv-1.3.0/app/external/inih/ini.c +0 -298
  38. data/ext/zsv/vendor/zsv-1.3.0/app/external/inih/ini.h +0 -157
  39. data/ext/zsv/vendor/zsv-1.3.0/app/external/json_writer-1.01/json_numeric.c +0 -177
  40. data/ext/zsv/vendor/zsv-1.3.0/app/external/json_writer-1.01/jsonwriter.c +0 -444
  41. data/ext/zsv/vendor/zsv-1.3.0/app/external/json_writer-1.01/jsonwriter.h +0 -145
  42. data/ext/zsv/vendor/zsv-1.3.0/app/external/json_writer-1.01/utils.c +0 -110
  43. data/ext/zsv/vendor/zsv-1.3.0/app/external/memfile-1.0/include/memfile.h +0 -15
  44. data/ext/zsv/vendor/zsv-1.3.0/app/external/memfile-1.0/src/memfile.c +0 -64
  45. data/ext/zsv/vendor/zsv-1.3.0/app/external/sglib/sglib.h +0 -1955
  46. data/ext/zsv/vendor/zsv-1.3.0/app/external/simdutf/simdutf.h +0 -6802
  47. data/ext/zsv/vendor/zsv-1.3.0/app/external/sqlite3/sqlite3.c +0 -230517
  48. data/ext/zsv/vendor/zsv-1.3.0/app/external/sqlite3/sqlite3.h +0 -12174
  49. data/ext/zsv/vendor/zsv-1.3.0/app/external/sqlite3/sqlite3_and_csv_vtab.c +0 -2
  50. data/ext/zsv/vendor/zsv-1.3.0/app/external/sqlite3/sqlite3_csv_vtab-mem.c +0 -142
  51. data/ext/zsv/vendor/zsv-1.3.0/app/external/sqlite3/sqlite3_csv_vtab-mem.h +0 -49
  52. data/ext/zsv/vendor/zsv-1.3.0/app/external/sqlite3/sqlite3_csv_vtab-zsv.c +0 -485
  53. data/ext/zsv/vendor/zsv-1.3.0/app/external/sqlite3/sqlite3_csv_vtab.c +0 -1015
  54. data/ext/zsv/vendor/zsv-1.3.0/app/external/sqlite3/sqlite3ext.h +0 -663
  55. data/ext/zsv/vendor/zsv-1.3.0/app/external/sqlite3/vtab_helper.c +0 -85
  56. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/build/yajl-2.1.1/include/yajl/yajl_common.h +0 -75
  57. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/build/yajl-2.1.1/include/yajl/yajl_gen.h +0 -167
  58. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/build/yajl-2.1.1/include/yajl/yajl_parse.h +0 -228
  59. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/build/yajl-2.1.1/include/yajl/yajl_tree.h +0 -186
  60. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/build/yajl-2.1.1/include/yajl/yajl_version.h +0 -23
  61. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/api/yajl_common.h +0 -76
  62. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/api/yajl_gen.h +0 -167
  63. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/api/yajl_parse.h +0 -238
  64. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/api/yajl_tree.h +0 -186
  65. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/yajl.c +0 -184
  66. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/yajl_alloc.c +0 -52
  67. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/yajl_alloc.h +0 -34
  68. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/yajl_buf.c +0 -103
  69. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/yajl_buf.h +0 -57
  70. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/yajl_bytestack.h +0 -69
  71. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/yajl_encode.c +0 -220
  72. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/yajl_encode.h +0 -34
  73. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/yajl_gen.c +0 -362
  74. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/yajl_lex.c +0 -764
  75. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/yajl_lex.h +0 -117
  76. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/yajl_parser.c +0 -508
  77. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/yajl_parser.h +0 -78
  78. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/yajl_tree.c +0 -505
  79. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl/src/yajl_version.c +0 -7
  80. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl_helper/yajl_helper/json_value.h +0 -59
  81. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl_helper/yajl_helper/yajl_helper.h +0 -208
  82. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl_helper/yajl_helper.c +0 -795
  83. data/ext/zsv/vendor/zsv-1.3.0/app/external/yajl_helper/yajl_helper_internal.h +0 -28
  84. data/ext/zsv/vendor/zsv-1.3.0/app/flatten.c +0 -851
  85. data/ext/zsv/vendor/zsv-1.3.0/app/jq.c +0 -106
  86. data/ext/zsv/vendor/zsv-1.3.0/app/jq.h +0 -6
  87. data/ext/zsv/vendor/zsv-1.3.0/app/mv.c +0 -113
  88. data/ext/zsv/vendor/zsv-1.3.0/app/noop.c +0 -90
  89. data/ext/zsv/vendor/zsv-1.3.0/app/overwrite.c +0 -295
  90. data/ext/zsv/vendor/zsv-1.3.0/app/paste.c +0 -175
  91. data/ext/zsv/vendor/zsv-1.3.0/app/pretty.c +0 -693
  92. data/ext/zsv/vendor/zsv-1.3.0/app/prop.c +0 -980
  93. data/ext/zsv/vendor/zsv-1.3.0/app/rm.c +0 -131
  94. data/ext/zsv/vendor/zsv-1.3.0/app/select/fixed.c +0 -130
  95. data/ext/zsv/vendor/zsv-1.3.0/app/select/internal.h +0 -118
  96. data/ext/zsv/vendor/zsv-1.3.0/app/select/parallel.c +0 -45
  97. data/ext/zsv/vendor/zsv-1.3.0/app/select/parallel.h +0 -41
  98. data/ext/zsv/vendor/zsv-1.3.0/app/select/processing.c +0 -107
  99. data/ext/zsv/vendor/zsv-1.3.0/app/select/rand.c +0 -20
  100. data/ext/zsv/vendor/zsv-1.3.0/app/select/regex.c +0 -61
  101. data/ext/zsv/vendor/zsv-1.3.0/app/select/search.c +0 -14
  102. data/ext/zsv/vendor/zsv-1.3.0/app/select/selection.c +0 -192
  103. data/ext/zsv/vendor/zsv-1.3.0/app/select/usage.c +0 -72
  104. data/ext/zsv/vendor/zsv-1.3.0/app/select-pull.c +0 -812
  105. data/ext/zsv/vendor/zsv-1.3.0/app/select.c +0 -753
  106. data/ext/zsv/vendor/zsv-1.3.0/app/serialize.c +0 -372
  107. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/curses.h +0 -15
  108. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/cursor.c +0 -119
  109. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/errors.c +0 -45
  110. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/file.c +0 -63
  111. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/file.h +0 -12
  112. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/filter.c +0 -166
  113. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/handlers.c +0 -214
  114. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/handlers_internal.h +0 -128
  115. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/help.c +0 -43
  116. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/index.c +0 -81
  117. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/index.h +0 -25
  118. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/key-bindings.c +0 -325
  119. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/key-bindings.h +0 -73
  120. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/lexer.c +0 -203
  121. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/newline_handler.c +0 -7
  122. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/pivot.c +0 -318
  123. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/procedure.c +0 -134
  124. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/procedure.h +0 -119
  125. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/read-data.c +0 -322
  126. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/screen_buffer.c +0 -203
  127. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/screen_buffer.h +0 -36
  128. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/sheet-sql.c +0 -167
  129. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/sheet_internal.h +0 -36
  130. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/sqlfilter.c +0 -153
  131. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/terminfo.c +0 -32
  132. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/transformation.c +0 -312
  133. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/transformation.h +0 -29
  134. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/ui_buffer.c +0 -266
  135. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/usage.c +0 -9
  136. data/ext/zsv/vendor/zsv-1.3.0/app/sheet/utf8-width.c +0 -60
  137. data/ext/zsv/vendor/zsv-1.3.0/app/sheet.c +0 -1007
  138. data/ext/zsv/vendor/zsv-1.3.0/app/sql.c +0 -453
  139. data/ext/zsv/vendor/zsv-1.3.0/app/sql_internal.c +0 -101
  140. data/ext/zsv/vendor/zsv-1.3.0/app/sql_internal.h +0 -49
  141. data/ext/zsv/vendor/zsv-1.3.0/app/stack.c +0 -393
  142. data/ext/zsv/vendor/zsv-1.3.0/app/utils/arg.c +0 -322
  143. data/ext/zsv/vendor/zsv-1.3.0/app/utils/cache.c +0 -228
  144. data/ext/zsv/vendor/zsv-1.3.0/app/utils/cat.c +0 -91
  145. data/ext/zsv/vendor/zsv-1.3.0/app/utils/chunk.c +0 -240
  146. data/ext/zsv/vendor/zsv-1.3.0/app/utils/chunk.h +0 -63
  147. data/ext/zsv/vendor/zsv-1.3.0/app/utils/clock.c +0 -57
  148. data/ext/zsv/vendor/zsv-1.3.0/app/utils/db.c +0 -148
  149. data/ext/zsv/vendor/zsv-1.3.0/app/utils/dirs-no-jq.c +0 -2
  150. data/ext/zsv/vendor/zsv-1.3.0/app/utils/dirs.c +0 -427
  151. data/ext/zsv/vendor/zsv-1.3.0/app/utils/dirs_from_json.c +0 -253
  152. data/ext/zsv/vendor/zsv-1.3.0/app/utils/dirs_to_json.c +0 -121
  153. data/ext/zsv/vendor/zsv-1.3.0/app/utils/dl.c +0 -20
  154. data/ext/zsv/vendor/zsv-1.3.0/app/utils/emcc/fs_api.c +0 -159
  155. data/ext/zsv/vendor/zsv-1.3.0/app/utils/err.c +0 -24
  156. data/ext/zsv/vendor/zsv-1.3.0/app/utils/file-mem.c +0 -180
  157. data/ext/zsv/vendor/zsv-1.3.0/app/utils/file.c +0 -256
  158. data/ext/zsv/vendor/zsv-1.3.0/app/utils/index.c +0 -197
  159. data/ext/zsv/vendor/zsv-1.3.0/app/utils/index.h +0 -49
  160. data/ext/zsv/vendor/zsv-1.3.0/app/utils/jq.c +0 -400
  161. data/ext/zsv/vendor/zsv-1.3.0/app/utils/json.c +0 -120
  162. data/ext/zsv/vendor/zsv-1.3.0/app/utils/mem.c +0 -18
  163. data/ext/zsv/vendor/zsv-1.3.0/app/utils/memmem.c +0 -132
  164. data/ext/zsv/vendor/zsv-1.3.0/app/utils/os.c +0 -178
  165. data/ext/zsv/vendor/zsv-1.3.0/app/utils/overwrite.c +0 -258
  166. data/ext/zsv/vendor/zsv-1.3.0/app/utils/overwrite_writer.c +0 -246
  167. data/ext/zsv/vendor/zsv-1.3.0/app/utils/pcre2-8/pcre2-8-test.c +0 -123
  168. data/ext/zsv/vendor/zsv-1.3.0/app/utils/pcre2-8/pcre2-8.c +0 -153
  169. data/ext/zsv/vendor/zsv-1.3.0/app/utils/pcre2-8/pcre2-8.h +0 -54
  170. data/ext/zsv/vendor/zsv-1.3.0/app/utils/prop.c +0 -267
  171. data/ext/zsv/vendor/zsv-1.3.0/app/utils/signal.c +0 -53
  172. data/ext/zsv/vendor/zsv-1.3.0/app/utils/string.c +0 -357
  173. data/ext/zsv/vendor/zsv-1.3.0/app/utils/win/dir_exists_longpath.c +0 -83
  174. data/ext/zsv/vendor/zsv-1.3.0/app/utils/win/dl.c +0 -33
  175. data/ext/zsv/vendor/zsv-1.3.0/app/utils/win/fopen_longpath.c +0 -184
  176. data/ext/zsv/vendor/zsv-1.3.0/app/utils/win/foreach_dirent_longpath.c +0 -292
  177. data/ext/zsv/vendor/zsv-1.3.0/app/utils/win/io.c +0 -259
  178. data/ext/zsv/vendor/zsv-1.3.0/app/utils/win/io.h +0 -13
  179. data/ext/zsv/vendor/zsv-1.3.0/app/utils/win/mkdir_longpath.c +0 -255
  180. data/ext/zsv/vendor/zsv-1.3.0/app/utils/win/remove_longpath.c +0 -96
  181. data/ext/zsv/vendor/zsv-1.3.0/app/utils/writer.c +0 -361
  182. data/ext/zsv/vendor/zsv-1.3.0/app/zsv_command.h +0 -40
  183. data/ext/zsv/vendor/zsv-1.3.0/app/zsv_command_standalone.c +0 -16
  184. data/ext/zsv/vendor/zsv-1.3.0/app/zsv_main.h +0 -44
  185. data/ext/zsv/vendor/zsv-1.3.0/examples/js/zsv_parser_api_dummy.c +0 -3
  186. data/ext/zsv/vendor/zsv-1.3.0/examples/lib/parse_by_chunk.c +0 -100
  187. data/ext/zsv/vendor/zsv-1.3.0/examples/lib/print_my_column.c +0 -143
  188. data/ext/zsv/vendor/zsv-1.3.0/examples/lib/pull.c +0 -89
  189. data/ext/zsv/vendor/zsv-1.3.0/examples/lib/simple.c +0 -123
  190. data/ext/zsv/vendor/zsv-1.3.0/fuzz/fuzz.c +0 -16
  191. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/api.h +0 -336
  192. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/common.h +0 -361
  193. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/ext/implementation.h +0 -62
  194. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/ext/implementation_private.h +0 -113
  195. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/ext/sheet.h +0 -73
  196. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/ext.h +0 -329
  197. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/arg.h +0 -90
  198. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/cache.h +0 -49
  199. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/clock.h +0 -36
  200. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/compiler.h +0 -58
  201. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/db.h +0 -19
  202. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/dirs.h +0 -147
  203. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/dl.h +0 -22
  204. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/emcc/fs_api.h +0 -28
  205. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/err.h +0 -22
  206. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/file-mem.h +0 -17
  207. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/file.h +0 -99
  208. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/jq.h +0 -65
  209. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/json.h +0 -19
  210. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/mem.h +0 -19
  211. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/memmem.h +0 -13
  212. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/os.h +0 -54
  213. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/overwrite.h +0 -71
  214. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/overwrite_writer.h +0 -53
  215. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/prop.h +0 -107
  216. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/signal.h +0 -18
  217. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/sql.h +0 -11
  218. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/string.h +0 -148
  219. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/utf8.h +0 -41
  220. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/win/dl.h +0 -25
  221. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/utils/writer.h +0 -101
  222. data/ext/zsv/vendor/zsv-1.3.0/include/zsv/zsv_export.h +0 -33
  223. data/ext/zsv/vendor/zsv-1.3.0/include/zsv.h +0 -20
  224. data/ext/zsv/vendor/zsv-1.3.0/src/vector_delim.c +0 -60
  225. data/ext/zsv/vendor/zsv-1.3.0/src/zsv.c +0 -484
  226. data/ext/zsv/vendor/zsv-1.3.0/src/zsv_internal.c +0 -731
  227. data/ext/zsv/vendor/zsv-1.3.0/src/zsv_scan_delim.c +0 -285
  228. data/ext/zsv/vendor/zsv-1.3.0/src/zsv_scan_fixed.c +0 -88
  229. data/ext/zsv/vendor/zsv-1.3.0/src/zsv_strencode.c +0 -51
@@ -1,484 +0,0 @@
1
- /*
2
- * Copyright (C) 2021 Tai Chi Minh Ralph Eastwood (self), Matt Wong (Guarnerix Inc dba Liquidaty)
3
- * All rights reserved
4
- *
5
- * This file is part of zsv/lib, distributed under the license defined at
6
- * https://opensource.org/licenses/MIT
7
- */
8
-
9
- #ifndef ZSV_MIN_SCANNER_BUFFSIZE
10
- #define ZSV_MIN_SCANNER_BUFFSIZE 4096
11
- #endif
12
-
13
- #include "zsv.h"
14
- #include <zsv/utils/compiler.h>
15
- #ifdef ZSV_EXTRAS
16
- #include <zsv/utils/arg.h>
17
- #endif
18
-
19
- static struct zsv_cell zsv_get_cell_1(zsv_parser parser, size_t ix);
20
- static struct zsv_cell zsv_get_cell_with_overwrite(zsv_parser parser, size_t col_ix);
21
- #include "zsv_internal.c"
22
-
23
- #ifndef ZSV_VERSION
24
- #define ZSV_VERSION "unknown"
25
- #endif
26
-
27
- ZSV_EXPORT
28
- const char *zsv_lib_version(void) {
29
- return ZSV_VERSION;
30
- }
31
-
32
- #include "zsv_strencode.c"
33
-
34
- /**
35
- * When we parse a chunk, if it was not the first parse call, we might have a partial
36
- * row at the end of our buffer that must be moved. The reason we do this at the beginning
37
- * of a parse and not at the end of the prior parse is so that between chunks, the input
38
- * chunk remains available in a contiguous block of one or more rows
39
- */
40
- // __attribute__((always_inline))
41
- inline static size_t scanner_pre_parse(struct zsv_scanner *scanner) {
42
- scanner->last = '\0';
43
- if (VERY_LIKELY(scanner->old_bytes_read)) {
44
- scanner->last = scanner->buff.buff[scanner->old_bytes_read - 1];
45
- if (scanner->row_start < scanner->old_bytes_read) {
46
- size_t len = scanner->old_bytes_read - scanner->row_start;
47
- memmove(scanner->buff.buff, scanner->buff.buff + scanner->row_start, len);
48
- scanner->partial_row_length = len;
49
- } else {
50
- scanner->cell_start = 0;
51
- scanner->row_start = 0;
52
- zsv_clear_cell(scanner);
53
- }
54
- scanner->cell_start -= scanner->row_start;
55
- for (size_t i2 = 0; i2 < scanner->row.used; i2++)
56
- scanner->row.cells[i2].str -= scanner->row_start;
57
- scanner->row_start = 0;
58
- scanner->old_bytes_read = 0;
59
- }
60
-
61
- scanner->cum_scanned_length += scanner->scanned_length - scanner->partial_row_length;
62
-
63
- size_t capacity = scanner->buff.size - scanner->partial_row_length;
64
- if (VERY_UNLIKELY(capacity == 0)) {
65
- // our row size was too small to fit a single row of data
66
- scanner->errprintf(scanner->errf, "Warning: row %zu truncated\n", scanner->data_row_count);
67
- if (scanner->mode == ZSV_MODE_FIXED) {
68
- if (VERY_UNLIKELY(row_fx(scanner, scanner->buff.buff, 0, scanner->buff.size)))
69
- return zsv_status_cancelled;
70
- } else if (VERY_UNLIKELY(row_dl(scanner)))
71
- return zsv_status_cancelled;
72
-
73
- // throw away the next row end
74
- scanner->buffer_exceeded = 1;
75
- scanner->opts.row_handler = zsv_throwaway_row;
76
- scanner->opts.ctx = scanner;
77
-
78
- scanner->partial_row_length = 0;
79
- capacity = scanner->buff.size;
80
- }
81
- return capacity;
82
- }
83
-
84
- /**
85
- * apply --header-row option
86
- */
87
- static enum zsv_status zsv_insert_string(struct zsv_scanner *scanner) {
88
- // to do: replace below with
89
- // return parse_bytes(scanner, bytes, len);
90
- size_t len = strlen(scanner->insert_string);
91
- if (len > scanner->buff.size - scanner->partial_row_length)
92
- len = scanner->buff.size - 1; // to do: throw an error instead
93
- memcpy(scanner->buff.buff + scanner->partial_row_length, scanner->insert_string, len);
94
- if (scanner->buff.buff[len] != '\n')
95
- scanner->buff.buff[len] = '\n';
96
- enum zsv_status stat = zsv_scan(scanner, scanner->buff.buff, len + 1);
97
- scanner->insert_string = NULL;
98
- return stat;
99
- }
100
-
101
- /**
102
- * Read the next chunk of data from our input stream and parse it, calling our
103
- * custom handlers as each cell and row are parsed
104
- */
105
- ZSV_EXPORT
106
- enum zsv_status zsv_parse_more(struct zsv_scanner *scanner) {
107
- if (VERY_UNLIKELY(scanner->insert_string != NULL))
108
- zsv_insert_string(scanner);
109
-
110
- size_t capacity = scanner_pre_parse(scanner);
111
- size_t bytes_read;
112
- if (VERY_UNLIKELY(scanner->checked_bom == 0)) {
113
- #ifdef ZSV_EXTRAS
114
- // initialize progress timer
115
- if (scanner->opts.progress.seconds_interval)
116
- scanner->progress.last_time = time(NULL);
117
- #endif
118
- size_t bom_len = strlen(ZSV_BOM);
119
- scanner->checked_bom = 1;
120
- if ((bytes_read = scanner->read(scanner->buff.buff, 1, bom_len, scanner->in)) == bom_len &&
121
- !memcmp(scanner->buff.buff, ZSV_BOM, bom_len)) {
122
- // have bom. disregard what we just read
123
- bytes_read = scanner->read(scanner->buff.buff, 1, capacity, scanner->in);
124
- scanner->had_bom = 1;
125
- } else { // no BOM. keep the bytes we just read
126
- // bytes_read = bom_len + scanner->read(scanner->buff.buff + bom_len, 1, capacity - bom_len, scanner->in);
127
- if (bytes_read == bom_len) // maybe we only read < 3 bytes
128
- bytes_read += scanner->read(scanner->buff.buff + bom_len, 1, capacity - bom_len, scanner->in);
129
- }
130
- } else // already checked bom. read as usual
131
- bytes_read = scanner->read(scanner->buff.buff + scanner->partial_row_length, 1, capacity, scanner->in);
132
- scanner->started = 1;
133
- if (VERY_UNLIKELY(scanner->filter != NULL))
134
- bytes_read = scanner->filter(scanner->filter_ctx, scanner->buff.buff + scanner->partial_row_length, bytes_read);
135
- if (VERY_LIKELY(bytes_read))
136
- return zsv_scan(scanner, scanner->buff.buff, bytes_read);
137
-
138
- scanner->scanned_length = scanner->partial_row_length;
139
- return zsv_status_no_more_input;
140
- }
141
-
142
- ZSV_EXPORT
143
- void zsv_abort(zsv_parser parser) {
144
- parser->abort = 1;
145
- }
146
-
147
- ZSV_EXPORT
148
- char zsv_row_is_blank(zsv_parser parser) {
149
- return zsv_internal_row_is_blank(parser);
150
- }
151
-
152
- static void zsv_pull_row(void *ctx) {
153
- zsv_parser parser = ctx;
154
- parser->pull.now = 1;
155
- parser->pull.row_used = parser->row.used;
156
- }
157
-
158
- /**
159
- * For pull parsing, use zsv_next_row(). Not quite as fast as push parsing, but pretty close
160
- * @return zsv_status_row on success
161
- */
162
- ZSV_EXPORT
163
- enum zsv_status zsv_next_row(zsv_parser parser) {
164
- if (VERY_UNLIKELY(!parser->pull.regs)) {
165
- if (parser->started)
166
- return zsv_status_error; // error: already started a push parser
167
- if (!(parser->pull.regs = calloc(1, sizeof(*parser->pull.regs))))
168
- return zsv_status_memory;
169
- parser->mode = ZSV_MODE_DELIM_PULL;
170
- zsv_set_row_handler(parser, zsv_pull_row);
171
- zsv_set_context(parser, parser);
172
- if (parser->insert_string != NULL)
173
- parser->pull.stat = zsv_insert_string(parser);
174
- if (parser->pull.stat == zsv_status_row)
175
- return parser->pull.stat;
176
- }
177
- if (VERY_LIKELY(parser->pull.stat == zsv_status_row))
178
- parser->pull.stat = zsv_scan_delim_pull(parser, parser->pull.buff, parser->pull.bytes_read);
179
- if (VERY_UNLIKELY(parser->pull.stat == zsv_status_ok)) {
180
- do {
181
- parser->pull.stat = zsv_parse_more(parser); // should return zsv_status_row or zsv_status_no_more_input
182
- } while (parser->pull.stat == zsv_status_ok);
183
- if (VERY_LIKELY(parser->pull.stat == zsv_status_row))
184
- return parser->pull.stat;
185
- }
186
-
187
- if (VERY_UNLIKELY(parser->pull.stat == zsv_status_no_more_input)) {
188
- parser->pull.now = 0;
189
- zsv_finish(parser);
190
-
191
- parser->pull.stat = zsv_status_done;
192
- if (parser->pull.now) {
193
- parser->pull.now = 0;
194
- parser->row.used = parser->pull.row_used;
195
- return zsv_status_row;
196
- }
197
- }
198
- return parser->pull.stat;
199
- }
200
-
201
- // to do: rename to zsv_column_count(). rename all other zsv_hand to just zsv_
202
- ZSV_EXPORT
203
- size_t zsv_cell_count(zsv_parser parser) {
204
- return parser->row.used;
205
- }
206
-
207
- ZSV_EXPORT
208
- void zsv_set_row_handler(zsv_parser parser, void (*row_handler)(void *ctx)) {
209
- if (parser->opts.row_handler == parser->opts_orig.row_handler)
210
- parser->opts.row_handler = row_handler;
211
- parser->opts_orig.row_handler = row_handler;
212
- }
213
-
214
- ZSV_EXPORT
215
- void zsv_set_context(zsv_parser parser, void *ctx) {
216
- if (parser->opts.ctx == parser->opts_orig.ctx)
217
- parser->opts.ctx = ctx;
218
- parser->opts_orig.ctx = ctx;
219
- }
220
-
221
- ZSV_EXPORT
222
- void zsv_set_read(zsv_parser parser, size_t (*read_func)(void *restrict, size_t n, size_t size, void *restrict)) {
223
- parser->read = read_func;
224
- }
225
-
226
- ZSV_EXPORT
227
- void zsv_set_input(zsv_parser parser, void *in) {
228
- parser->in = in;
229
- }
230
-
231
- ZSV_EXPORT
232
- char zsv_quoted(zsv_parser parser) {
233
- return parser->quoted || parser->opts.no_quotes;
234
- }
235
-
236
- static struct zsv_cell zsv_get_cell_1(zsv_parser parser, size_t ix) {
237
- if (VERY_LIKELY(ix < parser->row.used))
238
- return parser->row.cells[ix];
239
-
240
- struct zsv_cell c = {0, 0, 0, 0};
241
- return c;
242
- }
243
-
244
- // to do: benchmark returning zsv_cell struct vs just a zsv_cell pointer
245
- ZSV_EXPORT
246
- struct zsv_cell zsv_get_cell(zsv_parser parser, size_t ix) {
247
- return parser->get_cell(parser, ix);
248
- }
249
-
250
- /**
251
- * `zsv_get_cell_len()` is not needed in most cases, but may be useful in
252
- * restrictive cases such as when calling from Javascript into wasm
253
- */
254
- ZSV_EXPORT
255
- size_t zsv_get_cell_len(zsv_parser parser, size_t ix) {
256
- if (ix < parser->row.used)
257
- return parser->row.cells[ix].len;
258
- return 0;
259
- }
260
-
261
- ZSV_EXPORT
262
- unsigned char *zsv_get_cell_str(zsv_parser parser, size_t ix) {
263
- struct zsv_cell c = zsv_get_cell_1(parser, ix);
264
- return c.len ? c.str : NULL;
265
- }
266
-
267
- ZSV_EXPORT enum zsv_status zsv_set_fixed_offsets(zsv_parser parser, size_t count, size_t *offsets) {
268
- if (!count) {
269
- parser->errprintf(parser->errf, "Fixed offset count must be greater than zero\n");
270
- return zsv_status_invalid_option;
271
- }
272
- if (offsets[0] == 0)
273
- parser->errprintf(parser->errf, "Warning: first cell width is zero\n");
274
- for (size_t i = 1; i < count; i++) {
275
- if (offsets[i - 1] > offsets[i]) {
276
- parser->errprintf(parser->errf, "Invalid offset %zu may not exceed prior offset %zu\n", offsets[i],
277
- offsets[i - 1]);
278
- return zsv_status_invalid_option;
279
- } else if (offsets[i - 1] == offsets[i])
280
- parser->errprintf(parser->errf, "Warning: offset %zu repeated, will always yield empty cell\n", offsets[i - 1]);
281
- }
282
-
283
- if (offsets[count - 1] > parser->buff.size) {
284
- parser->errprintf(parser->errf, "Offset %zu exceeds total buffer size %zu\n", offsets[count - 1],
285
- parser->buff.size);
286
- return zsv_status_invalid_option;
287
- }
288
- if (parser->cum_scanned_length) {
289
- parser->errprintf(parser->errf, "Scanner mode cannot be changed after parsing has begun\n");
290
- return zsv_status_invalid_option;
291
- }
292
-
293
- free(parser->fixed.offsets);
294
- parser->fixed.offsets = calloc(count, sizeof(*parser->fixed.offsets));
295
- if (parser->fixed.offsets == NULL) {
296
- parser->errprintf(parser->errf, "Out of memory!\n");
297
- return zsv_status_memory;
298
- }
299
- parser->fixed.count = count;
300
- for (unsigned i = 0; i < count; i++)
301
- parser->fixed.offsets[i] = offsets[i];
302
-
303
- parser->mode = ZSV_MODE_FIXED;
304
- parser->checked_bom = 1;
305
-
306
- set_callbacks(parser);
307
-
308
- return zsv_status_ok;
309
- }
310
-
311
- ZSV_EXPORT
312
- int zsv_peek(zsv_parser z) {
313
- if (z->scanned_length + 1 < z->buff.size)
314
- return z->buff.buff[z->scanned_length + 1];
315
- return -1;
316
- }
317
-
318
- /**
319
- * Create a zsv parser
320
- * @param opts
321
- * @returns parser handle
322
- */
323
- ZSV_EXPORT
324
- zsv_parser zsv_new(struct zsv_opts *opts) {
325
- struct zsv_opts tmp;
326
- if (!opts) {
327
- opts = &tmp;
328
- memset(opts, 0, sizeof(*opts));
329
- }
330
-
331
- if (!opts->max_row_size)
332
- opts->max_row_size = ZSV_ROW_MAX_SIZE_DEFAULT;
333
- if (!opts->max_columns)
334
- opts->max_columns = ZSV_MAX_COLS_DEFAULT;
335
- if (opts->delimiter == '\n' || opts->delimiter == '\r' || opts->delimiter == '"') {
336
- int (*errprintf)(void *, const char *fmt, ...) = opts->errprintf ? opts->errprintf : zsv_generic_fprintf;
337
- errprintf(opts->errf ? opts->errf : stderr, "Invalid delimiter\n");
338
- return NULL;
339
- }
340
- struct zsv_scanner *scanner = calloc(1, sizeof(*scanner));
341
- if (scanner) {
342
- if (zsv_scanner_init(scanner, opts)) {
343
- zsv_delete(scanner);
344
- scanner = NULL;
345
- }
346
- }
347
- return scanner;
348
- }
349
-
350
- ZSV_EXPORT
351
- enum zsv_status zsv_finish(struct zsv_scanner *scanner) {
352
- enum zsv_status stat = zsv_status_ok;
353
- if (!scanner)
354
- return zsv_status_error;
355
- if (!scanner->abort) {
356
- if (scanner->mode == ZSV_MODE_FIXED) {
357
- if (scanner->partial_row_length && memchr("\n\r", scanner->buff.buff[scanner->partial_row_length - 1], 2))
358
- scanner->partial_row_length--;
359
- if (scanner->partial_row_length)
360
- return row_fx(scanner, scanner->buff.buff, 0, scanner->partial_row_length);
361
- return zsv_status_ok;
362
- }
363
-
364
- if ((scanner->quoted & ZSV_PARSER_QUOTE_UNCLOSED) && scanner->partial_row_length > scanner->cell_start) {
365
- int quote = '"';
366
- scanner->quoted |= ZSV_PARSER_QUOTE_CLOSED;
367
- scanner->quoted -= ZSV_PARSER_QUOTE_UNCLOSED;
368
- if (scanner->last == quote)
369
- scanner->quote_close_position = scanner->partial_row_length - scanner->cell_start;
370
- else {
371
- scanner->quote_close_position = scanner->partial_row_length - scanner->cell_start;
372
- scanner->scanned_length++;
373
- }
374
- }
375
- }
376
-
377
- if (!scanner->finished) {
378
- scanner->finished = 1;
379
- if (!scanner->abort) {
380
- if (scanner->scanned_length > 0 && scanner->scanned_length >= scanner->cell_start)
381
- cell_dl(scanner, scanner->buff.buff + scanner->cell_start, scanner->scanned_length - scanner->cell_start);
382
- if (scanner->have_cell) {
383
- if (row_dl(scanner))
384
- stat = zsv_status_cancelled;
385
- }
386
- } else
387
- stat = zsv_status_cancelled;
388
- #ifdef ZSV_EXTRAS
389
- if (scanner->opts.completed.callback)
390
- scanner->opts.completed.callback(scanner->opts.completed.ctx, stat);
391
- #endif
392
- }
393
- return stat;
394
- }
395
-
396
- ZSV_EXPORT
397
- enum zsv_status zsv_delete(zsv_parser parser) {
398
- if (parser) {
399
- if (parser->free_buff && parser->buff.buff)
400
- free(parser->buff.buff);
401
-
402
- free(parser->row.cells);
403
- free(parser->fixed.offsets);
404
- collate_header_destroy(&parser->collate_header);
405
- free(parser->pull.regs);
406
-
407
- #ifdef ZSV_EXTRAS
408
- if (parser->overwrite.close)
409
- parser->overwrite.close(parser->overwrite.ctx);
410
- #endif
411
-
412
- if (parser->errclose)
413
- parser->errclose(parser->errf);
414
- free(parser);
415
- }
416
- return zsv_status_ok;
417
- }
418
-
419
- ZSV_EXPORT
420
- const unsigned char *zsv_parse_status_desc(enum zsv_status status) {
421
- switch (status) {
422
- case zsv_status_ok:
423
- return (unsigned char *)"OK";
424
- case zsv_status_cancelled:
425
- return (unsigned char *)"User cancelled";
426
- case zsv_status_no_more_input:
427
- return (unsigned char *)"No more input";
428
- case zsv_status_invalid_option:
429
- return (unsigned char *)"Invalid option";
430
- case zsv_status_memory:
431
- return (unsigned char *)"Out of memory";
432
- case zsv_status_done:
433
- return (unsigned char *)"No more rows to pull";
434
- case zsv_status_row:
435
- return (unsigned char *)"Row successfully pulled";
436
- case zsv_status_error:
437
- return (unsigned char *)"Unexpected error";
438
- #ifdef ZSV_EXTRAS
439
- case zsv_status_max_rows_read:
440
- return (unsigned char *)"Maximum specified rows have been parsed";
441
- #endif
442
- }
443
- return (unsigned char *)"Unknown";
444
- }
445
-
446
- ZSV_EXPORT
447
- size_t zsv_scanned_length(zsv_parser parser) {
448
- return parser->scanned_length;
449
- }
450
-
451
- ZSV_EXPORT
452
- size_t zsv_cum_scanned_length(zsv_parser parser) {
453
- return parser->cum_scanned_length + (parser->finished ? 0 : parser->scanned_length) +
454
- (parser->had_bom ? strlen(ZSV_BOM) : 0);
455
- }
456
-
457
- ZSV_EXPORT
458
- size_t zsv_row_length_raw_bytes(zsv_parser parser) {
459
- return parser->scanned_length - parser->row_start;
460
- }
461
-
462
- /**
463
- * @param parser parser handle
464
- * @param buff the input buffer. Note: this buffer may not overlap with
465
- * the parser buffer!
466
- * @param len length of the input to parse
467
- */
468
- enum zsv_status zsv_parse_bytes(struct zsv_scanner *scanner, const unsigned char *bytes, size_t len) {
469
- enum zsv_status stat = zsv_status_ok;
470
- const unsigned char *cursor = bytes;
471
- while (len && stat == zsv_status_ok) {
472
- size_t capacity = scanner_pre_parse(scanner);
473
- size_t this_chunk_size = len > capacity ? capacity : len;
474
- memcpy(scanner->buff.buff + scanner->partial_row_length, cursor, this_chunk_size);
475
- cursor += this_chunk_size;
476
- len -= this_chunk_size;
477
- if (scanner->filter)
478
- this_chunk_size =
479
- scanner->filter(scanner->filter_ctx, scanner->buff.buff + scanner->partial_row_length, this_chunk_size);
480
- if (this_chunk_size)
481
- stat = zsv_scan(scanner, scanner->buff.buff, this_chunk_size);
482
- }
483
- return stat;
484
- }