jtcsv 2.2.8 → 3.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (246) hide show
  1. package/README.md +204 -115
  2. package/bin/jtcsv.ts +2612 -0
  3. package/browser.d.ts +142 -0
  4. package/dist/benchmark.js +446 -0
  5. package/dist/benchmark.js.map +1 -0
  6. package/dist/bin/jtcsv.js +1940 -0
  7. package/dist/bin/jtcsv.js.map +1 -0
  8. package/dist/csv-to-json.js +1262 -0
  9. package/dist/csv-to-json.js.map +1 -0
  10. package/dist/errors.js +291 -0
  11. package/dist/errors.js.map +1 -0
  12. package/dist/eslint.config.js +147 -0
  13. package/dist/eslint.config.js.map +1 -0
  14. package/dist/index-core.js +95 -0
  15. package/dist/index-core.js.map +1 -0
  16. package/dist/index.js +93 -0
  17. package/dist/index.js.map +1 -0
  18. package/dist/json-save.js +229 -0
  19. package/dist/json-save.js.map +1 -0
  20. package/dist/json-to-csv.js +576 -0
  21. package/dist/json-to-csv.js.map +1 -0
  22. package/dist/jtcsv-core.cjs.js +1736 -0
  23. package/dist/jtcsv-core.cjs.js.map +1 -0
  24. package/dist/jtcsv-core.esm.js +1708 -0
  25. package/dist/jtcsv-core.esm.js.map +1 -0
  26. package/dist/jtcsv-core.umd.js +1742 -0
  27. package/dist/jtcsv-core.umd.js.map +1 -0
  28. package/dist/jtcsv-full.cjs.js +2241 -0
  29. package/dist/jtcsv-full.cjs.js.map +1 -0
  30. package/dist/jtcsv-full.esm.js +2209 -0
  31. package/dist/jtcsv-full.esm.js.map +1 -0
  32. package/dist/jtcsv-full.umd.js +2247 -0
  33. package/dist/jtcsv-full.umd.js.map +1 -0
  34. package/dist/jtcsv-workers.esm.js +768 -0
  35. package/dist/jtcsv-workers.esm.js.map +1 -0
  36. package/dist/jtcsv-workers.umd.js +782 -0
  37. package/dist/jtcsv-workers.umd.js.map +1 -0
  38. package/dist/jtcsv.cjs.js +1996 -2048
  39. package/dist/jtcsv.cjs.js.map +1 -1
  40. package/dist/jtcsv.esm.js +1992 -2048
  41. package/dist/jtcsv.esm.js.map +1 -1
  42. package/dist/jtcsv.umd.js +2157 -2209
  43. package/dist/jtcsv.umd.js.map +1 -1
  44. package/dist/plugins/express-middleware/index.js +350 -0
  45. package/dist/plugins/express-middleware/index.js.map +1 -0
  46. package/dist/plugins/fastify-plugin/index.js +315 -0
  47. package/dist/plugins/fastify-plugin/index.js.map +1 -0
  48. package/dist/plugins/hono/index.js +111 -0
  49. package/dist/plugins/hono/index.js.map +1 -0
  50. package/dist/plugins/nestjs/index.js +112 -0
  51. package/dist/plugins/nestjs/index.js.map +1 -0
  52. package/dist/plugins/nuxt/index.js +53 -0
  53. package/dist/plugins/nuxt/index.js.map +1 -0
  54. package/dist/plugins/remix/index.js +133 -0
  55. package/dist/plugins/remix/index.js.map +1 -0
  56. package/dist/plugins/sveltekit/index.js +155 -0
  57. package/dist/plugins/sveltekit/index.js.map +1 -0
  58. package/dist/plugins/trpc/index.js +136 -0
  59. package/dist/plugins/trpc/index.js.map +1 -0
  60. package/dist/run-demo.js +49 -0
  61. package/dist/run-demo.js.map +1 -0
  62. package/dist/src/browser/browser-functions.js +193 -0
  63. package/dist/src/browser/browser-functions.js.map +1 -0
  64. package/dist/src/browser/core.js +123 -0
  65. package/dist/src/browser/core.js.map +1 -0
  66. package/dist/src/browser/csv-to-json-browser.js +353 -0
  67. package/dist/src/browser/csv-to-json-browser.js.map +1 -0
  68. package/dist/src/browser/errors-browser.js +219 -0
  69. package/dist/src/browser/errors-browser.js.map +1 -0
  70. package/dist/src/browser/extensions/plugins.js +106 -0
  71. package/dist/src/browser/extensions/plugins.js.map +1 -0
  72. package/dist/src/browser/extensions/workers.js +66 -0
  73. package/dist/src/browser/extensions/workers.js.map +1 -0
  74. package/dist/src/browser/index.js +140 -0
  75. package/dist/src/browser/index.js.map +1 -0
  76. package/dist/src/browser/json-to-csv-browser.js +225 -0
  77. package/dist/src/browser/json-to-csv-browser.js.map +1 -0
  78. package/dist/src/browser/streams.js +340 -0
  79. package/dist/src/browser/streams.js.map +1 -0
  80. package/dist/src/browser/workers/csv-parser.worker.js +264 -0
  81. package/dist/src/browser/workers/csv-parser.worker.js.map +1 -0
  82. package/dist/src/browser/workers/worker-pool.js +338 -0
  83. package/dist/src/browser/workers/worker-pool.js.map +1 -0
  84. package/dist/src/core/delimiter-cache.js +196 -0
  85. package/dist/src/core/delimiter-cache.js.map +1 -0
  86. package/dist/src/core/node-optimizations.js +279 -0
  87. package/dist/src/core/node-optimizations.js.map +1 -0
  88. package/dist/src/core/plugin-system.js +399 -0
  89. package/dist/src/core/plugin-system.js.map +1 -0
  90. package/dist/src/core/transform-hooks.js +348 -0
  91. package/dist/src/core/transform-hooks.js.map +1 -0
  92. package/dist/src/engines/fast-path-engine-new.js +262 -0
  93. package/dist/src/engines/fast-path-engine-new.js.map +1 -0
  94. package/dist/src/engines/fast-path-engine.js +671 -0
  95. package/dist/src/engines/fast-path-engine.js.map +1 -0
  96. package/dist/src/errors.js +18 -0
  97. package/dist/src/errors.js.map +1 -0
  98. package/dist/src/formats/ndjson-parser.js +332 -0
  99. package/dist/src/formats/ndjson-parser.js.map +1 -0
  100. package/dist/src/formats/tsv-parser.js +230 -0
  101. package/dist/src/formats/tsv-parser.js.map +1 -0
  102. package/dist/src/index-with-plugins.js +259 -0
  103. package/dist/src/index-with-plugins.js.map +1 -0
  104. package/dist/src/types/index.js +3 -0
  105. package/dist/src/types/index.js.map +1 -0
  106. package/dist/src/utils/bom-utils.js +267 -0
  107. package/dist/src/utils/bom-utils.js.map +1 -0
  108. package/dist/src/utils/encoding-support.js +77 -0
  109. package/dist/src/utils/encoding-support.js.map +1 -0
  110. package/dist/src/utils/schema-validator.js +609 -0
  111. package/dist/src/utils/schema-validator.js.map +1 -0
  112. package/dist/src/utils/transform-loader.js +281 -0
  113. package/dist/src/utils/transform-loader.js.map +1 -0
  114. package/dist/src/utils/validators.js +40 -0
  115. package/dist/src/utils/validators.js.map +1 -0
  116. package/dist/src/utils/zod-adapter.js +144 -0
  117. package/dist/src/utils/zod-adapter.js.map +1 -0
  118. package/dist/src/web-server/index.js +648 -0
  119. package/dist/src/web-server/index.js.map +1 -0
  120. package/dist/src/workers/csv-multithreaded.js +211 -0
  121. package/dist/src/workers/csv-multithreaded.js.map +1 -0
  122. package/dist/src/workers/csv-parser.worker.js +179 -0
  123. package/dist/src/workers/csv-parser.worker.js.map +1 -0
  124. package/dist/src/workers/worker-pool.js +228 -0
  125. package/dist/src/workers/worker-pool.js.map +1 -0
  126. package/dist/stream-csv-to-json.js +665 -0
  127. package/dist/stream-csv-to-json.js.map +1 -0
  128. package/dist/stream-json-to-csv.js +389 -0
  129. package/dist/stream-json-to-csv.js.map +1 -0
  130. package/examples/advanced/conditional-transformations.ts +446 -0
  131. package/examples/advanced/csv-parser.worker.ts +89 -0
  132. package/examples/advanced/nested-objects-example.ts +306 -0
  133. package/examples/advanced/performance-optimization.ts +504 -0
  134. package/examples/advanced/run-demo-server.ts +116 -0
  135. package/examples/advanced/web-worker-usage.html +874 -0
  136. package/examples/async-multithreaded-example.ts +335 -0
  137. package/examples/cli-advanced-usage.md +290 -0
  138. package/examples/{cli-batch-processing.js → cli-batch-processing.ts} +38 -38
  139. package/examples/{cli-tool.js → cli-tool.ts} +5 -8
  140. package/examples/{error-handling.js → error-handling.ts} +356 -324
  141. package/examples/{express-api.js → express-api.ts} +161 -164
  142. package/examples/{large-dataset-example.js → large-dataset-example.ts} +201 -182
  143. package/examples/{ndjson-processing.js → ndjson-processing.ts} +456 -434
  144. package/examples/{plugin-excel-exporter.js → plugin-excel-exporter.ts} +6 -7
  145. package/examples/react-integration.tsx +637 -0
  146. package/examples/{schema-validation.js → schema-validation.ts} +2 -2
  147. package/examples/simple-usage.ts +194 -0
  148. package/examples/{streaming-example.js → streaming-example.ts} +12 -12
  149. package/index.d.ts +187 -18
  150. package/package.json +75 -81
  151. package/plugins.d.ts +37 -0
  152. package/schema.d.ts +103 -0
  153. package/src/browser/browser-functions.ts +402 -0
  154. package/src/browser/core.ts +152 -0
  155. package/src/browser/csv-to-json-browser.d.ts +3 -0
  156. package/src/browser/csv-to-json-browser.ts +494 -0
  157. package/src/browser/{errors-browser.js → errors-browser.ts} +305 -197
  158. package/src/browser/extensions/plugins.ts +93 -0
  159. package/src/browser/extensions/workers.ts +39 -0
  160. package/src/browser/globals.d.ts +5 -0
  161. package/src/browser/index.ts +192 -0
  162. package/src/browser/json-to-csv-browser.d.ts +3 -0
  163. package/src/browser/json-to-csv-browser.ts +338 -0
  164. package/src/browser/streams.ts +403 -0
  165. package/src/browser/workers/{csv-parser.worker.js → csv-parser.worker.ts} +3 -3
  166. package/src/browser/workers/{worker-pool.js → worker-pool.ts} +51 -30
  167. package/src/core/delimiter-cache.ts +320 -0
  168. package/src/core/{node-optimizations.js → node-optimizations.ts} +448 -407
  169. package/src/core/plugin-system.ts +588 -0
  170. package/src/core/transform-hooks.ts +566 -0
  171. package/src/engines/{fast-path-engine-new.js → fast-path-engine-new.ts} +11 -2
  172. package/src/engines/{fast-path-engine.js → fast-path-engine.ts} +79 -53
  173. package/src/errors.ts +1 -0
  174. package/src/formats/{ndjson-parser.js → ndjson-parser.ts} +24 -16
  175. package/src/formats/{tsv-parser.js → tsv-parser.ts} +18 -17
  176. package/src/{index-with-plugins.js → index-with-plugins.ts} +381 -357
  177. package/src/types/index.ts +275 -0
  178. package/src/utils/bom-utils.ts +373 -0
  179. package/src/utils/encoding-support.ts +155 -0
  180. package/src/utils/{schema-validator.js → schema-validator.ts} +814 -589
  181. package/src/utils/transform-loader.ts +389 -0
  182. package/src/utils/validators.ts +35 -0
  183. package/src/utils/zod-adapter.ts +280 -0
  184. package/src/web-server/{index.js → index.ts} +19 -19
  185. package/src/workers/csv-multithreaded.ts +310 -0
  186. package/src/workers/csv-parser.worker.ts +227 -0
  187. package/src/workers/worker-pool.ts +409 -0
  188. package/bin/jtcsv.js +0 -2462
  189. package/csv-to-json.js +0 -688
  190. package/errors.js +0 -208
  191. package/examples/simple-usage.js +0 -282
  192. package/index.js +0 -68
  193. package/json-save.js +0 -254
  194. package/json-to-csv.js +0 -526
  195. package/plugins/README.md +0 -91
  196. package/plugins/express-middleware/README.md +0 -64
  197. package/plugins/express-middleware/example.js +0 -136
  198. package/plugins/express-middleware/index.d.ts +0 -114
  199. package/plugins/express-middleware/index.js +0 -360
  200. package/plugins/express-middleware/package.json +0 -52
  201. package/plugins/fastify-plugin/index.js +0 -406
  202. package/plugins/fastify-plugin/package.json +0 -55
  203. package/plugins/hono/README.md +0 -28
  204. package/plugins/hono/index.d.ts +0 -12
  205. package/plugins/hono/index.js +0 -36
  206. package/plugins/hono/package.json +0 -35
  207. package/plugins/nestjs/README.md +0 -35
  208. package/plugins/nestjs/index.d.ts +0 -25
  209. package/plugins/nestjs/index.js +0 -77
  210. package/plugins/nestjs/package.json +0 -37
  211. package/plugins/nextjs-api/README.md +0 -57
  212. package/plugins/nextjs-api/examples/ConverterComponent.jsx +0 -386
  213. package/plugins/nextjs-api/examples/api-convert.js +0 -69
  214. package/plugins/nextjs-api/index.js +0 -387
  215. package/plugins/nextjs-api/package.json +0 -63
  216. package/plugins/nextjs-api/route.js +0 -371
  217. package/plugins/nuxt/README.md +0 -24
  218. package/plugins/nuxt/index.js +0 -21
  219. package/plugins/nuxt/package.json +0 -35
  220. package/plugins/nuxt/runtime/composables/useJtcsv.js +0 -6
  221. package/plugins/nuxt/runtime/plugin.js +0 -6
  222. package/plugins/remix/README.md +0 -26
  223. package/plugins/remix/index.d.ts +0 -16
  224. package/plugins/remix/index.js +0 -62
  225. package/plugins/remix/package.json +0 -35
  226. package/plugins/sveltekit/README.md +0 -28
  227. package/plugins/sveltekit/index.d.ts +0 -17
  228. package/plugins/sveltekit/index.js +0 -54
  229. package/plugins/sveltekit/package.json +0 -33
  230. package/plugins/trpc/README.md +0 -25
  231. package/plugins/trpc/index.d.ts +0 -7
  232. package/plugins/trpc/index.js +0 -32
  233. package/plugins/trpc/package.json +0 -34
  234. package/src/browser/browser-functions.js +0 -219
  235. package/src/browser/csv-to-json-browser.js +0 -700
  236. package/src/browser/index.js +0 -113
  237. package/src/browser/json-to-csv-browser.js +0 -309
  238. package/src/browser/streams.js +0 -393
  239. package/src/core/delimiter-cache.js +0 -186
  240. package/src/core/plugin-system.js +0 -476
  241. package/src/core/transform-hooks.js +0 -350
  242. package/src/errors.js +0 -26
  243. package/src/utils/transform-loader.js +0 -205
  244. package/stream-csv-to-json.js +0 -542
  245. package/stream-json-to-csv.js +0 -464
  246. /package/examples/{web-workers-advanced.js → web-workers-advanced.ts} +0 -0
@@ -0,0 +1,671 @@
1
+ "use strict";
2
+ Object.defineProperty(exports, "__esModule", { value: true });
3
/**
 * Heuristic CSV row splitter that inspects the input and then runs one of
 * two scanners:
 *
 *  - a "simple" scanner (no quote handling) for input without `"` characters;
 *  - a "quote-aware" scanner for everything else (the `QUOTE_AWARE` and
 *    `STANDARD` engine names both map to it; they only differ in which
 *    statistics counter is incremented).
 *
 * Every row is returned as an array of raw string fields. Rows that contain
 * nothing but spaces, tabs and line breaks are skipped. Compiled parser
 * closures are cached per engine configuration.
 */
class FastPathEngine {
    constructor() {
        /** Cache of `csv => rows[]` closures, keyed by `_getCacheKey()`. */
        this.compilers = new Map();
        /** Cache of `(csv, onRow) => void` closures, keyed by `_getCacheKey()`. */
        this.rowCompilers = new Map();
        this.stats = this._createEmptyStats();
    }

    /**
     * Builds a zeroed statistics record (used by the constructor and `reset()`).
     * @returns {{simpleParserCount: number, quoteAwareParserCount: number,
     *   standardParserCount: number, cacheHits: number, cacheMisses: number}}
     */
    _createEmptyStats() {
        return {
            simpleParserCount: 0,
            quoteAwareParserCount: 0,
            standardParserCount: 0,
            cacheHits: 0,
            cacheMisses: 0
        };
    }

    /**
     * Derives the cache key for a structure descriptor.
     *
     * Only the properties that the parser/emitter factories actually read are
     * part of the key. Descriptive statistics such as `avgFieldsPerLine` or
     * `maxFields` are deliberately excluded: they do not change the compiled
     * closure, and including them would create one cache entry per distinct
     * input shape.
     *
     * @param {object} structure - Descriptor from `analyzeStructure()` /
     *   `_getStructureForParse()`.
     * @returns {string}
     */
    _getCacheKey(structure) {
        return JSON.stringify([
            structure.recommendedEngine,
            structure.delimiter,
            Boolean(structure.hasEscapedQuotes),
            Boolean(structure.hasBackslashes)
        ]);
    }

    /** @returns {boolean} Whether `csv` contains at least one `"`. */
    _hasQuotes(csv) {
        return csv.includes('"');
    }

    /** @returns {boolean} Whether `csv` contains at least one `""` pair. */
    _hasEscapedQuotes(csv) {
        return csv.includes('""');
    }

    /** @returns {boolean} Whether `csv` contains at least one backslash. */
    _hasBackslashes(csv) {
        return csv.includes('\\');
    }

    /**
     * Analyses the first 1000 characters of `csv` and then corrects the
     * result with cheap whole-input checks, so that quotes or backslashes
     * appearing only after the sample are not missed.
     *
     * @param {string} csv - Complete CSV text.
     * @param {object|null} [options] - May carry `delimiter` and `forceEngine`.
     * @returns {object} The `analyzeStructure()` result plus `hasBackslashes`,
     *   with `hasQuotes`, `hasEscapedQuotes`, `hasNewlinesInFields` and
     *   `recommendedEngine` possibly overridden.
     */
    _getStructureForParse(csv, options) {
        // A default parameter would not cover an explicit `null`.
        const settings = options || {};
        const sample = csv.substring(0, Math.min(1000, csv.length));
        const structure = this.analyzeStructure(sample, settings);
        const hasBackslashes = this._hasBackslashes(csv);
        const hasQuotes = structure.hasQuotes ? true : this._hasQuotes(csv);
        let hasEscapedQuotes = true;
        if (!structure.hasEscapedQuotes) {
            hasEscapedQuotes = hasQuotes ? this._hasEscapedQuotes(csv) : false;
        }
        let hasNewlinesInFields = structure.hasNewlinesInFields;
        let recommendedEngine = structure.recommendedEngine;
        if (recommendedEngine === 'SIMPLE' && hasQuotes) {
            // The sample looked quote-free but the full input is not.
            hasNewlinesInFields = true;
            recommendedEngine = 'QUOTE_AWARE';
        }
        if (settings.forceEngine) {
            recommendedEngine = settings.forceEngine;
        }
        return {
            ...structure,
            hasQuotes,
            hasEscapedQuotes,
            hasBackslashes,
            hasNewlinesInFields,
            recommendedEngine
        };
    }

    /**
     * Inspects up to the first ten `\n`-separated lines of `sample`.
     *
     * `hasNewlinesInFields` is a guess: it is set when any inspected line has
     * an odd number of `"` characters. Field counts come from a plain
     * `split(delimiter)` and therefore ignore quoting; an empty trailing line
     * is counted as a line with one field.
     *
     * @param {string} sample - Leading part of the CSV text.
     * @param {object|null} [options] - `options.delimiter` skips auto-detection.
     * @returns {{delimiter: string, hasQuotes: boolean, hasEscapedQuotes: boolean,
     *   hasNewlinesInFields: boolean, fieldConsistency: boolean,
     *   avgFieldsPerLine: number, maxFields: number, recommendedEngine: string}}
     */
    analyzeStructure(sample, options = {}) {
        const delimiter = (options && options.delimiter) || this._detectDelimiter(sample);
        const lines = sample.split('\n').slice(0, 10);
        let hasQuotes = false;
        let hasNewlinesInFields = false;
        let hasEscapedQuotes = false;
        let maxFields = 0;
        let totalFields = 0;
        for (const line of lines) {
            if (line.includes('"')) {
                hasQuotes = true;
                if (line.includes('""')) {
                    hasEscapedQuotes = true;
                }
            }
            const quoteCount = (line.match(/"/g) || []).length;
            if (quoteCount % 2 !== 0) {
                hasNewlinesInFields = true;
            }
            const fieldCount = line.split(delimiter).length;
            totalFields += fieldCount;
            maxFields = Math.max(maxFields, fieldCount);
        }
        // `lines` always holds at least one entry, so this never divides by zero.
        const avgFieldsPerLine = totalFields / lines.length;
        const fieldConsistency = maxFields === avgFieldsPerLine;
        return {
            delimiter,
            hasQuotes,
            hasEscapedQuotes,
            hasNewlinesInFields,
            fieldConsistency,
            avgFieldsPerLine,
            maxFields,
            recommendedEngine: this._selectEngine(hasQuotes, hasNewlinesInFields, fieldConsistency)
        };
    }

    /**
     * Picks one of `,` `;` tab `|` by looking at the first line only.
     * Score = field count / (variance of field lengths + 1); the highest
     * score wins and `,` is the fallback when no candidate occurs.
     *
     * @param {string} sample
     * @returns {string}
     */
    _detectDelimiter(sample) {
        const candidates = [',', ';', '\t', '|'];
        const firstLine = sample.split('\n')[0];
        let bestDelimiter = ',';
        let bestScore = 0;
        for (const candidate of candidates) {
            const fields = firstLine.split(candidate);
            const count = fields.length;
            if (count === 1 && !firstLine.includes(candidate)) {
                continue;
            }
            const meanLength = fields.reduce((sum, field) => sum + field.length, 0) / count;
            const variance = fields.reduce((sum, field) => sum + Math.pow(field.length - meanLength, 2), 0) / count;
            const score = count / (variance + 1);
            if (score > bestScore) {
                bestScore = score;
                bestDelimiter = candidate;
            }
        }
        return bestDelimiter;
    }

    /**
     * Maps the analysis flags to an engine name.
     * @param {boolean} hasQuotes
     * @param {boolean} hasNewlinesInFields
     * @param {boolean} _fieldConsistency - Accepted but not used.
     * @returns {'SIMPLE'|'QUOTE_AWARE'|'STANDARD'}
     */
    _selectEngine(hasQuotes, hasNewlinesInFields, _fieldConsistency) {
        if (hasNewlinesInFields) {
            return 'STANDARD';
        }
        return hasQuotes ? 'QUOTE_AWARE' : 'SIMPLE';
    }

    /**
     * @param {object} structure - Reads `delimiter` and `hasBackslashes`.
     * @returns {function(string): string[][]} Parser returning all rows.
     */
    _createSimpleParser(structure) {
        const emitRows = this._createSimpleRowEmitter(structure);
        return (csv) => {
            const rows = [];
            emitRows(csv, (row) => rows.push(row));
            return rows;
        };
    }

    /**
     * Splits quote-free CSV and calls `onRow` once per non-blank row.
     * Fields are substrings of `csv`; no unescaping is performed. Written as a
     * plain loop rather than on top of the generator twin (presumably for
     * speed; this is the path `parse()` takes for simple input).
     *
     * @param {string} csv
     * @param {string} delimiter - Single character.
     * @param {function(string[]): void} onRow
     */
    _emitSimpleRows(csv, delimiter, onRow) {
        const length = csv.length;
        let currentRow = [];
        let rowHasData = false;
        let fieldStart = 0;
        for (let i = 0; i <= length; i++) {
            // A virtual trailing '\n' flushes the last row of unterminated input.
            const char = i < length ? csv[i] : '\n';
            const isLineBreak = char === '\n' || char === '\r';
            if (!isLineBreak && char !== ' ' && char !== '\t') {
                rowHasData = true;
            }
            if (!isLineBreak && char !== delimiter) {
                continue;
            }
            currentRow.push(csv.slice(fieldStart, i));
            if (isLineBreak) {
                if (rowHasData) {
                    onRow(currentRow);
                }
                currentRow = [];
                rowHasData = false;
                if (char === '\r' && csv[i + 1] === '\n') {
                    i++; // treat CRLF as one terminator
                }
            }
            fieldStart = i + 1;
        }
    }

    /**
     * Callback flavour of `_simpleEscapedRowsGenerator()`.
     *
     * @param {string} csv
     * @param {string} delimiter - Single character.
     * @param {function(string[]): void} onRow
     */
    _emitSimpleRowsEscaped(csv, delimiter, onRow) {
        for (const row of this._simpleEscapedRowsGenerator(csv, delimiter)) {
            onRow(row);
        }
    }

    /**
     * Generator flavour of `_emitSimpleRows()`: same splitting rules, rows are
     * yielded lazily.
     *
     * @param {string} csv
     * @param {string} delimiter - Single character.
     * @yields {string[]}
     */
    *_simpleRowsGenerator(csv, delimiter) {
        const length = csv.length;
        let currentRow = [];
        let rowHasData = false;
        let fieldStart = 0;
        for (let i = 0; i <= length; i++) {
            const char = i < length ? csv[i] : '\n';
            const isLineBreak = char === '\n' || char === '\r';
            if (!isLineBreak && char !== ' ' && char !== '\t') {
                rowHasData = true;
            }
            if (!isLineBreak && char !== delimiter) {
                continue;
            }
            currentRow.push(csv.slice(fieldStart, i));
            if (isLineBreak) {
                if (rowHasData) {
                    yield currentRow;
                }
                currentRow = [];
                rowHasData = false;
                if (char === '\r' && csv[i + 1] === '\n') {
                    i++;
                }
            }
            fieldStart = i + 1;
        }
    }

    /**
     * Splits quote-free CSV in which a backslash escapes the next character.
     *
     * A backslash followed by any character other than a line break emits
     * that character literally and drops the backslash (so `\,` is a literal
     * comma and `\\` a single backslash). A backslash that is the last
     * character of the input, or that directly precedes `\n` / `\r`, is kept
     * as a literal backslash.
     *
     * @param {string} csv
     * @param {string} delimiter - Single character.
     * @yields {string[]}
     */
    *_simpleEscapedRowsGenerator(csv, delimiter) {
        const length = csv.length;
        let currentRow = [];
        let currentField = '';
        let rowHasData = false;
        let i = 0;
        while (i <= length) {
            const char = i < length ? csv[i] : '\n';
            const isLineBreak = char === '\n' || char === '\r';
            if (!isLineBreak && char !== ' ' && char !== '\t') {
                rowHasData = true;
            }
            if (char === '\\') {
                const nextChar = i + 1 < length ? csv[i + 1] : '';
                if (nextChar === '' || nextChar === '\n' || nextChar === '\r') {
                    currentField += '\\';
                    i++;
                }
                else {
                    currentField += nextChar;
                    i += 2;
                }
                continue;
            }
            if (isLineBreak || char === delimiter) {
                currentRow.push(currentField);
                currentField = '';
                if (isLineBreak) {
                    if (rowHasData) {
                        yield currentRow;
                    }
                    currentRow = [];
                    rowHasData = false;
                    if (char === '\r' && csv[i + 1] === '\n') {
                        i++;
                    }
                }
                i++;
                continue;
            }
            currentField += char;
            i++;
        }
    }

    /**
     * @param {object} structure - Reads `delimiter` and `hasBackslashes`.
     * @returns {function(string, function(string[]): void): void}
     */
    _createSimpleRowEmitter(structure) {
        const { delimiter, hasBackslashes } = structure;
        return (csv, onRow) => {
            if (hasBackslashes) {
                this._emitSimpleRowsEscaped(csv, delimiter, onRow);
            }
            else {
                this._emitSimpleRows(csv, delimiter, onRow);
            }
        };
    }

    /**
     * @param {object} structure - Reads `delimiter`, `hasEscapedQuotes` and
     *   `hasBackslashes`.
     * @returns {function(string): string[][]} Parser returning all rows.
     */
    _createQuoteAwareParser(structure) {
        const { delimiter, hasEscapedQuotes, hasBackslashes } = structure;
        return (csv) => Array.from(this._scanQuotedRows(csv, delimiter, hasEscapedQuotes, Boolean(hasBackslashes)));
    }

    /**
     * @param {object} structure - Reads `delimiter`, `hasEscapedQuotes` and
     *   `hasBackslashes`.
     * @returns {function(string, function(string[]): void): void}
     */
    _createQuoteAwareRowEmitter(structure) {
        const { delimiter, hasEscapedQuotes, hasBackslashes } = structure;
        return (csv, onRow) => {
            for (const row of this._scanQuotedRows(csv, delimiter, hasEscapedQuotes, Boolean(hasBackslashes))) {
                onRow(row);
            }
        };
    }

    /**
     * Quote-aware scan that treats backslashes as ordinary characters.
     *
     * @param {string} csv
     * @param {string} delimiter - Single character.
     * @param {boolean} hasEscapedQuotes - Enables `""` handling inside quotes.
     * @yields {string[]}
     * @throws {Error} `code === 'FAST_PATH_UNCLOSED_QUOTES'` when the input
     *   ends inside a quoted field.
     */
    *_quoteAwareRowsGenerator(csv, delimiter, hasEscapedQuotes) {
        yield* this._scanQuotedRows(csv, delimiter, hasEscapedQuotes, false);
    }

    /**
     * Quote-aware scan in which a backslash escapes the next character.
     *
     * @param {string} csv
     * @param {string} delimiter - Single character.
     * @param {boolean} hasEscapedQuotes - Enables `""` handling inside quotes.
     * @yields {string[]}
     * @throws {Error} `code === 'FAST_PATH_UNCLOSED_QUOTES'` when the input
     *   ends inside a quoted field.
     */
    *_quoteAwareEscapedRowsGenerator(csv, delimiter, hasEscapedQuotes) {
        yield* this._scanQuotedRows(csv, delimiter, hasEscapedQuotes, true);
    }

    /**
     * Reports whether, after skipping spaces and tabs starting at `from`, the
     * input ends or continues with the delimiter or a line break.
     *
     * @param {string} csv
     * @param {number} from - Index to start looking at.
     * @param {string} delimiter
     * @returns {boolean}
     */
    _isFieldBoundaryAfterBlanks(csv, from, delimiter) {
        let j = from;
        while (j < csv.length && (csv[j] === ' ' || csv[j] === '\t')) {
            j++;
        }
        if (j >= csv.length) {
            return true;
        }
        const char = csv[j];
        return char === delimiter || char === '\n' || char === '\r';
    }

    /**
     * Shared implementation of both quote-aware generators.
     *
     * Quote rules (lenient on purpose; this is not a strict RFC 4180 reader):
     *  - a `"` outside quotes opens a quoted section, even mid-field;
     *  - inside quotes, `""` (when `hasEscapedQuotes`) appends one `"`; if
     *    what follows, after optional spaces/tabs, is the delimiter, a line
     *    break or end of input, the quoted section is closed as well;
     *  - inside quotes, a single `"` closes the section when it is followed
     *    by the delimiter, or by optional spaces/tabs and then the delimiter,
     *    a line break or end of input; otherwise it is kept as a literal `"`.
     *
     * Backslash rules (only when `handleBackslashes`): a backslash emits the
     * following character literally and is dropped itself, except at end of
     * input or, outside quotes, directly before a line break, where the
     * backslash is kept.
     *
     * @param {string} csv
     * @param {string} delimiter - Single character.
     * @param {boolean} hasEscapedQuotes
     * @param {boolean} handleBackslashes
     * @yields {string[]}
     * @throws {Error} With `code = 'FAST_PATH_UNCLOSED_QUOTES'` and
     *   `lineNumber` set to one plus the number of row terminators consumed
     *   outside quotes.
     */
    *_scanQuotedRows(csv, delimiter, hasEscapedQuotes, handleBackslashes) {
        const length = csv.length;
        let currentRow = [];
        let currentField = '';
        let rowHasData = false;
        let insideQuotes = false;
        let lineNumber = 1;
        let i = 0;
        while (i < length) {
            const char = csv[i];
            const nextChar = csv[i + 1];
            if (char !== '\r' && char !== '\n' && char !== ' ' && char !== '\t') {
                rowHasData = true;
            }
            if (handleBackslashes && char === '\\') {
                const atEnd = i + 1 >= length;
                const beforeBareLineBreak = !insideQuotes && (nextChar === '\n' || nextChar === '\r');
                if (atEnd || beforeBareLineBreak) {
                    currentField += '\\';
                    i++;
                }
                else {
                    currentField += nextChar;
                    i += 2;
                }
                continue;
            }
            if (char === '"') {
                if (!insideQuotes) {
                    insideQuotes = true;
                    i++;
                    continue;
                }
                if (hasEscapedQuotes && nextChar === '"') {
                    currentField += '"';
                    i += 2;
                    if (this._isFieldBoundaryAfterBlanks(csv, i, delimiter)) {
                        insideQuotes = false;
                    }
                    continue;
                }
                // The explicit delimiter test matters when the delimiter is
                // itself a blank (tab): the helper would skip over it.
                if (nextChar === delimiter || this._isFieldBoundaryAfterBlanks(csv, i + 1, delimiter)) {
                    insideQuotes = false;
                }
                else {
                    currentField += '"';
                }
                i++;
                continue;
            }
            if (!insideQuotes && (char === delimiter || char === '\n' || char === '\r')) {
                currentRow.push(currentField);
                currentField = '';
                if (char === '\n' || char === '\r') {
                    if (rowHasData) {
                        yield currentRow;
                    }
                    currentRow = [];
                    rowHasData = false;
                    lineNumber++;
                    if (char === '\r' && nextChar === '\n') {
                        i++;
                    }
                }
                i++;
                continue;
            }
            currentField += char;
            i++;
        }
        if (insideQuotes) {
            const error = new Error('Unclosed quotes in CSV');
            error.code = 'FAST_PATH_UNCLOSED_QUOTES';
            error.lineNumber = lineNumber;
            throw error;
        }
        // Flush an unterminated final row. Keyed on rowHasData alone so that a
        // last record consisting of a single empty quoted field ("") is kept,
        // exactly as it is when the input ends with a line break.
        if (rowHasData) {
            currentRow.push(currentField);
            yield currentRow;
        }
    }

    /**
     * Returns a cached `csv => rows[]` parser for `structure`, building it on
     * first use and updating the hit/miss and per-engine counters.
     *
     * @param {object} structure - Reads `recommendedEngine`, `delimiter`,
     *   `hasEscapedQuotes` and `hasBackslashes`.
     * @returns {function(string): string[][]}
     */
    compileParser(structure) {
        const cacheKey = this._getCacheKey(structure);
        const cached = this.compilers.get(cacheKey);
        if (cached) {
            this.stats.cacheHits++;
            return cached;
        }
        this.stats.cacheMisses++;
        let parser;
        switch (structure.recommendedEngine) {
            case 'SIMPLE':
                parser = this._createSimpleParser(structure);
                this.stats.simpleParserCount++;
                break;
            case 'QUOTE_AWARE':
                parser = this._createQuoteAwareParser(structure);
                this.stats.quoteAwareParserCount++;
                break;
            default:
                // 'STANDARD' and unknown engine names share the quote-aware parser.
                parser = this._createQuoteAwareParser(structure);
                this.stats.standardParserCount++;
        }
        this.compilers.set(cacheKey, parser);
        return parser;
    }

    /**
     * Returns a cached `(csv, onRow) => void` emitter for `structure`.
     * Does not touch `stats`.
     *
     * @param {object} structure - Same properties as for `compileParser()`.
     * @returns {function(string, function(string[]): void): void}
     */
    compileRowEmitter(structure) {
        const cacheKey = this._getCacheKey(structure);
        const cached = this.rowCompilers.get(cacheKey);
        if (cached) {
            return cached;
        }
        const emitter = structure.recommendedEngine === 'SIMPLE'
            ? this._createSimpleRowEmitter(structure)
            : this._createQuoteAwareRowEmitter(structure);
        this.rowCompilers.set(cacheKey, emitter);
        return emitter;
    }

    /**
     * Lazily yields the rows of `csv`, choosing the scanner from the analysed
     * structure. Bypasses the parser caches.
     *
     * @param {string} csv
     * @param {object|null} [options] - `delimiter`, `forceEngine`.
     * @yields {string[]}
     * @throws {Error} `FAST_PATH_UNCLOSED_QUOTES` from the quote-aware scanner.
     */
    *iterateRows(csv, options = {}) {
        const structure = this._getStructureForParse(csv, options);
        const { delimiter, hasBackslashes, hasEscapedQuotes } = structure;
        if (structure.recommendedEngine === 'SIMPLE') {
            yield* (hasBackslashes
                ? this._simpleEscapedRowsGenerator(csv, delimiter)
                : this._simpleRowsGenerator(csv, delimiter));
            return;
        }
        // 'QUOTE_AWARE', 'STANDARD' and any other engine name.
        yield* (hasBackslashes
            ? this._quoteAwareEscapedRowsGenerator(csv, delimiter, hasEscapedQuotes)
            : this._quoteAwareRowsGenerator(csv, delimiter, hasEscapedQuotes));
    }

    /**
     * Parses `csv` eagerly through a cached parser.
     *
     * @param {string} csv
     * @param {object|null} [options] - `delimiter`, `forceEngine`.
     * @returns {string[][]}
     * @throws {Error} `FAST_PATH_UNCLOSED_QUOTES` from the quote-aware scanner.
     */
    parse(csv, options = {}) {
        const structure = this._getStructureForParse(csv, options);
        return this.compileParser(structure)(csv);
    }

    /**
     * Calls `onRow` for every row produced by `iterateRows()`.
     *
     * @param {string} csv
     * @param {object|null} [options]
     * @param {function(string[]): void} onRow
     */
    parseRows(csv, options = {}, onRow) {
        for (const row of this.iterateRows(csv, options)) {
            onRow(row);
        }
    }

    /**
     * @returns {object} The counters plus `totalParsers` (size of the parser
     *   cache) and `hitRate` (0 when no lookup has happened yet).
     */
    getStats() {
        const { cacheHits, cacheMisses } = this.stats;
        const lookups = cacheHits + cacheMisses;
        return {
            ...this.stats,
            totalParsers: this.compilers.size,
            hitRate: lookups === 0 ? 0 : cacheHits / lookups
        };
    }

    /** Empties both caches and zeroes all counters. */
    reset() {
        this.compilers.clear();
        this.rowCompilers.clear();
        this.stats = this._createEmptyStats();
    }
}
670
+ exports.default = FastPathEngine;
671
+ //# sourceMappingURL=fast-path-engine.js.map