@loaders.gl/csv 3.1.0-alpha.4 → 3.1.0-alpha.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/dist.min.js +1 -1
- package/dist/es5/bundle.js +1 -1
- package/dist/es5/bundle.js.map +1 -1
- package/dist/es5/csv-loader.js +85 -135
- package/dist/es5/csv-loader.js.map +1 -1
- package/dist/es5/index.js +1 -1
- package/dist/es5/lib/async-iterator-streamer.js +15 -108
- package/dist/es5/lib/async-iterator-streamer.js.map +1 -1
- package/dist/es5/papaparse/async-iterator-streamer.js +15 -108
- package/dist/es5/papaparse/async-iterator-streamer.js.map +1 -1
- package/dist/esm/csv-loader.js +3 -3
- package/dist/esm/csv-loader.js.map +1 -1
- package/package.json +4 -4
package/dist/dist.min.js
CHANGED
|
@@ -5,5 +5,5 @@ v5.0.0-beta.0
|
|
|
5
5
|
https://github.com/mholt/PapaParse
|
|
6
6
|
License: MIT
|
|
7
7
|
*/
|
|
8
|
-
var r="undefined"!=typeof self?self:"undefined"!=typeof window?window:void 0!==r?r:{},i={};function s(e){this._handle=null,this._finished=!1,this._completed=!1,this._input=null,this._baseIndex=0,this._partialLine="",this._rowCount=0,this._start=0,this._nextChunk=null,this.isFirstChunk=!0,this._completeResults={data:[],errors:[],meta:{}},function(e){var t=l(e);t.chunkSize=parseInt(t.chunkSize),e.step||e.chunk||(t.chunkSize=null);this._handle=new a(t),this._handle.streamer=this,this._config=t}.call(this,e),this.parseChunk=function(e,t){if(this.isFirstChunk&&u(this._config.beforeFirstChunk)){var r=this._config.beforeFirstChunk(e);void 0!==r&&(e=r)}this.isFirstChunk=!1;var i=this._partialLine+e;this._partialLine="";var s=this._handle.parse(i,this._baseIndex,!this._finished);if(!this._handle.paused()&&!this._handle.aborted()){var n=s.meta.cursor;this._finished||(this._partialLine=i.substring(n-this._baseIndex),this._baseIndex=n),s&&s.data&&(this._rowCount+=s.data.length);var a=this._finished||this._config.preview&&this._rowCount>=this._config.preview;if(u(this._config.chunk)&&!t){if(this._config.chunk(s,this._handle),this._handle.paused()||this._handle.aborted())return;s=void 0,this._completeResults=void 0}return this._config.step||this._config.chunk||(this._completeResults.data=this._completeResults.data.concat(s.data),this._completeResults.errors=this._completeResults.errors.concat(s.errors),this._completeResults.meta=s.meta),this._completed||!a||!u(this._config.complete)||s&&s.meta.aborted||(this._config.complete(this._completeResults,this._input),this._completed=!0),a||s&&s.meta.paused||this._nextChunk(),s}},this._sendError=function(e){u(this._config.error)&&this._config.error(e)}}function n(e){var t;e=e||{},s.call(this,e),this.stream=function(e){return t=e,this._nextChunk()},this._nextChunk=function(){if(!this._finished){var e=this._config.chunkSize,r=e?t.substr(0,e):t;return t=e?t.substr(e):"",this._finished=!t,this.parseChunk(r)}}}function a(e){var t,r,s,n=/^\s*-?(\d*\.?\d+|\d+\.?\d*)(e[-+]?\d+)?\s*$/i,a=/(\d{4}-[01]\d-[0-3]\dT[0-2]\d:[0-5]\d:[0-5]\d\.\d+([+-][0-2]\d:[0-5]\d|Z))|(\d{4}-[01]\d-[0-3]\dT[0-2]\d:[0-5]\d:[0-5]\d([+-][0-2]\d:[0-5]\d|Z))|(\d{4}-[01]\d-[0-3]\dT[0-2]\d:[0-5]\d([+-][0-2]\d:[0-5]\d|Z))/,c=this,d=0,f=0,p=!1,g=!1,m=[],y={data:[],errors:[],meta:{}};if(u(e.step)){var b=e.step;e.step=function(t){if(y=t,_())v();else{if(v(),!y.data||0===y.data.length)return;d+=t.data.length,e.preview&&d>e.preview?r.abort():b(y,c)}}}function w(t){return"greedy"===e.skipEmptyLines?""===t.join("").trim():1===t.length&&0===t[0].length}function v(){if(y&&s&&(C("Delimiter","UndetectableDelimiter","Unable to auto-detect delimiting character; defaulted to '"+i.DefaultDelimiter+"'"),s=!1),e.skipEmptyLines)for(var t=0;t<y.data.length;t++)w(y.data[t])&&y.data.splice(t--,1);return _()&&function(){if(!y)return;function t(t){u(e.transformHeader)&&(t=e.transformHeader(t)),m.push(t)}if(Array.isArray(y.data[0])){for(var r=0;_()&&r<y.data.length;r++)y.data[r].forEach(t);y.data.splice(0,1)}else y.data.forEach(t)}(),function(){if(!y||!y.data||!e.header&&!e.dynamicTyping&&!e.transform)return y;function t(t,r){var i,s=e.header?{}:[];for(i=0;i<t.length;i++){var n=i,a=t[i];e.header&&(n=i>=m.length?"__parsed_extra":m[i]),e.transform&&(a=e.transform(a,n)),a=A(n,a),"__parsed_extra"===n?(s[n]=s[n]||[],s[n].push(a)):s[n]=a}return e.header&&(i>m.length?C("FieldMismatch","TooManyFields","Too many fields: expected "+m.length+" fields but parsed "+i,f+r):i<m.length&&C("FieldMismatch","TooFewFields","Too few fields: expected "+m.length+" fields but parsed "+i,f+r)),s}var r=1;!y.data[0]||Array.isArray(y.data[0])?(y.data=y.data.map(t),r=y.data.length):y.data=t(y.data,0);e.header&&y.meta&&(y.meta.fields=m);return f+=r,y}()}function _(){return e.header&&0===m.length}function A(t,r){return function(t){return e.dynamicTypingFunction&&void 0===e.dynamicTyping[t]&&(e.dynamicTyping[t]=e.dynamicTypingFunction(t)),!0===(e.dynamicTyping[t]||e.dynamicTyping)}(t)?"true"===r||"TRUE"===r||"false"!==r&&"FALSE"!==r&&(n.test(r)?parseFloat(r):a.test(r)?new Date(r):""===r?null:r):r}function C(e,t,r,i){y.errors.push({type:e,code:t,message:r,row:i})}this.parse=function(n,a,c){var d=e.quoteChar||'"';if(e.newline||(e.newline=function(e,t){e=e.substr(0,1048576);var r=new RegExp(o(t)+"([^]*?)"+o(t),"gm"),i=(e=e.replace(r,"")).split("\r"),s=e.split("\n"),n=s.length>1&&s[0].length<i[0].length;if(1===i.length||n)return"\n";for(var a=0,h=0;h<i.length;h++)"\n"===i[h][0]&&a++;return a>=i.length/2?"\r\n":"\r"}(n,d)),s=!1,e.delimiter)u(e.delimiter)&&(e.delimiter=e.delimiter(n),y.meta.delimiter=e.delimiter);else{var f=function(t,r,s,n,a){var o,l,u;a=a||[",","\t","|",";",i.RECORD_SEP,i.UNIT_SEP];for(var c=0;c<a.length;c++){var d=a[c],f=0,p=0,g=0;u=void 0;for(var m=new h({comments:n,delimiter:d,newline:r,preview:10}).parse(t),y=0;y<m.data.length;y++)if(s&&w(m.data[y]))g++;else{var b=m.data[y].length;p+=b,void 0!==u?b>1&&(f+=Math.abs(b-u),u=b):u=0}m.data.length>0&&(p/=m.data.length-g),(void 0===l||f>l)&&p>1.99&&(l=f,o=d)}return e.delimiter=o,{successful:!!o,bestDelimiter:o}}(n,e.newline,e.skipEmptyLines,e.comments,e.delimitersToGuess);f.successful?e.delimiter=f.bestDelimiter:(s=!0,e.delimiter=i.DefaultDelimiter),y.meta.delimiter=e.delimiter}var g=l(e);return e.preview&&e.header&&g.preview++,t=n,r=new h(g),y=r.parse(t,a,c),v(),p?{meta:{paused:!0}}:y||{meta:{paused:!1}}},this.paused=function(){return p},this.pause=function(){p=!0,r.abort(),t=t.substr(r.getCharIndex())},this.resume=function(){p=!1,c.streamer.parseChunk(t,!0)},this.aborted=function(){return g},this.abort=function(){g=!0,r.abort(),y.meta.aborted=!0,u(e.complete)&&e.complete(y),t=""}}function o(e){return e.replace(/[.*+?^${}()|[\]\\]/g,"\\$&")}function h(e){var t,r=(e=e||{}).delimiter,s=e.newline,n=e.comments,a=e.step,h=e.preview,l=e.fastMode,c=t=void 0===e.quoteChar?'"':e.quoteChar;if(void 0!==e.escapeChar&&(c=e.escapeChar),("string"!=typeof r||i.BAD_DELIMITERS.indexOf(r)>-1)&&(r=","),n===r)throw new Error("Comment character same as delimiter");!0===n?n="#":("string"!=typeof n||i.BAD_DELIMITERS.indexOf(n)>-1)&&(n=!1),"\n"!==s&&"\r"!==s&&"\r\n"!==s&&(s="\n");var d=0,f=!1;this.parse=function(e,i,p){if("string"!=typeof e)throw new Error("Input must be a string");var g=e.length,m=r.length,y=s.length,b=n.length,w=u(a);d=0;var v=[],_=[],A=[],C=0;if(!e)return F();if(l||!1!==l&&-1===e.indexOf(t)){for(var x=e.split(s),R=0;R<x.length;R++){if(A=x[R],d+=A.length,R!==x.length-1)d+=s.length;else if(p)return F();if(!n||A.substr(0,b)!==n){if(w){if(v=[],B(A.split(r)),I(),f)return F()}else B(A.split(r));if(h&&R>=h)return v=v.slice(0,h),F(!0)}}return F()}for(var E,k=e.indexOf(r,d),O=e.indexOf(s,d),T=new RegExp(o(c)+o(t),"g");;)if(e[d]!==t)if(n&&0===A.length&&e.substr(d,b)===n){if(-1===O)return F();d=O+y,O=e.indexOf(s,d),k=e.indexOf(r,d)}else if(-1!==k&&(k<O||-1===O))A.push(e.substring(d,k)),d=k+m,k=e.indexOf(r,d);else{if(-1===O)break;if(A.push(e.substring(d,O)),P(O+y),w&&(I(),f))return F();if(h&&v.length>=h)return F(!0)}else{for(E=d,d++;;){if(-1===(E=e.indexOf(t,E+1)))return p||_.push({type:"Quotes",code:"MissingQuotes",message:"Quoted field unterminated",row:v.length,index:d}),M();if(E===g-1)return M(e.substring(d,E).replace(T,t));if(t!==c||e[E+1]!==c){if(t===c||0===E||e[E-1]!==c){var S=D(-1===O?k:Math.min(k,O));if(e[E+1+S]===r){if(A.push(e.substring(d,E).replace(T,t)),d=E+1+S+m,k=e.indexOf(r,d),O=e.indexOf(s,d),w&&(I(),f))return F();if(h&&v.length>=h)return F(!0);break}var j=D(O);if(e.substr(E+1+j,y)===s){if(A.push(e.substring(d,E).replace(T,t)),P(E+1+j+y),k=e.indexOf(r,d),w&&(I(),f))return F();if(h&&v.length>=h)return F(!0);break}_.push({type:"Quotes",code:"InvalidQuotes",message:"Trailing quote on quoted field is malformed",row:v.length,index:d}),E++}}else E++}if(w&&(I(),f))return F();if(h&&v.length>=h)return F(!0)}return M();function B(e){v.push(e),C=d}function D(t){var r=0;if(-1!==t){var i=e.substring(E+1,t);i&&""===i.trim()&&(r=i.length)}return r}function M(t){return p||(void 0===t&&(t=e.substr(d)),A.push(t),d=g,B(A),w&&I()),F()}function P(t){d=t,B(A),A=[],O=e.indexOf(s,d)}function F(e,t){return{data:t||!1?v[0]:v,errors:_,meta:{delimiter:r,linebreak:s,aborted:f,truncated:!!e,cursor:C+(i||0)}}}function I(){a(F(void 0,!0)),v=[],_=[]}},this.abort=function(){f=!0},this.getCharIndex=function(){return d}}function l(e){if("object"!=typeof e||null===e)return e;var t=Array.isArray(e)?[]:{};for(var r in e)t[r]=l(e[r]);return t}function u(e){return"function"==typeof e}e.exports=i,i.parse=function(e,t,r){var s=(t=t||{}).dynamicTyping||!1;u(s)&&(t.dynamicTypingFunction=s,s={});if(t.dynamicTyping=s,t.transform=!!u(t.transform)&&t.transform,t.worker&&i.WORKERS_SUPPORTED){var a=newWorker();return a.userStep=t.step,a.userChunk=t.chunk,a.userComplete=t.complete,a.userError=t.error,t.step=u(t.step),t.chunk=u(t.chunk),t.complete=u(t.complete),t.error=u(t.error),delete t.worker,void a.postMessage({input:e,config:t,workerId:a.id})}var o=null;"string"==typeof e&&(o=new n(t));o||(o=new r(t));return o.stream(e)},i.unparse=function(e,t){var r=!1,s=!0,n=",",a="\r\n",h='"',l=h+h,u=!1,c=null;!function(){if("object"!=typeof t)return;"string"!=typeof t.delimiter||i.BAD_DELIMITERS.filter((function(e){return-1!==t.delimiter.indexOf(e)})).length||(n=t.delimiter);("boolean"==typeof t.quotes||Array.isArray(t.quotes))&&(r=t.quotes);"boolean"!=typeof t.skipEmptyLines&&"string"!=typeof t.skipEmptyLines||(u=t.skipEmptyLines);"string"==typeof t.newline&&(a=t.newline);"string"==typeof t.quoteChar&&(h=t.quoteChar);"boolean"==typeof t.header&&(s=t.header);if(Array.isArray(t.columns)){if(0===t.columns.length)throw new Error("Option columns is empty");c=t.columns}void 0!==t.escapeChar&&(l=t.escapeChar+h)}();var d=new RegExp(o(h),"g");"string"==typeof e&&(e=JSON.parse(e));if(Array.isArray(e)){if(!e.length||Array.isArray(e[0]))return p(null,e,u);if("object"==typeof e[0])return p(c||f(e[0]),e,u)}else if("object"==typeof e)return"string"==typeof e.data&&(e.data=JSON.parse(e.data)),Array.isArray(e.data)&&(e.fields||(e.fields=e.meta&&e.meta.fields),e.fields||(e.fields=Array.isArray(e.data[0])?e.fields:f(e.data[0])),Array.isArray(e.data[0])||"object"==typeof e.data[0]||(e.data=[e.data])),p(e.fields||[],e.data||[],u);throw new Error("Unable to serialize unrecognized input");function f(e){if("object"!=typeof e)return[];var t=[];for(var r in e)t.push(r);return t}function p(e,t,r){var i="";"string"==typeof e&&(e=JSON.parse(e)),"string"==typeof t&&(t=JSON.parse(t));var o=Array.isArray(e)&&e.length>0,h=!Array.isArray(t[0]);if(o&&s){for(var l=0;l<e.length;l++)l>0&&(i+=n),i+=g(e[l],l);t.length>0&&(i+=a)}for(var u=0;u<t.length;u++){var c=o?e.length:t[u].length,d=!1,f=o?0===Object.keys(t[u]).length:0===t[u].length;if(r&&!o&&(d="greedy"===r?""===t[u].join("").trim():1===t[u].length&&0===t[u][0].length),"greedy"===r&&o){for(var p=[],m=0;m<c;m++){var y=h?e[m]:m;p.push(t[u][y])}d=""===p.join("").trim()}if(!d){for(var b=0;b<c;b++){b>0&&!f&&(i+=n);var w=o&&h?e[b]:b;i+=g(t[u][w],b)}u<t.length-1&&(!r||c>0&&!f)&&(i+=a)}}return i}function g(e,t){return null==e?"":e.constructor===Date?JSON.stringify(e).slice(1,25):(e=e.toString().replace(d,l),"boolean"==typeof r&&r||Array.isArray(r)&&r[t]||function(e,t){for(var r=0;r<t.length;r++)if(e.indexOf(t[r])>-1)return!0;return!1}(e,i.BAD_DELIMITERS)||e.indexOf(n)>-1||" "===e.charAt(0)||" "===e.charAt(e.length-1)?h+e+h:e)}},i.RECORD_SEP=String.fromCharCode(30),i.UNIT_SEP=String.fromCharCode(31),i.BYTE_ORDER_MARK="\ufeff",i.BAD_DELIMITERS=["\r","\n",'"',i.BYTE_ORDER_MARK],i.WORKERS_SUPPORTED=!1,i.NODE_STREAM_INPUT=1,i.LocalChunkSize=10485760,i.RemoteChunkSize=5242880,i.DefaultDelimiter=",",i.Parser=h,i.ParserHandle=a,i.ChunkStreamer=s,i.StringStreamer=n,n.prototype=Object.create(n.prototype),n.prototype.constructor=n},function(e,t,r){const i=r(2);globalThis.loaders=globalThis.loaders||{},e.exports=Object.assign(globalThis.loaders,i)},function(e,t,r){"use strict";function i(e,t){if(!e)throw new Error("null row");if(!t)throw new Error("no headers");const r={};for(let i=0;i<t.length;i++)r[t[i]]=e[i];return r}function s(e,t){if(!e)throw new Error("null row");if(!t)throw new Error("no headers");const r=new Array(t.length);for(let i=0;i<t.length;i++)r[i]=e[t[i]];return r}let n;function a(e,t,r){return t in e?Object.defineProperty(e,t,{value:r,enumerable:!0,configurable:!0,writable:!0}):e[t]=r,e}r.r(t),r.d(t,"CSVLoader",(function(){return C}));class o extends Array{enqueue(e){return this.push(e)}dequeue(){return this.shift()}}n=Symbol.asyncIterator;class h{constructor(){a(this,"_values",void 0),a(this,"_settlers",void 0),a(this,"_closed",void 0),this._values=new o,this._settlers=new o,this._closed=!1}close(){for(;this._settlers.length>0;)this._settlers.dequeue().resolve({done:!0});this._closed=!0}[n](){return this}enqueue(e){if(this._closed)throw new Error("Closed");if(this._settlers.length>0){if(this._values.length>0)throw new Error("Illegal internal state");const t=this._settlers.dequeue();e instanceof Error?t.reject(e):t.resolve({value:e})}else this._values.enqueue(e)}next(){if(this._values.length>0){const e=this._values.dequeue();return e instanceof Error?Promise.reject(e):Promise.resolve({value:e})}if(this._closed){if(this._settlers.length>0)throw new Error("Illegal internal state");return Promise.resolve({done:!0})}return new Promise((e,t)=>{this._settlers.enqueue({resolve:e,reject:t})})}}function l(e,t,r){return t in e?Object.defineProperty(e,t,{value:r,enumerable:!0,configurable:!0,writable:!0}):e[t]=r,e}class u{constructor(e,t){if(l(this,"schema",void 0),l(this,"options",void 0),l(this,"length",0),l(this,"rows",null),l(this,"cursor",0),l(this,"_headers",[]),this.options=t,this.schema=e,!Array.isArray(e)){this._headers=[];for(const t in e)this._headers[e[t].index]=e[t].name}}rowCount(){return this.length}addArrayRow(e,t){Number.isFinite(t)&&(this.cursor=t),this.rows=this.rows||new Array(100),this.rows[this.length]=e,this.length++}addObjectRow(e,t){Number.isFinite(t)&&(this.cursor=t),this.rows=this.rows||new Array(100),this.rows[this.length]=e,this.length++}getBatch(){let e=this.rows;if(!e)return null;e=e.slice(0,this.length),this.rows=null;return{shape:this.options.shape,batchType:"data",data:e,length:this.length,schema:this.schema,cursor:this.cursor}}}function c(e,t,r){return t in e?Object.defineProperty(e,t,{value:r,enumerable:!0,configurable:!0,writable:!0}):e[t]=r,e}class d{constructor(e,t){if(c(this,"schema",void 0),c(this,"options",void 0),c(this,"length",0),c(this,"objectRows",null),c(this,"arrayRows",null),c(this,"cursor",0),c(this,"_headers",[]),this.options=t,this.schema=e,!Array.isArray(e)){this._headers=[];for(const t in e)this._headers[e[t].index]=e[t].name}}rowCount(){return this.length}addArrayRow(e,t){switch(Number.isFinite(t)&&(this.cursor=t),this.options.shape){case"object-row-table":const r=i(e,this._headers);this.addObjectRow(r,t);break;case"array-row-table":this.arrayRows=this.arrayRows||new Array(100),this.arrayRows[this.length]=e,this.length++}}addObjectRow(e,t){switch(Number.isFinite(t)&&(this.cursor=t),this.options.shape){case"array-row-table":const r=s(e,this._headers);this.addArrayRow(r,t);break;case"object-row-table":this.objectRows=this.objectRows||new Array(100),this.objectRows[this.length]=e,this.length++}}getBatch(){let e=this.arrayRows||this.objectRows;return e?(e=e.slice(0,this.length),this.arrayRows=null,this.objectRows=null,{shape:this.options.shape,batchType:"data",data:e,length:this.length,schema:this.schema,cursor:this.cursor}):null}}function f(e,t,r){return t in e?Object.defineProperty(e,t,{value:r,enumerable:!0,configurable:!0,writable:!0}):e[t]=r,e}class p{constructor(e,t){f(this,"schema",void 0),f(this,"length",0),f(this,"allocated",0),f(this,"columns",{}),this.schema=e,this._reallocateColumns()}rowCount(){return this.length}addArrayRow(e){this._reallocateColumns();let t=0;for(const r in this.columns)this.columns[r][this.length]=e[t++];this.length++}addObjectRow(e){this._reallocateColumns();for(const t in e)this.columns[t][this.length]=e[t];this.length++}getBatch(){this._pruneColumns();const e=Array.isArray(this.schema)?this.columns:{};if(!Array.isArray(this.schema))for(const t in this.schema){const r=this.schema[t];e[r.name]=this.columns[r.index]}this.columns={};return{shape:"columnar-table",batchType:"data",data:e,schema:this.schema,length:this.length}}_reallocateColumns(){if(!(this.length<this.allocated)){this.allocated=this.allocated>0?this.allocated*=2:100,this.columns={};for(const e in this.schema){const t=this.schema[e],r=t.type||Float32Array,i=this.columns[t.index];if(i&&ArrayBuffer.isView(i)){const e=new r(this.allocated);e.set(i),this.columns[t.index]=e}else i?(i.length=this.allocated,this.columns[t.index]=i):this.columns[t.index]=new r(this.allocated)}}}_pruneColumns(){for(const[e,t]of Object.entries(this.columns))this.columns[e]=t.slice(0,this.length)}}function g(e,t,r){return t in e?Object.defineProperty(e,t,{value:r,enumerable:!0,configurable:!0,writable:!0}):e[t]=r,e}const m={shape:"array-row-table",batchSize:"auto",batchDebounceMs:0,limit:0,_limitMB:0};class y{constructor(e,t){g(this,"schema",void 0),g(this,"options",void 0),g(this,"aggregator",null),g(this,"batchCount",0),g(this,"bytesUsed",0),g(this,"isChunkComplete",!1),g(this,"lastBatchEmittedMs",Date.now()),g(this,"totalLength",0),g(this,"totalBytes",0),g(this,"rowBytes",0),this.schema=e,this.options={...m,...t}}limitReached(){var e,t;return!!(Boolean(null===(e=this.options)||void 0===e?void 0:e.limit)&&this.totalLength>=this.options.limit)||!!(Boolean(null===(t=this.options)||void 0===t?void 0:t._limitMB)&&this.totalBytes/1e6>=this.options._limitMB)}addRow(e){this.limitReached()||(this.totalLength++,this.rowBytes=this.rowBytes||this._estimateRowMB(e),this.totalBytes+=this.rowBytes,Array.isArray(e)?this.addArrayRow(e):this.addObjectRow(e))}addArrayRow(e){if(!this.aggregator){const e=this._getTableBatchType();this.aggregator=new e(this.schema,this.options)}this.aggregator.addArrayRow(e)}addObjectRow(e){if(!this.aggregator){const e=this._getTableBatchType();this.aggregator=new e(this.schema,this.options)}this.aggregator.addObjectRow(e)}chunkComplete(e){e instanceof ArrayBuffer&&(this.bytesUsed+=e.byteLength),"string"==typeof e&&(this.bytesUsed+=e.length),this.isChunkComplete=!0}getFullBatch(e){return this._isFull()?this._getBatch(e):null}getFinalBatch(e){return this._getBatch(e)}_estimateRowMB(e){return Array.isArray(e)?8*e.length:8*Object.keys(e).length}_isFull(){if(!this.aggregator||0===this.aggregator.rowCount())return!1;if("auto"===this.options.batchSize){if(!this.isChunkComplete)return!1}else if(this.options.batchSize>this.aggregator.rowCount())return!1;return!(this.options.batchDebounceMs>Date.now()-this.lastBatchEmittedMs)&&(this.isChunkComplete=!1,this.lastBatchEmittedMs=Date.now(),!0)}_getBatch(e){if(!this.aggregator)return null;null!=e&&e.bytesUsed&&(this.bytesUsed=e.bytesUsed);const t=this.aggregator.getBatch();return t.count=this.batchCount,t.bytesUsed=this.bytesUsed,Object.assign(t,e),this.batchCount++,this.aggregator=null,t}_getTableBatchType(){switch(this.options.shape){case"row-table":return u;case"array-row-table":case"object-row-table":return d;case"columnar-table":return p;case"arrow-table":if(!y.ArrowBatch)throw new Error("TableBatchBuilder");return y.ArrowBatch;default:throw new Error("TableBatchBuilder")}}}g(y,"ArrowBatch",void 0);var b=r(0),w=r.n(b);const{ChunkStreamer:v}=w.a;function _(e){e=e||{},v.call(this,e),this.textDecoder=new TextDecoder(this._config.encoding),this.stream=async function(e){this._input=e;try{for await(const t of e)this.parseChunk(this.getStringChunk(t));this._finished=!0,this.parseChunk("")}catch(e){this._sendError(e)}},this._nextChunk=function(){},this.getStringChunk=function(e){return"string"==typeof e?e:this.textDecoder.decode(e,{stream:!0})}}_.prototype=Object.create(v.prototype),_.prototype.constructor=_;const A={csv:{shape:"object-row-table",optimizeMemoryUsage:!1,header:"auto",columnPrefix:"column",quoteChar:'"',escapeChar:'"',dynamicTyping:!0,comments:!1,skipEmptyLines:!0,delimitersToGuess:[",","\t","|",";"]}},C={id:"csv",module:"csv",name:"CSV",version:"3.1.0-alpha.4",extensions:["csv","tsv","dsv"],mimeTypes:["text/csv","text/tab-separated-values","text/dsv"],category:"table",parse:async(e,t)=>x((new TextDecoder).decode(e),t),parseText:(e,t)=>x(e,t),parseInBatches:function(e,t){var r;"auto"===(t={...t}).batchSize&&(t.batchSize=4e3);const i={...A.csv,...null===(r=t)||void 0===r?void 0:r.csv},s=new h;let n=!0,a=null,o=null,l=null;const u={...i,header:!1,download:!1,chunkSize:5242880,skipEmptyLines:!1,step(e){let r=e.data;if(i.skipEmptyLines){if(""===r.flat().join("").trim())return}const h=e.meta.cursor;if(n&&!a){if("auto"===i.header?R(r):Boolean(i.header))return void(a=r.map(E()))}n&&(n=!1,a||(a=k(i.columnPrefix,r.length)),l=function(e,t){const r=t?{}:[];for(let i=0;i<e.length;i++){const s=t&&t[i]||i;switch(typeof e[i]){case"number":case"boolean":r[s]={name:String(s),index:i,type:Float32Array};break;case"string":default:r[s]={name:String(s),index:i,type:Array}}}return r}(r,a)),i.optimizeMemoryUsage&&(r=JSON.parse(JSON.stringify(r))),o=o||new y(l,{shape:i.shape||"array-row-table",...t});try{o.addRow(r);const e=o&&o.getFullBatch({bytesUsed:h});e&&s.enqueue(e)}catch(e){s.enqueue(e)}},complete(e){try{const t=e.meta.cursor,r=o&&o.getFinalBatch({bytesUsed:t});r&&s.enqueue(r)}catch(e){s.enqueue(e)}s.close()}};return w.a.parse(e,u,_),s},options:A};async function x(e,t){const r={...A.csv,...null==t?void 0:t.csv},n=function(e){return w.a.parse(e,{download:!1,dynamicTyping:!0,preview:1}).data[0]}(e),a="auto"===r.header?R(n):Boolean(r.header),o={...r,header:a,download:!1,transformHeader:a?E():void 0,error:e=>{throw new Error(e)}},h=w.a.parse(e,o);let{data:l}=h;const u=h.meta.fields||k(r.columnPrefix,n.length);switch(r.shape){case"object-row-table":l=l.map(e=>Array.isArray(e)?i(e,u):e);break;case"array-row-table":l=l.map(e=>Array.isArray(e)?e:s(e,u))}return l}function R(e){return e&&e.every(e=>"string"==typeof e)}function E(){const e=new Set;return t=>{let r=t,i=1;for(;e.has(r);)r=`${t}.${i}`,i++;return e.add(r),r}}function k(e,t=0){const r=[];for(let i=0;i<t;i++)r.push(`${e}${i+1}`);return r}}])}));
|
|
8
|
+
var r="undefined"!=typeof self?self:"undefined"!=typeof window?window:void 0!==r?r:{},i={};function s(e){this._handle=null,this._finished=!1,this._completed=!1,this._input=null,this._baseIndex=0,this._partialLine="",this._rowCount=0,this._start=0,this._nextChunk=null,this.isFirstChunk=!0,this._completeResults={data:[],errors:[],meta:{}},function(e){var t=l(e);t.chunkSize=parseInt(t.chunkSize),e.step||e.chunk||(t.chunkSize=null);this._handle=new a(t),this._handle.streamer=this,this._config=t}.call(this,e),this.parseChunk=function(e,t){if(this.isFirstChunk&&u(this._config.beforeFirstChunk)){var r=this._config.beforeFirstChunk(e);void 0!==r&&(e=r)}this.isFirstChunk=!1;var i=this._partialLine+e;this._partialLine="";var s=this._handle.parse(i,this._baseIndex,!this._finished);if(!this._handle.paused()&&!this._handle.aborted()){var n=s.meta.cursor;this._finished||(this._partialLine=i.substring(n-this._baseIndex),this._baseIndex=n),s&&s.data&&(this._rowCount+=s.data.length);var a=this._finished||this._config.preview&&this._rowCount>=this._config.preview;if(u(this._config.chunk)&&!t){if(this._config.chunk(s,this._handle),this._handle.paused()||this._handle.aborted())return;s=void 0,this._completeResults=void 0}return this._config.step||this._config.chunk||(this._completeResults.data=this._completeResults.data.concat(s.data),this._completeResults.errors=this._completeResults.errors.concat(s.errors),this._completeResults.meta=s.meta),this._completed||!a||!u(this._config.complete)||s&&s.meta.aborted||(this._config.complete(this._completeResults,this._input),this._completed=!0),a||s&&s.meta.paused||this._nextChunk(),s}},this._sendError=function(e){u(this._config.error)&&this._config.error(e)}}function n(e){var t;e=e||{},s.call(this,e),this.stream=function(e){return t=e,this._nextChunk()},this._nextChunk=function(){if(!this._finished){var e=this._config.chunkSize,r=e?t.substr(0,e):t;return t=e?t.substr(e):"",this._finished=!t,this.parseChunk(r)}}}function a(e){var t,r,s,n=/^\s*-?(\d*\.?\d+|\d+\.?\d*)(e[-+]?\d+)?\s*$/i,a=/(\d{4}-[01]\d-[0-3]\dT[0-2]\d:[0-5]\d:[0-5]\d\.\d+([+-][0-2]\d:[0-5]\d|Z))|(\d{4}-[01]\d-[0-3]\dT[0-2]\d:[0-5]\d:[0-5]\d([+-][0-2]\d:[0-5]\d|Z))|(\d{4}-[01]\d-[0-3]\dT[0-2]\d:[0-5]\d([+-][0-2]\d:[0-5]\d|Z))/,c=this,d=0,f=0,p=!1,g=!1,m=[],y={data:[],errors:[],meta:{}};if(u(e.step)){var b=e.step;e.step=function(t){if(y=t,_())v();else{if(v(),!y.data||0===y.data.length)return;d+=t.data.length,e.preview&&d>e.preview?r.abort():b(y,c)}}}function w(t){return"greedy"===e.skipEmptyLines?""===t.join("").trim():1===t.length&&0===t[0].length}function v(){if(y&&s&&(C("Delimiter","UndetectableDelimiter","Unable to auto-detect delimiting character; defaulted to '"+i.DefaultDelimiter+"'"),s=!1),e.skipEmptyLines)for(var t=0;t<y.data.length;t++)w(y.data[t])&&y.data.splice(t--,1);return _()&&function(){if(!y)return;function t(t){u(e.transformHeader)&&(t=e.transformHeader(t)),m.push(t)}if(Array.isArray(y.data[0])){for(var r=0;_()&&r<y.data.length;r++)y.data[r].forEach(t);y.data.splice(0,1)}else y.data.forEach(t)}(),function(){if(!y||!y.data||!e.header&&!e.dynamicTyping&&!e.transform)return y;function t(t,r){var i,s=e.header?{}:[];for(i=0;i<t.length;i++){var n=i,a=t[i];e.header&&(n=i>=m.length?"__parsed_extra":m[i]),e.transform&&(a=e.transform(a,n)),a=A(n,a),"__parsed_extra"===n?(s[n]=s[n]||[],s[n].push(a)):s[n]=a}return e.header&&(i>m.length?C("FieldMismatch","TooManyFields","Too many fields: expected "+m.length+" fields but parsed "+i,f+r):i<m.length&&C("FieldMismatch","TooFewFields","Too few fields: expected "+m.length+" fields but parsed "+i,f+r)),s}var r=1;!y.data[0]||Array.isArray(y.data[0])?(y.data=y.data.map(t),r=y.data.length):y.data=t(y.data,0);e.header&&y.meta&&(y.meta.fields=m);return f+=r,y}()}function _(){return e.header&&0===m.length}function A(t,r){return function(t){return e.dynamicTypingFunction&&void 0===e.dynamicTyping[t]&&(e.dynamicTyping[t]=e.dynamicTypingFunction(t)),!0===(e.dynamicTyping[t]||e.dynamicTyping)}(t)?"true"===r||"TRUE"===r||"false"!==r&&"FALSE"!==r&&(n.test(r)?parseFloat(r):a.test(r)?new Date(r):""===r?null:r):r}function C(e,t,r,i){y.errors.push({type:e,code:t,message:r,row:i})}this.parse=function(n,a,c){var d=e.quoteChar||'"';if(e.newline||(e.newline=function(e,t){e=e.substr(0,1048576);var r=new RegExp(o(t)+"([^]*?)"+o(t),"gm"),i=(e=e.replace(r,"")).split("\r"),s=e.split("\n"),n=s.length>1&&s[0].length<i[0].length;if(1===i.length||n)return"\n";for(var a=0,h=0;h<i.length;h++)"\n"===i[h][0]&&a++;return a>=i.length/2?"\r\n":"\r"}(n,d)),s=!1,e.delimiter)u(e.delimiter)&&(e.delimiter=e.delimiter(n),y.meta.delimiter=e.delimiter);else{var f=function(t,r,s,n,a){var o,l,u;a=a||[",","\t","|",";",i.RECORD_SEP,i.UNIT_SEP];for(var c=0;c<a.length;c++){var d=a[c],f=0,p=0,g=0;u=void 0;for(var m=new h({comments:n,delimiter:d,newline:r,preview:10}).parse(t),y=0;y<m.data.length;y++)if(s&&w(m.data[y]))g++;else{var b=m.data[y].length;p+=b,void 0!==u?b>1&&(f+=Math.abs(b-u),u=b):u=0}m.data.length>0&&(p/=m.data.length-g),(void 0===l||f>l)&&p>1.99&&(l=f,o=d)}return e.delimiter=o,{successful:!!o,bestDelimiter:o}}(n,e.newline,e.skipEmptyLines,e.comments,e.delimitersToGuess);f.successful?e.delimiter=f.bestDelimiter:(s=!0,e.delimiter=i.DefaultDelimiter),y.meta.delimiter=e.delimiter}var g=l(e);return e.preview&&e.header&&g.preview++,t=n,r=new h(g),y=r.parse(t,a,c),v(),p?{meta:{paused:!0}}:y||{meta:{paused:!1}}},this.paused=function(){return p},this.pause=function(){p=!0,r.abort(),t=t.substr(r.getCharIndex())},this.resume=function(){p=!1,c.streamer.parseChunk(t,!0)},this.aborted=function(){return g},this.abort=function(){g=!0,r.abort(),y.meta.aborted=!0,u(e.complete)&&e.complete(y),t=""}}function o(e){return e.replace(/[.*+?^${}()|[\]\\]/g,"\\$&")}function h(e){var t,r=(e=e||{}).delimiter,s=e.newline,n=e.comments,a=e.step,h=e.preview,l=e.fastMode,c=t=void 0===e.quoteChar?'"':e.quoteChar;if(void 0!==e.escapeChar&&(c=e.escapeChar),("string"!=typeof r||i.BAD_DELIMITERS.indexOf(r)>-1)&&(r=","),n===r)throw new Error("Comment character same as delimiter");!0===n?n="#":("string"!=typeof n||i.BAD_DELIMITERS.indexOf(n)>-1)&&(n=!1),"\n"!==s&&"\r"!==s&&"\r\n"!==s&&(s="\n");var d=0,f=!1;this.parse=function(e,i,p){if("string"!=typeof e)throw new Error("Input must be a string");var g=e.length,m=r.length,y=s.length,b=n.length,w=u(a);d=0;var v=[],_=[],A=[],C=0;if(!e)return F();if(l||!1!==l&&-1===e.indexOf(t)){for(var x=e.split(s),R=0;R<x.length;R++){if(A=x[R],d+=A.length,R!==x.length-1)d+=s.length;else if(p)return F();if(!n||A.substr(0,b)!==n){if(w){if(v=[],B(A.split(r)),I(),f)return F()}else B(A.split(r));if(h&&R>=h)return v=v.slice(0,h),F(!0)}}return F()}for(var E,k=e.indexOf(r,d),O=e.indexOf(s,d),T=new RegExp(o(c)+o(t),"g");;)if(e[d]!==t)if(n&&0===A.length&&e.substr(d,b)===n){if(-1===O)return F();d=O+y,O=e.indexOf(s,d),k=e.indexOf(r,d)}else if(-1!==k&&(k<O||-1===O))A.push(e.substring(d,k)),d=k+m,k=e.indexOf(r,d);else{if(-1===O)break;if(A.push(e.substring(d,O)),P(O+y),w&&(I(),f))return F();if(h&&v.length>=h)return F(!0)}else{for(E=d,d++;;){if(-1===(E=e.indexOf(t,E+1)))return p||_.push({type:"Quotes",code:"MissingQuotes",message:"Quoted field unterminated",row:v.length,index:d}),M();if(E===g-1)return M(e.substring(d,E).replace(T,t));if(t!==c||e[E+1]!==c){if(t===c||0===E||e[E-1]!==c){var S=D(-1===O?k:Math.min(k,O));if(e[E+1+S]===r){if(A.push(e.substring(d,E).replace(T,t)),d=E+1+S+m,k=e.indexOf(r,d),O=e.indexOf(s,d),w&&(I(),f))return F();if(h&&v.length>=h)return F(!0);break}var j=D(O);if(e.substr(E+1+j,y)===s){if(A.push(e.substring(d,E).replace(T,t)),P(E+1+j+y),k=e.indexOf(r,d),w&&(I(),f))return F();if(h&&v.length>=h)return F(!0);break}_.push({type:"Quotes",code:"InvalidQuotes",message:"Trailing quote on quoted field is malformed",row:v.length,index:d}),E++}}else E++}if(w&&(I(),f))return F();if(h&&v.length>=h)return F(!0)}return M();function B(e){v.push(e),C=d}function D(t){var r=0;if(-1!==t){var i=e.substring(E+1,t);i&&""===i.trim()&&(r=i.length)}return r}function M(t){return p||(void 0===t&&(t=e.substr(d)),A.push(t),d=g,B(A),w&&I()),F()}function P(t){d=t,B(A),A=[],O=e.indexOf(s,d)}function F(e,t){return{data:t||!1?v[0]:v,errors:_,meta:{delimiter:r,linebreak:s,aborted:f,truncated:!!e,cursor:C+(i||0)}}}function I(){a(F(void 0,!0)),v=[],_=[]}},this.abort=function(){f=!0},this.getCharIndex=function(){return d}}function l(e){if("object"!=typeof e||null===e)return e;var t=Array.isArray(e)?[]:{};for(var r in e)t[r]=l(e[r]);return t}function u(e){return"function"==typeof e}e.exports=i,i.parse=function(e,t,r){var s=(t=t||{}).dynamicTyping||!1;u(s)&&(t.dynamicTypingFunction=s,s={});if(t.dynamicTyping=s,t.transform=!!u(t.transform)&&t.transform,t.worker&&i.WORKERS_SUPPORTED){var a=newWorker();return a.userStep=t.step,a.userChunk=t.chunk,a.userComplete=t.complete,a.userError=t.error,t.step=u(t.step),t.chunk=u(t.chunk),t.complete=u(t.complete),t.error=u(t.error),delete t.worker,void a.postMessage({input:e,config:t,workerId:a.id})}var o=null;"string"==typeof e&&(o=new n(t));o||(o=new r(t));return o.stream(e)},i.unparse=function(e,t){var r=!1,s=!0,n=",",a="\r\n",h='"',l=h+h,u=!1,c=null;!function(){if("object"!=typeof t)return;"string"!=typeof t.delimiter||i.BAD_DELIMITERS.filter((function(e){return-1!==t.delimiter.indexOf(e)})).length||(n=t.delimiter);("boolean"==typeof t.quotes||Array.isArray(t.quotes))&&(r=t.quotes);"boolean"!=typeof t.skipEmptyLines&&"string"!=typeof t.skipEmptyLines||(u=t.skipEmptyLines);"string"==typeof t.newline&&(a=t.newline);"string"==typeof t.quoteChar&&(h=t.quoteChar);"boolean"==typeof t.header&&(s=t.header);if(Array.isArray(t.columns)){if(0===t.columns.length)throw new Error("Option columns is empty");c=t.columns}void 0!==t.escapeChar&&(l=t.escapeChar+h)}();var d=new RegExp(o(h),"g");"string"==typeof e&&(e=JSON.parse(e));if(Array.isArray(e)){if(!e.length||Array.isArray(e[0]))return p(null,e,u);if("object"==typeof e[0])return p(c||f(e[0]),e,u)}else if("object"==typeof e)return"string"==typeof e.data&&(e.data=JSON.parse(e.data)),Array.isArray(e.data)&&(e.fields||(e.fields=e.meta&&e.meta.fields),e.fields||(e.fields=Array.isArray(e.data[0])?e.fields:f(e.data[0])),Array.isArray(e.data[0])||"object"==typeof e.data[0]||(e.data=[e.data])),p(e.fields||[],e.data||[],u);throw new Error("Unable to serialize unrecognized input");function f(e){if("object"!=typeof e)return[];var t=[];for(var r in e)t.push(r);return t}function p(e,t,r){var i="";"string"==typeof e&&(e=JSON.parse(e)),"string"==typeof t&&(t=JSON.parse(t));var o=Array.isArray(e)&&e.length>0,h=!Array.isArray(t[0]);if(o&&s){for(var l=0;l<e.length;l++)l>0&&(i+=n),i+=g(e[l],l);t.length>0&&(i+=a)}for(var u=0;u<t.length;u++){var c=o?e.length:t[u].length,d=!1,f=o?0===Object.keys(t[u]).length:0===t[u].length;if(r&&!o&&(d="greedy"===r?""===t[u].join("").trim():1===t[u].length&&0===t[u][0].length),"greedy"===r&&o){for(var p=[],m=0;m<c;m++){var y=h?e[m]:m;p.push(t[u][y])}d=""===p.join("").trim()}if(!d){for(var b=0;b<c;b++){b>0&&!f&&(i+=n);var w=o&&h?e[b]:b;i+=g(t[u][w],b)}u<t.length-1&&(!r||c>0&&!f)&&(i+=a)}}return i}function g(e,t){return null==e?"":e.constructor===Date?JSON.stringify(e).slice(1,25):(e=e.toString().replace(d,l),"boolean"==typeof r&&r||Array.isArray(r)&&r[t]||function(e,t){for(var r=0;r<t.length;r++)if(e.indexOf(t[r])>-1)return!0;return!1}(e,i.BAD_DELIMITERS)||e.indexOf(n)>-1||" "===e.charAt(0)||" "===e.charAt(e.length-1)?h+e+h:e)}},i.RECORD_SEP=String.fromCharCode(30),i.UNIT_SEP=String.fromCharCode(31),i.BYTE_ORDER_MARK="\ufeff",i.BAD_DELIMITERS=["\r","\n",'"',i.BYTE_ORDER_MARK],i.WORKERS_SUPPORTED=!1,i.NODE_STREAM_INPUT=1,i.LocalChunkSize=10485760,i.RemoteChunkSize=5242880,i.DefaultDelimiter=",",i.Parser=h,i.ParserHandle=a,i.ChunkStreamer=s,i.StringStreamer=n,n.prototype=Object.create(n.prototype),n.prototype.constructor=n},function(e,t,r){const i=r(2);globalThis.loaders=globalThis.loaders||{},e.exports=Object.assign(globalThis.loaders,i)},function(e,t,r){"use strict";function i(e,t){if(!e)throw new Error("null row");if(!t)throw new Error("no headers");const r={};for(let i=0;i<t.length;i++)r[t[i]]=e[i];return r}function s(e,t){if(!e)throw new Error("null row");if(!t)throw new Error("no headers");const r=new Array(t.length);for(let i=0;i<t.length;i++)r[i]=e[t[i]];return r}let n;function a(e,t,r){return t in e?Object.defineProperty(e,t,{value:r,enumerable:!0,configurable:!0,writable:!0}):e[t]=r,e}r.r(t),r.d(t,"CSVLoader",(function(){return C}));class o extends Array{enqueue(e){return this.push(e)}dequeue(){return this.shift()}}n=Symbol.asyncIterator;class h{constructor(){a(this,"_values",void 0),a(this,"_settlers",void 0),a(this,"_closed",void 0),this._values=new o,this._settlers=new o,this._closed=!1}close(){for(;this._settlers.length>0;)this._settlers.dequeue().resolve({done:!0});this._closed=!0}[n](){return this}enqueue(e){if(this._closed)throw new Error("Closed");if(this._settlers.length>0){if(this._values.length>0)throw new Error("Illegal internal state");const t=this._settlers.dequeue();e instanceof Error?t.reject(e):t.resolve({value:e})}else this._values.enqueue(e)}next(){if(this._values.length>0){const e=this._values.dequeue();return e instanceof Error?Promise.reject(e):Promise.resolve({value:e})}if(this._closed){if(this._settlers.length>0)throw new Error("Illegal internal state");return Promise.resolve({done:!0})}return new Promise((e,t)=>{this._settlers.enqueue({resolve:e,reject:t})})}}function l(e,t,r){return t in e?Object.defineProperty(e,t,{value:r,enumerable:!0,configurable:!0,writable:!0}):e[t]=r,e}class u{constructor(e,t){if(l(this,"schema",void 0),l(this,"options",void 0),l(this,"length",0),l(this,"rows",null),l(this,"cursor",0),l(this,"_headers",[]),this.options=t,this.schema=e,!Array.isArray(e)){this._headers=[];for(const t in e)this._headers[e[t].index]=e[t].name}}rowCount(){return this.length}addArrayRow(e,t){Number.isFinite(t)&&(this.cursor=t),this.rows=this.rows||new Array(100),this.rows[this.length]=e,this.length++}addObjectRow(e,t){Number.isFinite(t)&&(this.cursor=t),this.rows=this.rows||new Array(100),this.rows[this.length]=e,this.length++}getBatch(){let e=this.rows;if(!e)return null;e=e.slice(0,this.length),this.rows=null;return{shape:this.options.shape,batchType:"data",data:e,length:this.length,schema:this.schema,cursor:this.cursor}}}function c(e,t,r){return t in e?Object.defineProperty(e,t,{value:r,enumerable:!0,configurable:!0,writable:!0}):e[t]=r,e}class d{constructor(e,t){if(c(this,"schema",void 0),c(this,"options",void 0),c(this,"length",0),c(this,"objectRows",null),c(this,"arrayRows",null),c(this,"cursor",0),c(this,"_headers",[]),this.options=t,this.schema=e,!Array.isArray(e)){this._headers=[];for(const t in e)this._headers[e[t].index]=e[t].name}}rowCount(){return this.length}addArrayRow(e,t){switch(Number.isFinite(t)&&(this.cursor=t),this.options.shape){case"object-row-table":const r=i(e,this._headers);this.addObjectRow(r,t);break;case"array-row-table":this.arrayRows=this.arrayRows||new Array(100),this.arrayRows[this.length]=e,this.length++}}addObjectRow(e,t){switch(Number.isFinite(t)&&(this.cursor=t),this.options.shape){case"array-row-table":const r=s(e,this._headers);this.addArrayRow(r,t);break;case"object-row-table":this.objectRows=this.objectRows||new Array(100),this.objectRows[this.length]=e,this.length++}}getBatch(){let e=this.arrayRows||this.objectRows;return e?(e=e.slice(0,this.length),this.arrayRows=null,this.objectRows=null,{shape:this.options.shape,batchType:"data",data:e,length:this.length,schema:this.schema,cursor:this.cursor}):null}}function f(e,t,r){return t in e?Object.defineProperty(e,t,{value:r,enumerable:!0,configurable:!0,writable:!0}):e[t]=r,e}class p{constructor(e,t){f(this,"schema",void 0),f(this,"length",0),f(this,"allocated",0),f(this,"columns",{}),this.schema=e,this._reallocateColumns()}rowCount(){return this.length}addArrayRow(e){this._reallocateColumns();let t=0;for(const r in this.columns)this.columns[r][this.length]=e[t++];this.length++}addObjectRow(e){this._reallocateColumns();for(const t in e)this.columns[t][this.length]=e[t];this.length++}getBatch(){this._pruneColumns();const e=Array.isArray(this.schema)?this.columns:{};if(!Array.isArray(this.schema))for(const t in this.schema){const r=this.schema[t];e[r.name]=this.columns[r.index]}this.columns={};return{shape:"columnar-table",batchType:"data",data:e,schema:this.schema,length:this.length}}_reallocateColumns(){if(!(this.length<this.allocated)){this.allocated=this.allocated>0?this.allocated*=2:100,this.columns={};for(const e in this.schema){const t=this.schema[e],r=t.type||Float32Array,i=this.columns[t.index];if(i&&ArrayBuffer.isView(i)){const e=new r(this.allocated);e.set(i),this.columns[t.index]=e}else i?(i.length=this.allocated,this.columns[t.index]=i):this.columns[t.index]=new r(this.allocated)}}}_pruneColumns(){for(const[e,t]of Object.entries(this.columns))this.columns[e]=t.slice(0,this.length)}}function g(e,t,r){return t in e?Object.defineProperty(e,t,{value:r,enumerable:!0,configurable:!0,writable:!0}):e[t]=r,e}const m={shape:"array-row-table",batchSize:"auto",batchDebounceMs:0,limit:0,_limitMB:0};class y{constructor(e,t){g(this,"schema",void 0),g(this,"options",void 0),g(this,"aggregator",null),g(this,"batchCount",0),g(this,"bytesUsed",0),g(this,"isChunkComplete",!1),g(this,"lastBatchEmittedMs",Date.now()),g(this,"totalLength",0),g(this,"totalBytes",0),g(this,"rowBytes",0),this.schema=e,this.options={...m,...t}}limitReached(){var e,t;return!!(Boolean(null===(e=this.options)||void 0===e?void 0:e.limit)&&this.totalLength>=this.options.limit)||!!(Boolean(null===(t=this.options)||void 0===t?void 0:t._limitMB)&&this.totalBytes/1e6>=this.options._limitMB)}addRow(e){this.limitReached()||(this.totalLength++,this.rowBytes=this.rowBytes||this._estimateRowMB(e),this.totalBytes+=this.rowBytes,Array.isArray(e)?this.addArrayRow(e):this.addObjectRow(e))}addArrayRow(e){if(!this.aggregator){const e=this._getTableBatchType();this.aggregator=new e(this.schema,this.options)}this.aggregator.addArrayRow(e)}addObjectRow(e){if(!this.aggregator){const e=this._getTableBatchType();this.aggregator=new e(this.schema,this.options)}this.aggregator.addObjectRow(e)}chunkComplete(e){e instanceof ArrayBuffer&&(this.bytesUsed+=e.byteLength),"string"==typeof e&&(this.bytesUsed+=e.length),this.isChunkComplete=!0}getFullBatch(e){return this._isFull()?this._getBatch(e):null}getFinalBatch(e){return this._getBatch(e)}_estimateRowMB(e){return Array.isArray(e)?8*e.length:8*Object.keys(e).length}_isFull(){if(!this.aggregator||0===this.aggregator.rowCount())return!1;if("auto"===this.options.batchSize){if(!this.isChunkComplete)return!1}else if(this.options.batchSize>this.aggregator.rowCount())return!1;return!(this.options.batchDebounceMs>Date.now()-this.lastBatchEmittedMs)&&(this.isChunkComplete=!1,this.lastBatchEmittedMs=Date.now(),!0)}_getBatch(e){if(!this.aggregator)return null;null!=e&&e.bytesUsed&&(this.bytesUsed=e.bytesUsed);const t=this.aggregator.getBatch();return t.count=this.batchCount,t.bytesUsed=this.bytesUsed,Object.assign(t,e),this.batchCount++,this.aggregator=null,t}_getTableBatchType(){switch(this.options.shape){case"row-table":return u;case"array-row-table":case"object-row-table":return d;case"columnar-table":return p;case"arrow-table":if(!y.ArrowBatch)throw new Error("TableBatchBuilder");return y.ArrowBatch;default:throw new Error("TableBatchBuilder")}}}g(y,"ArrowBatch",void 0);var b=r(0),w=r.n(b);const{ChunkStreamer:v}=w.a;function _(e){e=e||{},v.call(this,e),this.textDecoder=new TextDecoder(this._config.encoding),this.stream=async function(e){this._input=e;try{for await(const t of e)this.parseChunk(this.getStringChunk(t));this._finished=!0,this.parseChunk("")}catch(e){this._sendError(e)}},this._nextChunk=function(){},this.getStringChunk=function(e){return"string"==typeof e?e:this.textDecoder.decode(e,{stream:!0})}}_.prototype=Object.create(v.prototype),_.prototype.constructor=_;const A={csv:{shape:"object-row-table",optimizeMemoryUsage:!1,header:"auto",columnPrefix:"column",quoteChar:'"',escapeChar:'"',dynamicTyping:!0,comments:!1,skipEmptyLines:!0,delimitersToGuess:[",","\t","|",";"]}},C={id:"csv",module:"csv",name:"CSV",version:"3.1.0-alpha.5",extensions:["csv","tsv","dsv"],mimeTypes:["text/csv","text/tab-separated-values","text/dsv"],category:"table",parse:async(e,t)=>x((new TextDecoder).decode(e),t),parseText:(e,t)=>x(e,t),parseInBatches:function(e,t){var r;"auto"===(t={...t}).batchSize&&(t.batchSize=4e3);const i={...A.csv,...null===(r=t)||void 0===r?void 0:r.csv},s=new h;let n=!0,a=null,o=null,l=null;const u={...i,header:!1,download:!1,chunkSize:5242880,skipEmptyLines:!1,step(e){let r=e.data;if(i.skipEmptyLines){if(""===r.flat().join("").trim())return}const h=e.meta.cursor;if(n&&!a){if("auto"===i.header?R(r):Boolean(i.header))return void(a=r.map(E()))}n&&(n=!1,a||(a=k(i.columnPrefix,r.length)),l=function(e,t){const r=t?{}:[];for(let i=0;i<e.length;i++){const s=t&&t[i]||i;switch(typeof e[i]){case"number":case"boolean":r[s]={name:String(s),index:i,type:Float32Array};break;case"string":default:r[s]={name:String(s),index:i,type:Array}}}return r}(r,a)),i.optimizeMemoryUsage&&(r=JSON.parse(JSON.stringify(r))),o=o||new y(l,{shape:i.shape||"array-row-table",...t});try{o.addRow(r);const e=o&&o.getFullBatch({bytesUsed:h});e&&s.enqueue(e)}catch(e){s.enqueue(e)}},complete(e){try{const t=e.meta.cursor,r=o&&o.getFinalBatch({bytesUsed:t});r&&s.enqueue(r)}catch(e){s.enqueue(e)}s.close()}};return w.a.parse(e,u,_),s},options:A};async function x(e,t){const r={...A.csv,...null==t?void 0:t.csv},n=function(e){return w.a.parse(e,{download:!1,dynamicTyping:!0,preview:1}).data[0]}(e),a="auto"===r.header?R(n):Boolean(r.header),o={...r,header:a,download:!1,transformHeader:a?E():void 0,error:e=>{throw new Error(e)}},h=w.a.parse(e,o);let{data:l}=h;const u=h.meta.fields||k(r.columnPrefix,n.length);switch(r.shape){case"object-row-table":l=l.map(e=>Array.isArray(e)?i(e,u):e);break;case"array-row-table":l=l.map(e=>Array.isArray(e)?e:s(e,u))}return l}function R(e){return e&&e.every(e=>"string"==typeof e)}function E(){const e=new Set;return t=>{let r=t,i=1;for(;e.has(r);)r=`${t}.${i}`,i++;return e.add(r),r}}function k(e,t=0){const r=[];for(let i=0;i<t;i++)r.push(`${e}${i+1}`);return r}}])}));
|
|
9
9
|
//# sourceMappingURL=dist.min.js.map
|
package/dist/es5/bundle.js
CHANGED
package/dist/es5/bundle.js.map
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"sources":["../../src/bundle.ts"],"names":["moduleExports","require","globalThis","loaders","module","exports","Object","assign"],"mappings":";;AACA,
|
|
1
|
+
{"version":3,"sources":["../../src/bundle.ts"],"names":["moduleExports","require","globalThis","loaders","module","exports","Object","assign"],"mappings":";;AACA,MAAMA,aAAa,GAAGC,OAAO,CAAC,SAAD,CAA7B;;AACAC,UAAU,CAACC,OAAX,GAAqBD,UAAU,CAACC,OAAX,IAAsB,EAA3C;AACAC,MAAM,CAACC,OAAP,GAAiBC,MAAM,CAACC,MAAP,CAAcL,UAAU,CAACC,OAAzB,EAAkCH,aAAlC,CAAjB","sourcesContent":["// @ts-nocheck\nconst moduleExports = require('./index');\nglobalThis.loaders = globalThis.loaders || {};\nmodule.exports = Object.assign(globalThis.loaders, moduleExports);\n"],"file":"bundle.js"}
|
package/dist/es5/csv-loader.js
CHANGED
|
@@ -7,26 +7,14 @@ Object.defineProperty(exports, "__esModule", {
|
|
|
7
7
|
});
|
|
8
8
|
exports._typecheckCSVLoader = exports.CSVLoader = void 0;
|
|
9
9
|
|
|
10
|
-
var _regenerator = _interopRequireDefault(require("@babel/runtime/regenerator"));
|
|
11
|
-
|
|
12
|
-
var _typeof2 = _interopRequireDefault(require("@babel/runtime/helpers/typeof"));
|
|
13
|
-
|
|
14
|
-
var _defineProperty2 = _interopRequireDefault(require("@babel/runtime/helpers/defineProperty"));
|
|
15
|
-
|
|
16
|
-
var _asyncToGenerator2 = _interopRequireDefault(require("@babel/runtime/helpers/asyncToGenerator"));
|
|
17
|
-
|
|
18
10
|
var _schema = require("@loaders.gl/schema");
|
|
19
11
|
|
|
20
12
|
var _papaparse = _interopRequireDefault(require("./libs/papaparse"));
|
|
21
13
|
|
|
22
14
|
var _asyncIteratorStreamer = _interopRequireDefault(require("./lib/async-iterator-streamer"));
|
|
23
15
|
|
|
24
|
-
|
|
25
|
-
|
|
26
|
-
function _objectSpread(target) { for (var i = 1; i < arguments.length; i++) { var source = arguments[i] != null ? arguments[i] : {}; if (i % 2) { ownKeys(Object(source), true).forEach(function (key) { (0, _defineProperty2.default)(target, key, source[key]); }); } else if (Object.getOwnPropertyDescriptors) { Object.defineProperties(target, Object.getOwnPropertyDescriptors(source)); } else { ownKeys(Object(source)).forEach(function (key) { Object.defineProperty(target, key, Object.getOwnPropertyDescriptor(source, key)); }); } } return target; }
|
|
27
|
-
|
|
28
|
-
var VERSION = typeof "3.1.0-alpha.4" !== 'undefined' ? "3.1.0-alpha.4" : 'latest';
|
|
29
|
-
var DEFAULT_CSV_LOADER_OPTIONS = {
|
|
16
|
+
const VERSION = typeof "3.1.0-alpha.5" !== 'undefined' ? "3.1.0-alpha.5" : 'latest';
|
|
17
|
+
const DEFAULT_CSV_LOADER_OPTIONS = {
|
|
30
18
|
csv: {
|
|
31
19
|
shape: 'object-row-table',
|
|
32
20
|
optimizeMemoryUsage: false,
|
|
@@ -40,7 +28,7 @@ var DEFAULT_CSV_LOADER_OPTIONS = {
|
|
|
40
28
|
delimitersToGuess: [',', '\t', '|', ';']
|
|
41
29
|
}
|
|
42
30
|
};
|
|
43
|
-
|
|
31
|
+
const CSVLoader = {
|
|
44
32
|
id: 'csv',
|
|
45
33
|
module: 'csv',
|
|
46
34
|
name: 'CSV',
|
|
@@ -48,128 +36,90 @@ var CSVLoader = {
|
|
|
48
36
|
extensions: ['csv', 'tsv', 'dsv'],
|
|
49
37
|
mimeTypes: ['text/csv', 'text/tab-separated-values', 'text/dsv'],
|
|
50
38
|
category: 'table',
|
|
51
|
-
parse:
|
|
52
|
-
|
|
53
|
-
return _regenerator.default.wrap(function _callee$(_context) {
|
|
54
|
-
while (1) {
|
|
55
|
-
switch (_context.prev = _context.next) {
|
|
56
|
-
case 0:
|
|
57
|
-
return _context.abrupt("return", parseCSV(new TextDecoder().decode(arrayBuffer), options));
|
|
58
|
-
|
|
59
|
-
case 1:
|
|
60
|
-
case "end":
|
|
61
|
-
return _context.stop();
|
|
62
|
-
}
|
|
63
|
-
}
|
|
64
|
-
}, _callee);
|
|
65
|
-
}));
|
|
66
|
-
|
|
67
|
-
function parse(_x, _x2) {
|
|
68
|
-
return _parse.apply(this, arguments);
|
|
69
|
-
}
|
|
70
|
-
|
|
71
|
-
return parse;
|
|
72
|
-
}(),
|
|
73
|
-
parseText: function parseText(text, options) {
|
|
74
|
-
return parseCSV(text, options);
|
|
75
|
-
},
|
|
39
|
+
parse: async (arrayBuffer, options) => parseCSV(new TextDecoder().decode(arrayBuffer), options),
|
|
40
|
+
parseText: (text, options) => parseCSV(text, options),
|
|
76
41
|
parseInBatches: parseCSVInBatches,
|
|
77
42
|
options: DEFAULT_CSV_LOADER_OPTIONS
|
|
78
43
|
};
|
|
79
44
|
exports.CSVLoader = CSVLoader;
|
|
80
45
|
|
|
81
|
-
function parseCSV(
|
|
82
|
-
|
|
83
|
-
|
|
46
|
+
async function parseCSV(csvText, options) {
|
|
47
|
+
const csvOptions = { ...DEFAULT_CSV_LOADER_OPTIONS.csv,
|
|
48
|
+
...(options === null || options === void 0 ? void 0 : options.csv)
|
|
49
|
+
};
|
|
50
|
+
const firstRow = readFirstRow(csvText);
|
|
51
|
+
const header = csvOptions.header === 'auto' ? isHeaderRow(firstRow) : Boolean(csvOptions.header);
|
|
52
|
+
const parseWithHeader = header;
|
|
53
|
+
const papaparseConfig = { ...csvOptions,
|
|
54
|
+
header: parseWithHeader,
|
|
55
|
+
download: false,
|
|
56
|
+
transformHeader: parseWithHeader ? duplicateColumnTransformer() : undefined,
|
|
57
|
+
error: e => {
|
|
58
|
+
throw new Error(e);
|
|
59
|
+
}
|
|
60
|
+
};
|
|
84
61
|
|
|
85
|
-
|
|
86
|
-
|
|
87
|
-
|
|
88
|
-
|
|
89
|
-
|
|
90
|
-
|
|
91
|
-
|
|
92
|
-
|
|
93
|
-
|
|
94
|
-
|
|
95
|
-
|
|
96
|
-
|
|
97
|
-
|
|
98
|
-
|
|
99
|
-
|
|
100
|
-
|
|
101
|
-
|
|
102
|
-
|
|
103
|
-
|
|
104
|
-
|
|
105
|
-
rows = result.data;
|
|
106
|
-
headerRow = result.meta.fields || generateHeader(csvOptions.columnPrefix, firstRow.length);
|
|
107
|
-
_context2.t0 = csvOptions.shape;
|
|
108
|
-
_context2.next = _context2.t0 === 'object-row-table' ? 11 : _context2.t0 === 'array-row-table' ? 13 : 15;
|
|
109
|
-
break;
|
|
110
|
-
|
|
111
|
-
case 11:
|
|
112
|
-
rows = rows.map(function (row) {
|
|
113
|
-
return Array.isArray(row) ? (0, _schema.convertToObjectRow)(row, headerRow) : row;
|
|
114
|
-
});
|
|
115
|
-
return _context2.abrupt("break", 15);
|
|
116
|
-
|
|
117
|
-
case 13:
|
|
118
|
-
rows = rows.map(function (row) {
|
|
119
|
-
return Array.isArray(row) ? row : (0, _schema.convertToArrayRow)(row, headerRow);
|
|
120
|
-
});
|
|
121
|
-
return _context2.abrupt("break", 15);
|
|
122
|
-
|
|
123
|
-
case 15:
|
|
124
|
-
return _context2.abrupt("return", rows);
|
|
125
|
-
|
|
126
|
-
case 16:
|
|
127
|
-
case "end":
|
|
128
|
-
return _context2.stop();
|
|
129
|
-
}
|
|
130
|
-
}
|
|
131
|
-
}, _callee2);
|
|
132
|
-
}));
|
|
133
|
-
return _parseCSV.apply(this, arguments);
|
|
62
|
+
const result = _papaparse.default.parse(csvText, papaparseConfig);
|
|
63
|
+
|
|
64
|
+
let {
|
|
65
|
+
data: rows
|
|
66
|
+
} = result;
|
|
67
|
+
const headerRow = result.meta.fields || generateHeader(csvOptions.columnPrefix, firstRow.length);
|
|
68
|
+
|
|
69
|
+
switch (csvOptions.shape) {
|
|
70
|
+
case 'object-row-table':
|
|
71
|
+
rows = rows.map(row => Array.isArray(row) ? (0, _schema.convertToObjectRow)(row, headerRow) : row);
|
|
72
|
+
break;
|
|
73
|
+
|
|
74
|
+
case 'array-row-table':
|
|
75
|
+
rows = rows.map(row => Array.isArray(row) ? row : (0, _schema.convertToArrayRow)(row, headerRow));
|
|
76
|
+
break;
|
|
77
|
+
|
|
78
|
+
default:
|
|
79
|
+
}
|
|
80
|
+
|
|
81
|
+
return rows;
|
|
134
82
|
}
|
|
135
83
|
|
|
136
84
|
function parseCSVInBatches(asyncIterator, options) {
|
|
137
85
|
var _options;
|
|
138
86
|
|
|
139
|
-
options =
|
|
87
|
+
options = { ...options
|
|
88
|
+
};
|
|
140
89
|
|
|
141
90
|
if (options.batchSize === 'auto') {
|
|
142
91
|
options.batchSize = 4000;
|
|
143
92
|
}
|
|
144
93
|
|
|
145
|
-
|
|
146
|
-
|
|
147
|
-
|
|
148
|
-
|
|
149
|
-
|
|
150
|
-
|
|
151
|
-
|
|
152
|
-
|
|
153
|
-
|
|
94
|
+
const csvOptions = { ...DEFAULT_CSV_LOADER_OPTIONS.csv,
|
|
95
|
+
...((_options = options) === null || _options === void 0 ? void 0 : _options.csv)
|
|
96
|
+
};
|
|
97
|
+
const asyncQueue = new _schema.AsyncQueue();
|
|
98
|
+
let isFirstRow = true;
|
|
99
|
+
let headerRow = null;
|
|
100
|
+
let tableBatchBuilder = null;
|
|
101
|
+
let schema = null;
|
|
102
|
+
const config = { ...csvOptions,
|
|
154
103
|
header: false,
|
|
155
104
|
download: false,
|
|
156
105
|
chunkSize: 1024 * 1024 * 5,
|
|
157
106
|
skipEmptyLines: false,
|
|
158
|
-
|
|
159
|
-
|
|
107
|
+
|
|
108
|
+
step(results) {
|
|
109
|
+
let row = results.data;
|
|
160
110
|
|
|
161
111
|
if (csvOptions.skipEmptyLines) {
|
|
162
|
-
|
|
112
|
+
const collapsedRow = row.flat().join('').trim();
|
|
163
113
|
|
|
164
114
|
if (collapsedRow === '') {
|
|
165
115
|
return;
|
|
166
116
|
}
|
|
167
117
|
}
|
|
168
118
|
|
|
169
|
-
|
|
119
|
+
const bytesUsed = results.meta.cursor;
|
|
170
120
|
|
|
171
121
|
if (isFirstRow && !headerRow) {
|
|
172
|
-
|
|
122
|
+
const header = csvOptions.header === 'auto' ? isHeaderRow(row) : Boolean(csvOptions.header);
|
|
173
123
|
|
|
174
124
|
if (header) {
|
|
175
125
|
headerRow = row.map(duplicateColumnTransformer());
|
|
@@ -191,14 +141,15 @@ function parseCSVInBatches(asyncIterator, options) {
|
|
|
191
141
|
row = JSON.parse(JSON.stringify(row));
|
|
192
142
|
}
|
|
193
143
|
|
|
194
|
-
tableBatchBuilder = tableBatchBuilder || new _schema.TableBatchBuilder(schema,
|
|
195
|
-
shape: csvOptions.shape || 'array-row-table'
|
|
196
|
-
|
|
144
|
+
tableBatchBuilder = tableBatchBuilder || new _schema.TableBatchBuilder(schema, {
|
|
145
|
+
shape: csvOptions.shape || 'array-row-table',
|
|
146
|
+
...options
|
|
147
|
+
});
|
|
197
148
|
|
|
198
149
|
try {
|
|
199
150
|
tableBatchBuilder.addRow(row);
|
|
200
|
-
|
|
201
|
-
bytesUsed
|
|
151
|
+
const batch = tableBatchBuilder && tableBatchBuilder.getFullBatch({
|
|
152
|
+
bytesUsed
|
|
202
153
|
});
|
|
203
154
|
|
|
204
155
|
if (batch) {
|
|
@@ -208,11 +159,12 @@ function parseCSVInBatches(asyncIterator, options) {
|
|
|
208
159
|
asyncQueue.enqueue(error);
|
|
209
160
|
}
|
|
210
161
|
},
|
|
211
|
-
|
|
162
|
+
|
|
163
|
+
complete(results) {
|
|
212
164
|
try {
|
|
213
|
-
|
|
214
|
-
|
|
215
|
-
bytesUsed
|
|
165
|
+
const bytesUsed = results.meta.cursor;
|
|
166
|
+
const batch = tableBatchBuilder && tableBatchBuilder.getFinalBatch({
|
|
167
|
+
bytesUsed
|
|
216
168
|
});
|
|
217
169
|
|
|
218
170
|
if (batch) {
|
|
@@ -224,7 +176,8 @@ function parseCSVInBatches(asyncIterator, options) {
|
|
|
224
176
|
|
|
225
177
|
asyncQueue.close();
|
|
226
178
|
}
|
|
227
|
-
|
|
179
|
+
|
|
180
|
+
};
|
|
228
181
|
|
|
229
182
|
_papaparse.default.parse(asyncIterator, config, _asyncIteratorStreamer.default);
|
|
230
183
|
|
|
@@ -232,13 +185,11 @@ function parseCSVInBatches(asyncIterator, options) {
|
|
|
232
185
|
}
|
|
233
186
|
|
|
234
187
|
function isHeaderRow(row) {
|
|
235
|
-
return row && row.every(
|
|
236
|
-
return typeof value === 'string';
|
|
237
|
-
});
|
|
188
|
+
return row && row.every(value => typeof value === 'string');
|
|
238
189
|
}
|
|
239
190
|
|
|
240
191
|
function readFirstRow(csvText) {
|
|
241
|
-
|
|
192
|
+
const result = _papaparse.default.parse(csvText, {
|
|
242
193
|
download: false,
|
|
243
194
|
dynamicTyping: true,
|
|
244
195
|
preview: 1
|
|
@@ -248,10 +199,10 @@ function readFirstRow(csvText) {
|
|
|
248
199
|
}
|
|
249
200
|
|
|
250
201
|
function duplicateColumnTransformer() {
|
|
251
|
-
|
|
252
|
-
return
|
|
253
|
-
|
|
254
|
-
|
|
202
|
+
const observedColumns = new Set();
|
|
203
|
+
return col => {
|
|
204
|
+
let colName = col;
|
|
205
|
+
let counter = 1;
|
|
255
206
|
|
|
256
207
|
while (observedColumns.has(colName)) {
|
|
257
208
|
colName = "".concat(col, ".").concat(counter);
|
|
@@ -263,11 +214,10 @@ function duplicateColumnTransformer() {
|
|
|
263
214
|
};
|
|
264
215
|
}
|
|
265
216
|
|
|
266
|
-
function generateHeader(columnPrefix) {
|
|
267
|
-
|
|
268
|
-
var headers = [];
|
|
217
|
+
function generateHeader(columnPrefix, count = 0) {
|
|
218
|
+
const headers = [];
|
|
269
219
|
|
|
270
|
-
for (
|
|
220
|
+
for (let i = 0; i < count; i++) {
|
|
271
221
|
headers.push("".concat(columnPrefix).concat(i + 1));
|
|
272
222
|
}
|
|
273
223
|
|
|
@@ -275,13 +225,13 @@ function generateHeader(columnPrefix) {
|
|
|
275
225
|
}
|
|
276
226
|
|
|
277
227
|
function deduceSchema(row, headerRow) {
|
|
278
|
-
|
|
228
|
+
const schema = headerRow ? {} : [];
|
|
279
229
|
|
|
280
|
-
for (
|
|
281
|
-
|
|
282
|
-
|
|
230
|
+
for (let i = 0; i < row.length; i++) {
|
|
231
|
+
const columnName = headerRow && headerRow[i] || i;
|
|
232
|
+
const value = row[i];
|
|
283
233
|
|
|
284
|
-
switch (
|
|
234
|
+
switch (typeof value) {
|
|
285
235
|
case 'number':
|
|
286
236
|
case 'boolean':
|
|
287
237
|
schema[columnName] = {
|
|
@@ -304,6 +254,6 @@ function deduceSchema(row, headerRow) {
|
|
|
304
254
|
return schema;
|
|
305
255
|
}
|
|
306
256
|
|
|
307
|
-
|
|
257
|
+
const _typecheckCSVLoader = CSVLoader;
|
|
308
258
|
exports._typecheckCSVLoader = _typecheckCSVLoader;
|
|
309
259
|
//# sourceMappingURL=csv-loader.js.map
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"sources":["../../src/csv-loader.ts"],"names":["VERSION","DEFAULT_CSV_LOADER_OPTIONS","csv","shape","optimizeMemoryUsage","header","columnPrefix","quoteChar","escapeChar","dynamicTyping","comments","skipEmptyLines","delimitersToGuess","CSVLoader","id","module","name","version","extensions","mimeTypes","category","parse","arrayBuffer","options","parseCSV","TextDecoder","decode","parseText","text","parseInBatches","parseCSVInBatches","csvText","csvOptions","firstRow","readFirstRow","isHeaderRow","Boolean","parseWithHeader","papaparseConfig","download","transformHeader","duplicateColumnTransformer","undefined","error","e","Error","result","Papa","rows","data","headerRow","meta","fields","generateHeader","length","map","row","Array","isArray","asyncIterator","batchSize","asyncQueue","AsyncQueue","isFirstRow","tableBatchBuilder","schema","config","chunkSize","step","results","collapsedRow","flat","join","trim","bytesUsed","cursor","deduceSchema","JSON","stringify","TableBatchBuilder","addRow","batch","getFullBatch","enqueue","complete","getFinalBatch","close","AsyncIteratorStreamer","every","value","preview","observedColumns","Set","col","colName","counter","has","add","count","headers","i","push","columnName","String","index","type","Float32Array","_typecheckCSVLoader"],"mappings":";;;;;;;;;;;;;;;;;AAIA;;AAMA;;AACA;;;;;;AAIA,IAAMA,OAAO,GAAG,2BAAuB,WAAvB,qBAAmD,QAAnE;AA0BA,IAAMC,0BAA0B,GAAG;AACjCC,EAAAA,GAAG,EAAE;AACHC,IAAAA,KAAK,EAAE,kBADJ;AAEHC,IAAAA,mBAAmB,EAAE,KAFlB;AAIHC,IAAAA,MAAM,EAAE,MAJL;AAKHC,IAAAA,YAAY,EAAE,QALX;AAQHC,IAAAA,SAAS,EAAE,GARR;AASHC,IAAAA,UAAU,EAAE,GATT;AAUHC,IAAAA,aAAa,EAAE,IAVZ;AAWHC,IAAAA,QAAQ,EAAE,KAXP;AAYHC,IAAAA,cAAc,EAAE,IAZb;AAcHC,IAAAA,iBAAiB,EAAE,CAAC,GAAD,EAAM,IAAN,EAAY,GAAZ,EAAiB,GAAjB;AAdhB;AAD4B,CAAnC;AAoBO,IAAMC,SAAS,GAAG;AACvBC,EAAAA,EAAE,EAAE,KADmB;AAEvBC,EAAAA,MAAM,EAAE,KAFe;AAGvBC,EAAAA,IAAI,EAAE,KAHiB;AAIvBC,EAAAA,OAAO,EAAEjB,OAJc;AAKvBkB,EAAAA,UAAU,EAAE,CAAC,KAAD,EAAQ,KAAR,EAAe,KAAf,CALW;AAMvBC,EAAAA,SAAS,EAAE,CAAC,UAAD,EAAa,2BAAb,EAA0C,UAA1C,CANY;AAOvBC,EAAAA,QAAQ,EAAE,OAPa;AAQvBC,EAAAA,KAAK;AAAA,2EAAE,iBAAOC,WAAP,EAAiCC,OAAjC;AAAA;AAAA;AAAA;AAAA;AAAA,+CACLC,QAAQ,CAAC,IAAIC,WAAJ,GAAkBC,MAAlB,CAAyBJ,WAAzB,CAAD,EAAwCC,OAAxC,CADH;;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA,KAAF;;AAAA;AAAA;AAAA;;AAAA;AAAA,KARkB;AAUvBI,EAAAA,SAAS,EAAE,mBAACC,IAAD,EAAeL,OAAf;AAAA,WAA8CC,QAAQ,CAACI,IAAD,EAAOL,OAAP,CAAtD;AAAA,GAVY;AAWvBM,EAAAA,cAAc,EAAEC,iBAXO;AAcvBP,EAAAA,OAAO,EAAEtB;AAdc,CAAlB;;;SAiBQuB,Q;;;;;wEAAf,kBAAwBO,OAAxB,EAAyCR,OAAzC;AAAA;AAAA;AAAA;AAAA;AAAA;AAEQS,YAAAA,UAFR,mCAEyB/B,0BAA0B,CAACC,GAFpD,GAE4DqB,OAF5D,aAE4DA,OAF5D,uBAE4DA,OAAO,CAAErB,GAFrE;AAIQ+B,YAAAA,QAJR,GAImBC,YAAY,CAACH,OAAD,CAJ/B;AAKQ1B,YAAAA,MALR,GAMI2B,UAAU,CAAC3B,MAAX,KAAsB,MAAtB,GAA+B8B,WAAW,CAACF,QAAD,CAA1C,GAAuDG,OAAO,CAACJ,UAAU,CAAC3B,MAAZ,CANlE;AAQQgC,YAAAA,eARR,GAQ0BhC,MAR1B;AAUQiC,YAAAA,eAVR,mCAYON,UAZP;AAaI3B,cAAAA,MAAM,EAAEgC,eAbZ;AAcIE,cAAAA,QAAQ,EAAE,KAdd;AAeIC,cAAAA,eAAe,EAAEH,eAAe,GAAGI,0BAA0B,EAA7B,GAAkCC,SAftE;AAgBIC,cAAAA,KAAK,EAAE,eAACC,CAAD,EAAO;AACZ,sBAAM,IAAIC,KAAJ,CAAUD,CAAV,CAAN;AACD;AAlBL;AAqBQE,YAAAA,MArBR,GAqBiBC,mBAAK1B,KAAL,CAAWU,OAAX,EAAoBO,eAApB,CArBjB;AAsBaU,YAAAA,IAtBb,GAsBqBF,MAtBrB,CAsBOG,IAtBP;AAwBQC,YAAAA,SAxBR,GAwBoBJ,MAAM,CAACK,IAAP,CAAYC,MAAZ,IAAsBC,cAAc,CAACrB,UAAU,CAAC1B,YAAZ,EAA0B2B,QAAQ,CAACqB,MAAnC,CAxBxD;AAAA,2BA0BUtB,UAAU,CAAC7B,KA1BrB;AAAA,8CA2BS,kBA3BT,yBA8BS,iBA9BT;AAAA;;AAAA;AA4BM6C,YAAAA,IAAI,GAAGA,IAAI,CAACO,GAAL,CAAS,UAACC,GAAD;AAAA,qBAAUC,KAAK,CAACC,OAAN,CAAcF,GAAd,IAAqB,gCAAmBA,GAAnB,EAAwBN,SAAxB,CAArB,GAA0DM,GAApE;AAAA,aAAT,CAAP;AA5BN;;AAAA;AA+BMR,YAAAA,IAAI,GAAGA,IAAI,CAACO,GAAL,CAAS,UAACC,GAAD;AAAA,qBAAUC,KAAK,CAACC,OAAN,CAAcF,GAAd,IAAqBA,GAArB,GAA2B,+BAAkBA,GAAlB,EAAuBN,SAAvB,CAArC;AAAA,aAAT,CAAP;AA/BN;;AAAA;AAAA,8CAgDSF,IAhDT;;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA,G;;;;AAoDA,SAASlB,iBAAT,CACE6B,aADF,EAEEpC,OAFF,EAGwB;AAAA;;AAGtBA,EAAAA,OAAO,qBAAOA,OAAP,CAAP;;AACA,MAAIA,OAAO,CAACqC,SAAR,KAAsB,MAA1B,EAAkC;AAChCrC,IAAAA,OAAO,CAACqC,SAAR,GAAoB,IAApB;AACD;;AAGD,MAAM5B,UAAU,mCAAO/B,0BAA0B,CAACC,GAAlC,eAA0CqB,OAA1C,6CAA0C,SAASrB,GAAnD,CAAhB;;AAEA,MAAM2D,UAAU,GAAG,IAAIC,kBAAJ,EAAnB;AAEA,MAAIC,UAAmB,GAAG,IAA1B;AACA,MAAIb,SAA0B,GAAG,IAAjC;AACA,MAAIc,iBAA2C,GAAG,IAAlD;AACA,MAAIC,MAAqB,GAAG,IAA5B;;AAEA,MAAMC,MAAM,mCAEPlC,UAFO;AAGV3B,IAAAA,MAAM,EAAE,KAHE;AAIVkC,IAAAA,QAAQ,EAAE,KAJA;AAQV4B,IAAAA,SAAS,EAAE,OAAO,IAAP,GAAc,CARf;AAcVxD,IAAAA,cAAc,EAAE,KAdN;AAkBVyD,IAAAA,IAlBU,gBAkBLC,OAlBK,EAkBI;AACZ,UAAIb,GAAG,GAAGa,OAAO,CAACpB,IAAlB;;AAEA,UAAIjB,UAAU,CAACrB,cAAf,EAA+B;AAE7B,YAAM2D,YAAY,GAAGd,GAAG,CAACe,IAAJ,GAAWC,IAAX,CAAgB,EAAhB,EAAoBC,IAApB,EAArB;;AACA,YAAIH,YAAY,KAAK,EAArB,EAAyB;AACvB;AACD;AACF;;AACD,UAAMI,SAAS,GAAGL,OAAO,CAAClB,IAAR,CAAawB,MAA/B;;AAGA,UAAIZ,UAAU,IAAI,CAACb,SAAnB,EAA8B;AAE5B,YAAM7C,MAAM,GAAG2B,UAAU,CAAC3B,MAAX,KAAsB,MAAtB,GAA+B8B,WAAW,CAACqB,GAAD,CAA1C,GAAkDpB,OAAO,CAACJ,UAAU,CAAC3B,MAAZ,CAAxE;;AACA,YAAIA,MAAJ,EAAY;AACV6C,UAAAA,SAAS,GAAGM,GAAG,CAACD,GAAJ,CAAQd,0BAA0B,EAAlC,CAAZ;AACA;AACD;AACF;;AAGD,UAAIsB,UAAJ,EAAgB;AACdA,QAAAA,UAAU,GAAG,KAAb;;AACA,YAAI,CAACb,SAAL,EAAgB;AACdA,UAAAA,SAAS,GAAGG,cAAc,CAACrB,UAAU,CAAC1B,YAAZ,EAA0BkD,GAAG,CAACF,MAA9B,CAA1B;AACD;;AACDW,QAAAA,MAAM,GAAGW,YAAY,CAACpB,GAAD,EAAMN,SAAN,CAArB;AACD;;AAED,UAAIlB,UAAU,CAAC5B,mBAAf,EAAoC;AAGlCoD,QAAAA,GAAG,GAAGqB,IAAI,CAACxD,KAAL,CAAWwD,IAAI,CAACC,SAAL,CAAetB,GAAf,CAAX,CAAN;AACD;;AAGDQ,MAAAA,iBAAiB,GACfA,iBAAiB,IACjB,IAAIe,yBAAJ,CAAsBd,MAAtB;AAEE9D,QAAAA,KAAK,EAAE6B,UAAU,CAAC7B,KAAX,IAAoB;AAF7B,SAGKoB,OAHL,EAFF;;AAQA,UAAI;AACFyC,QAAAA,iBAAiB,CAACgB,MAAlB,CAAyBxB,GAAzB;AAEA,YAAMyB,KAAK,GAAGjB,iBAAiB,IAAIA,iBAAiB,CAACkB,YAAlB,CAA+B;AAACR,UAAAA,SAAS,EAATA;AAAD,SAA/B,CAAnC;;AACA,YAAIO,KAAJ,EAAW;AACTpB,UAAAA,UAAU,CAACsB,OAAX,CAAmBF,KAAnB;AACD;AACF,OAPD,CAOE,OAAOtC,KAAP,EAAc;AACdkB,QAAAA,UAAU,CAACsB,OAAX,CAAmBxC,KAAnB;AACD;AACF,KA1ES;AA6EVyC,IAAAA,QA7EU,oBA6EDf,OA7EC,EA6EQ;AAChB,UAAI;AACF,YAAMK,SAAS,GAAGL,OAAO,CAAClB,IAAR,CAAawB,MAA/B;AAEA,YAAMM,KAAK,GAAGjB,iBAAiB,IAAIA,iBAAiB,CAACqB,aAAlB,CAAgC;AAACX,UAAAA,SAAS,EAATA;AAAD,SAAhC,CAAnC;;AACA,YAAIO,KAAJ,EAAW;AACTpB,UAAAA,UAAU,CAACsB,OAAX,CAAmBF,KAAnB;AACD;AACF,OAPD,CAOE,OAAOtC,KAAP,EAAc;AACdkB,QAAAA,UAAU,CAACsB,OAAX,CAAmBxC,KAAnB;AACD;;AAEDkB,MAAAA,UAAU,CAACyB,KAAX;AACD;AA1FS,IAAZ;;AA6FAvC,qBAAK1B,KAAL,CAAWsC,aAAX,EAA0BO,MAA1B,EAAkCqB,8BAAlC;;AAIA,SAAO1B,UAAP;AACD;;AAOD,SAAS1B,WAAT,CAAqBqB,GAArB,EAA6C;AAC3C,SAAOA,GAAG,IAAIA,GAAG,CAACgC,KAAJ,CAAU,UAACC,KAAD;AAAA,WAAW,OAAOA,KAAP,KAAiB,QAA5B;AAAA,GAAV,CAAd;AACD;;AAOD,SAASvD,YAAT,CAAsBH,OAAtB,EAA8C;AAC5C,MAAMe,MAAM,GAAGC,mBAAK1B,KAAL,CAAWU,OAAX,EAAoB;AACjCQ,IAAAA,QAAQ,EAAE,KADuB;AAEjC9B,IAAAA,aAAa,EAAE,IAFkB;AAGjCiF,IAAAA,OAAO,EAAE;AAHwB,GAApB,CAAf;;AAKA,SAAO5C,MAAM,CAACG,IAAP,CAAY,CAAZ,CAAP;AACD;;AAQD,SAASR,0BAAT,GAAsC;AACpC,MAAMkD,eAAe,GAAG,IAAIC,GAAJ,EAAxB;AACA,SAAO,UAACC,GAAD,EAAS;AACd,QAAIC,OAAO,GAAGD,GAAd;AACA,QAAIE,OAAO,GAAG,CAAd;;AACA,WAAOJ,eAAe,CAACK,GAAhB,CAAoBF,OAApB,CAAP,EAAqC;AACnCA,MAAAA,OAAO,aAAMD,GAAN,cAAaE,OAAb,CAAP;AACAA,MAAAA,OAAO;AACR;;AACDJ,IAAAA,eAAe,CAACM,GAAhB,CAAoBH,OAApB;AACA,WAAOA,OAAP;AACD,GATD;AAUD;;AAQD,SAASzC,cAAT,CAAwB/C,YAAxB,EAA2E;AAAA,MAA7B4F,KAA6B,uEAAb,CAAa;AACzE,MAAMC,OAAiB,GAAG,EAA1B;;AACA,OAAK,IAAIC,CAAC,GAAG,CAAb,EAAgBA,CAAC,GAAGF,KAApB,EAA2BE,CAAC,EAA5B,EAAgC;AAC9BD,IAAAA,OAAO,CAACE,IAAR,WAAgB/F,YAAhB,SAA+B8F,CAAC,GAAG,CAAnC;AACD;;AACD,SAAOD,OAAP;AACD;;AAED,SAASvB,YAAT,CAAsBpB,GAAtB,EAA2BN,SAA3B,EAAsC;AACpC,MAAMe,MAAM,GAAGf,SAAS,GAAG,EAAH,GAAQ,EAAhC;;AACA,OAAK,IAAIkD,CAAC,GAAG,CAAb,EAAgBA,CAAC,GAAG5C,GAAG,CAACF,MAAxB,EAAgC8C,CAAC,EAAjC,EAAqC;AACnC,QAAME,UAAU,GAAIpD,SAAS,IAAIA,SAAS,CAACkD,CAAD,CAAvB,IAA+BA,CAAlD;AACA,QAAMX,KAAK,GAAGjC,GAAG,CAAC4C,CAAD,CAAjB;;AACA,kCAAeX,KAAf;AACE,WAAK,QAAL;AACA,WAAK,SAAL;AAEExB,QAAAA,MAAM,CAACqC,UAAD,CAAN,GAAqB;AAACtF,UAAAA,IAAI,EAAEuF,MAAM,CAACD,UAAD,CAAb;AAA2BE,UAAAA,KAAK,EAAEJ,CAAlC;AAAqCK,UAAAA,IAAI,EAAEC;AAA3C,SAArB;AACA;;AACF,WAAK,QAAL;AACA;AACEzC,QAAAA,MAAM,CAACqC,UAAD,CAAN,GAAqB;AAACtF,UAAAA,IAAI,EAAEuF,MAAM,CAACD,UAAD,CAAb;AAA2BE,UAAAA,KAAK,EAAEJ,CAAlC;AAAqCK,UAAAA,IAAI,EAAEhD;AAA3C,SAArB;AARJ;AAYD;;AACD,SAAOQ,MAAP;AACD;;AAEM,IAAM0C,mBAAqC,GAAG9F,SAA9C","sourcesContent":["import type {LoaderWithParser, LoaderOptions} from '@loaders.gl/loader-utils';\nimport type {Batch} from '@loaders.gl/schema';\ntype Schema = any;\n\nimport {\n AsyncQueue,\n TableBatchBuilder,\n convertToArrayRow,\n convertToObjectRow\n} from '@loaders.gl/schema';\nimport Papa from './libs/papaparse';\nimport AsyncIteratorStreamer from './lib/async-iterator-streamer';\n\n// __VERSION__ is injected by babel-plugin-version-inline\n// @ts-ignore TS2304: Cannot find name '__VERSION__'.\nconst VERSION = typeof __VERSION__ !== 'undefined' ? __VERSION__ : 'latest';\n\nexport type CSVLoaderOptions = LoaderOptions & {\n csv?: {\n // loaders.gl options\n shape?: 'array-row-table' | 'object-row-table' | 'columnar-table';\n /** optimizes memory usage but increases parsing time. */\n optimizeMemoryUsage?: boolean;\n columnPrefix?: string;\n header?: 'auto';\n\n // CSV options (papaparse)\n // delimiter: auto\n // newline: auto\n quoteChar?: string;\n escapeChar?: string;\n // Convert numbers and boolean values in rows from strings\n dynamicTyping?: boolean;\n comments?: boolean;\n skipEmptyLines?: boolean | 'greedy';\n // transform: null?\n delimitersToGuess?: string[];\n // fastMode: auto\n };\n};\n\nconst DEFAULT_CSV_LOADER_OPTIONS = {\n csv: {\n shape: 'object-row-table',\n optimizeMemoryUsage: false,\n // CSV options\n header: 'auto',\n columnPrefix: 'column',\n // delimiter: auto\n // newline: auto\n quoteChar: '\"',\n escapeChar: '\"',\n dynamicTyping: true,\n comments: false,\n skipEmptyLines: true,\n // transform: null?\n delimitersToGuess: [',', '\\t', '|', ';']\n // fastMode: auto\n }\n};\n\nexport const CSVLoader = {\n id: 'csv',\n module: 'csv',\n name: 'CSV',\n version: VERSION,\n extensions: ['csv', 'tsv', 'dsv'],\n mimeTypes: ['text/csv', 'text/tab-separated-values', 'text/dsv'],\n category: 'table',\n parse: async (arrayBuffer: ArrayBuffer, options?: CSVLoaderOptions) =>\n parseCSV(new TextDecoder().decode(arrayBuffer), options),\n parseText: (text: string, options?: CSVLoaderOptions) => parseCSV(text, options),\n parseInBatches: parseCSVInBatches,\n // @ts-ignore\n // testText: null,\n options: DEFAULT_CSV_LOADER_OPTIONS as CSVLoaderOptions\n};\n\nasync function parseCSV(csvText: string, options?: CSVLoaderOptions) {\n // Apps can call the parse method directly, we so apply default options here\n const csvOptions = {...DEFAULT_CSV_LOADER_OPTIONS.csv, ...options?.csv};\n\n const firstRow = readFirstRow(csvText);\n const header: boolean =\n csvOptions.header === 'auto' ? isHeaderRow(firstRow) : Boolean(csvOptions.header);\n\n const parseWithHeader = header;\n\n const papaparseConfig = {\n // dynamicTyping: true,\n ...csvOptions,\n header: parseWithHeader,\n download: false, // We handle loading, no need for papaparse to do it for us\n transformHeader: parseWithHeader ? duplicateColumnTransformer() : undefined,\n error: (e) => {\n throw new Error(e);\n }\n };\n\n const result = Papa.parse(csvText, papaparseConfig);\n let {data: rows} = result;\n\n const headerRow = result.meta.fields || generateHeader(csvOptions.columnPrefix, firstRow.length);\n\n switch (csvOptions.shape) {\n case 'object-row-table':\n rows = rows.map((row) => (Array.isArray(row) ? convertToObjectRow(row, headerRow) : row));\n break;\n case 'array-row-table':\n rows = rows.map((row) => (Array.isArray(row) ? row : convertToArrayRow(row, headerRow)));\n break;\n default:\n }\n\n /*\n if (!header && shape === 'object-row-table') {\n // If the dataset has no header, transform the array result into an object shape with an\n // autogenerated header\n return result.data.map((row) =>\n row.reduce((acc, value, i) => {\n acc[headerRow[i]] = value;\n return acc;\n }, {})\n );\n }\n */\n return rows;\n}\n\n// TODO - support batch size 0 = no batching/single batch?\nfunction parseCSVInBatches(\n asyncIterator: AsyncIterable<ArrayBuffer> | Iterable<ArrayBuffer>,\n options?: CSVLoaderOptions\n): AsyncIterable<Batch> {\n // Papaparse does not support standard batch size handling\n // TODO - investigate papaparse chunks mode\n options = {...options};\n if (options.batchSize === 'auto') {\n options.batchSize = 4000;\n }\n\n // Apps can call the parse method directly, we so apply default options here\n const csvOptions = {...DEFAULT_CSV_LOADER_OPTIONS.csv, ...options?.csv};\n\n const asyncQueue = new AsyncQueue<Batch>();\n\n let isFirstRow: boolean = true;\n let headerRow: string[] | null = null;\n let tableBatchBuilder: TableBatchBuilder | null = null;\n let schema: Schema | null = null;\n\n const config = {\n // dynamicTyping: true, // Convert numbers and boolean values in rows from strings,\n ...csvOptions,\n header: false, // Unfortunately, header detection is not automatic and does not infer shapes\n download: false, // We handle loading, no need for papaparse to do it for us\n // chunkSize is set to 5MB explicitly (same as Papaparse default) due to a bug where the\n // streaming parser gets stuck if skipEmptyLines and a step callback are both supplied.\n // See https://github.com/mholt/PapaParse/issues/465\n chunkSize: 1024 * 1024 * 5,\n // skipEmptyLines is set to a boolean value if supplied. Greedy is set to true\n // skipEmptyLines is handled manually given two bugs where the streaming parser gets stuck if\n // both of the skipEmptyLines and step callback options are provided:\n // - true doesn't work unless chunkSize is set: https://github.com/mholt/PapaParse/issues/465\n // - greedy doesn't work: https://github.com/mholt/PapaParse/issues/825\n skipEmptyLines: false,\n\n // step is called on every row\n // eslint-disable-next-line complexity\n step(results) {\n let row = results.data;\n\n if (csvOptions.skipEmptyLines) {\n // Manually reject lines that are empty\n const collapsedRow = row.flat().join('').trim();\n if (collapsedRow === '') {\n return;\n }\n }\n const bytesUsed = results.meta.cursor;\n\n // Check if we need to save a header row\n if (isFirstRow && !headerRow) {\n // Auto detects or can be forced with csvOptions.header\n const header = csvOptions.header === 'auto' ? isHeaderRow(row) : Boolean(csvOptions.header);\n if (header) {\n headerRow = row.map(duplicateColumnTransformer());\n return;\n }\n }\n\n // If first data row, we can deduce the schema\n if (isFirstRow) {\n isFirstRow = false;\n if (!headerRow) {\n headerRow = generateHeader(csvOptions.columnPrefix, row.length);\n }\n schema = deduceSchema(row, headerRow);\n }\n\n if (csvOptions.optimizeMemoryUsage) {\n // A workaround to allocate new strings and don't retain pointers to original strings.\n // https://bugs.chromium.org/p/v8/issues/detail?id=2869\n row = JSON.parse(JSON.stringify(row));\n }\n\n // Add the row\n tableBatchBuilder =\n tableBatchBuilder ||\n new TableBatchBuilder(schema, {\n // @ts-expect-error\n shape: csvOptions.shape || 'array-row-table',\n ...options\n });\n\n try {\n tableBatchBuilder.addRow(row);\n // If a batch has been completed, emit it\n const batch = tableBatchBuilder && tableBatchBuilder.getFullBatch({bytesUsed});\n if (batch) {\n asyncQueue.enqueue(batch);\n }\n } catch (error) {\n asyncQueue.enqueue(error as Error);\n }\n },\n\n // complete is called when all rows have been read\n complete(results) {\n try {\n const bytesUsed = results.meta.cursor;\n // Ensure any final (partial) batch gets emitted\n const batch = tableBatchBuilder && tableBatchBuilder.getFinalBatch({bytesUsed});\n if (batch) {\n asyncQueue.enqueue(batch);\n }\n } catch (error) {\n asyncQueue.enqueue(error as Error);\n }\n\n asyncQueue.close();\n }\n };\n\n Papa.parse(asyncIterator, config, AsyncIteratorStreamer);\n\n // TODO - Does it matter if we return asyncIterable or asyncIterator\n // return asyncQueue[Symbol.asyncIterator]();\n return asyncQueue;\n}\n\n/**\n * Checks if a certain row is a header row\n * @param row the row to check\n * @returns true if the row looks like a header\n */\nfunction isHeaderRow(row: string[]): boolean {\n return row && row.every((value) => typeof value === 'string');\n}\n\n/**\n * Reads, parses, and returns the first row of a CSV text\n * @param csvText the csv text to parse\n * @returns the first row\n */\nfunction readFirstRow(csvText: string): any[] {\n const result = Papa.parse(csvText, {\n download: false,\n dynamicTyping: true,\n preview: 1\n });\n return result.data[0];\n}\n\n/**\n * Creates a transformer that renames duplicate columns. This is needed as Papaparse doesn't handle\n * duplicate header columns and would use the latest occurrence by default.\n * See the header option in https://www.papaparse.com/docs#config\n * @returns a transform function that returns sanitized names for duplicate fields\n */\nfunction duplicateColumnTransformer() {\n const observedColumns = new Set();\n return (col) => {\n let colName = col;\n let counter = 1;\n while (observedColumns.has(colName)) {\n colName = `${col}.${counter}`;\n counter++;\n }\n observedColumns.add(colName);\n return colName;\n };\n}\n\n/**\n * Generates the header of a CSV given a prefix and a column count\n * @param columnPrefix the columnPrefix to use\n * @param count the count of column names to generate\n * @returns an array of column names\n */\nfunction generateHeader(columnPrefix: string, count: number = 0): string[] {\n const headers: string[] = [];\n for (let i = 0; i < count; i++) {\n headers.push(`${columnPrefix}${i + 1}`);\n }\n return headers;\n}\n\nfunction deduceSchema(row, headerRow) {\n const schema = headerRow ? {} : [];\n for (let i = 0; i < row.length; i++) {\n const columnName = (headerRow && headerRow[i]) || i;\n const value = row[i];\n switch (typeof value) {\n case 'number':\n case 'boolean':\n // TODO - booleans could be handled differently...\n schema[columnName] = {name: String(columnName), index: i, type: Float32Array};\n break;\n case 'string':\n default:\n schema[columnName] = {name: String(columnName), index: i, type: Array};\n // We currently only handle numeric rows\n // TODO we could offer a function to map strings to numbers?\n }\n }\n return schema;\n}\n\nexport const _typecheckCSVLoader: LoaderWithParser = CSVLoader;\n"],"file":"csv-loader.js"}
|
|
1
|
+
{"version":3,"sources":["../../src/csv-loader.ts"],"names":["VERSION","DEFAULT_CSV_LOADER_OPTIONS","csv","shape","optimizeMemoryUsage","header","columnPrefix","quoteChar","escapeChar","dynamicTyping","comments","skipEmptyLines","delimitersToGuess","CSVLoader","id","module","name","version","extensions","mimeTypes","category","parse","arrayBuffer","options","parseCSV","TextDecoder","decode","parseText","text","parseInBatches","parseCSVInBatches","csvText","csvOptions","firstRow","readFirstRow","isHeaderRow","Boolean","parseWithHeader","papaparseConfig","download","transformHeader","duplicateColumnTransformer","undefined","error","e","Error","result","Papa","data","rows","headerRow","meta","fields","generateHeader","length","map","row","Array","isArray","asyncIterator","batchSize","asyncQueue","AsyncQueue","isFirstRow","tableBatchBuilder","schema","config","chunkSize","step","results","collapsedRow","flat","join","trim","bytesUsed","cursor","deduceSchema","JSON","stringify","TableBatchBuilder","addRow","batch","getFullBatch","enqueue","complete","getFinalBatch","close","AsyncIteratorStreamer","every","value","preview","observedColumns","Set","col","colName","counter","has","add","count","headers","i","push","columnName","String","index","type","Float32Array","_typecheckCSVLoader"],"mappings":";;;;;;;;;AAIA;;AAMA;;AACA;;AAIA,MAAMA,OAAO,GAAG,2BAAuB,WAAvB,qBAAmD,QAAnE;AA0BA,MAAMC,0BAA0B,GAAG;AACjCC,EAAAA,GAAG,EAAE;AACHC,IAAAA,KAAK,EAAE,kBADJ;AAEHC,IAAAA,mBAAmB,EAAE,KAFlB;AAIHC,IAAAA,MAAM,EAAE,MAJL;AAKHC,IAAAA,YAAY,EAAE,QALX;AAQHC,IAAAA,SAAS,EAAE,GARR;AASHC,IAAAA,UAAU,EAAE,GATT;AAUHC,IAAAA,aAAa,EAAE,IAVZ;AAWHC,IAAAA,QAAQ,EAAE,KAXP;AAYHC,IAAAA,cAAc,EAAE,IAZb;AAcHC,IAAAA,iBAAiB,EAAE,CAAC,GAAD,EAAM,IAAN,EAAY,GAAZ,EAAiB,GAAjB;AAdhB;AAD4B,CAAnC;AAoBO,MAAMC,SAAS,GAAG;AACvBC,EAAAA,EAAE,EAAE,KADmB;AAEvBC,EAAAA,MAAM,EAAE,KAFe;AAGvBC,EAAAA,IAAI,EAAE,KAHiB;AAIvBC,EAAAA,OAAO,EAAEjB,OAJc;AAKvBkB,EAAAA,UAAU,EAAE,CAAC,KAAD,EAAQ,KAAR,EAAe,KAAf,CALW;AAMvBC,EAAAA,SAAS,EAAE,CAAC,UAAD,EAAa,2BAAb,EAA0C,UAA1C,CANY;AAOvBC,EAAAA,QAAQ,EAAE,OAPa;AAQvBC,EAAAA,KAAK,EAAE,OAAOC,WAAP,EAAiCC,OAAjC,KACLC,QAAQ,CAAC,IAAIC,WAAJ,GAAkBC,MAAlB,CAAyBJ,WAAzB,CAAD,EAAwCC,OAAxC,CATa;AAUvBI,EAAAA,SAAS,EAAE,CAACC,IAAD,EAAeL,OAAf,KAA8CC,QAAQ,CAACI,IAAD,EAAOL,OAAP,CAV1C;AAWvBM,EAAAA,cAAc,EAAEC,iBAXO;AAcvBP,EAAAA,OAAO,EAAEtB;AAdc,CAAlB;;;AAiBP,eAAeuB,QAAf,CAAwBO,OAAxB,EAAyCR,OAAzC,EAAqE;AAEnE,QAAMS,UAAU,GAAG,EAAC,GAAG/B,0BAA0B,CAACC,GAA/B;AAAoC,QAAGqB,OAAH,aAAGA,OAAH,uBAAGA,OAAO,CAAErB,GAAZ;AAApC,GAAnB;AAEA,QAAM+B,QAAQ,GAAGC,YAAY,CAACH,OAAD,CAA7B;AACA,QAAM1B,MAAe,GACnB2B,UAAU,CAAC3B,MAAX,KAAsB,MAAtB,GAA+B8B,WAAW,CAACF,QAAD,CAA1C,GAAuDG,OAAO,CAACJ,UAAU,CAAC3B,MAAZ,CADhE;AAGA,QAAMgC,eAAe,GAAGhC,MAAxB;AAEA,QAAMiC,eAAe,GAAG,EAEtB,GAAGN,UAFmB;AAGtB3B,IAAAA,MAAM,EAAEgC,eAHc;AAItBE,IAAAA,QAAQ,EAAE,KAJY;AAKtBC,IAAAA,eAAe,EAAEH,eAAe,GAAGI,0BAA0B,EAA7B,GAAkCC,SAL5C;AAMtBC,IAAAA,KAAK,EAAGC,CAAD,IAAO;AACZ,YAAM,IAAIC,KAAJ,CAAUD,CAAV,CAAN;AACD;AARqB,GAAxB;;AAWA,QAAME,MAAM,GAAGC,mBAAK1B,KAAL,CAAWU,OAAX,EAAoBO,eAApB,CAAf;;AACA,MAAI;AAACU,IAAAA,IAAI,EAAEC;AAAP,MAAeH,MAAnB;AAEA,QAAMI,SAAS,GAAGJ,MAAM,CAACK,IAAP,CAAYC,MAAZ,IAAsBC,cAAc,CAACrB,UAAU,CAAC1B,YAAZ,EAA0B2B,QAAQ,CAACqB,MAAnC,CAAtD;;AAEA,UAAQtB,UAAU,CAAC7B,KAAnB;AACE,SAAK,kBAAL;AACE8C,MAAAA,IAAI,GAAGA,IAAI,CAACM,GAAL,CAAUC,GAAD,IAAUC,KAAK,CAACC,OAAN,CAAcF,GAAd,IAAqB,gCAAmBA,GAAnB,EAAwBN,SAAxB,CAArB,GAA0DM,GAA7E,CAAP;AACA;;AACF,SAAK,iBAAL;AACEP,MAAAA,IAAI,GAAGA,IAAI,CAACM,GAAL,CAAUC,GAAD,IAAUC,KAAK,CAACC,OAAN,CAAcF,GAAd,IAAqBA,GAArB,GAA2B,+BAAkBA,GAAlB,EAAuBN,SAAvB,CAA9C,CAAP;AACA;;AACF;AAPF;;AAsBA,SAAOD,IAAP;AACD;;AAGD,SAASnB,iBAAT,CACE6B,aADF,EAEEpC,OAFF,EAGwB;AAAA;;AAGtBA,EAAAA,OAAO,GAAG,EAAC,GAAGA;AAAJ,GAAV;;AACA,MAAIA,OAAO,CAACqC,SAAR,KAAsB,MAA1B,EAAkC;AAChCrC,IAAAA,OAAO,CAACqC,SAAR,GAAoB,IAApB;AACD;;AAGD,QAAM5B,UAAU,GAAG,EAAC,GAAG/B,0BAA0B,CAACC,GAA/B;AAAoC,oBAAGqB,OAAH,6CAAG,SAASrB,GAAZ;AAApC,GAAnB;AAEA,QAAM2D,UAAU,GAAG,IAAIC,kBAAJ,EAAnB;AAEA,MAAIC,UAAmB,GAAG,IAA1B;AACA,MAAIb,SAA0B,GAAG,IAAjC;AACA,MAAIc,iBAA2C,GAAG,IAAlD;AACA,MAAIC,MAAqB,GAAG,IAA5B;AAEA,QAAMC,MAAM,GAAG,EAEb,GAAGlC,UAFU;AAGb3B,IAAAA,MAAM,EAAE,KAHK;AAIbkC,IAAAA,QAAQ,EAAE,KAJG;AAQb4B,IAAAA,SAAS,EAAE,OAAO,IAAP,GAAc,CARZ;AAcbxD,IAAAA,cAAc,EAAE,KAdH;;AAkBbyD,IAAAA,IAAI,CAACC,OAAD,EAAU;AACZ,UAAIb,GAAG,GAAGa,OAAO,CAACrB,IAAlB;;AAEA,UAAIhB,UAAU,CAACrB,cAAf,EAA+B;AAE7B,cAAM2D,YAAY,GAAGd,GAAG,CAACe,IAAJ,GAAWC,IAAX,CAAgB,EAAhB,EAAoBC,IAApB,EAArB;;AACA,YAAIH,YAAY,KAAK,EAArB,EAAyB;AACvB;AACD;AACF;;AACD,YAAMI,SAAS,GAAGL,OAAO,CAAClB,IAAR,CAAawB,MAA/B;;AAGA,UAAIZ,UAAU,IAAI,CAACb,SAAnB,EAA8B;AAE5B,cAAM7C,MAAM,GAAG2B,UAAU,CAAC3B,MAAX,KAAsB,MAAtB,GAA+B8B,WAAW,CAACqB,GAAD,CAA1C,GAAkDpB,OAAO,CAACJ,UAAU,CAAC3B,MAAZ,CAAxE;;AACA,YAAIA,MAAJ,EAAY;AACV6C,UAAAA,SAAS,GAAGM,GAAG,CAACD,GAAJ,CAAQd,0BAA0B,EAAlC,CAAZ;AACA;AACD;AACF;;AAGD,UAAIsB,UAAJ,EAAgB;AACdA,QAAAA,UAAU,GAAG,KAAb;;AACA,YAAI,CAACb,SAAL,EAAgB;AACdA,UAAAA,SAAS,GAAGG,cAAc,CAACrB,UAAU,CAAC1B,YAAZ,EAA0BkD,GAAG,CAACF,MAA9B,CAA1B;AACD;;AACDW,QAAAA,MAAM,GAAGW,YAAY,CAACpB,GAAD,EAAMN,SAAN,CAArB;AACD;;AAED,UAAIlB,UAAU,CAAC5B,mBAAf,EAAoC;AAGlCoD,QAAAA,GAAG,GAAGqB,IAAI,CAACxD,KAAL,CAAWwD,IAAI,CAACC,SAAL,CAAetB,GAAf,CAAX,CAAN;AACD;;AAGDQ,MAAAA,iBAAiB,GACfA,iBAAiB,IACjB,IAAIe,yBAAJ,CAAsBd,MAAtB,EAA8B;AAE5B9D,QAAAA,KAAK,EAAE6B,UAAU,CAAC7B,KAAX,IAAoB,iBAFC;AAG5B,WAAGoB;AAHyB,OAA9B,CAFF;;AAQA,UAAI;AACFyC,QAAAA,iBAAiB,CAACgB,MAAlB,CAAyBxB,GAAzB;AAEA,cAAMyB,KAAK,GAAGjB,iBAAiB,IAAIA,iBAAiB,CAACkB,YAAlB,CAA+B;AAACR,UAAAA;AAAD,SAA/B,CAAnC;;AACA,YAAIO,KAAJ,EAAW;AACTpB,UAAAA,UAAU,CAACsB,OAAX,CAAmBF,KAAnB;AACD;AACF,OAPD,CAOE,OAAOtC,KAAP,EAAc;AACdkB,QAAAA,UAAU,CAACsB,OAAX,CAAmBxC,KAAnB;AACD;AACF,KA1EY;;AA6EbyC,IAAAA,QAAQ,CAACf,OAAD,EAAU;AAChB,UAAI;AACF,cAAMK,SAAS,GAAGL,OAAO,CAAClB,IAAR,CAAawB,MAA/B;AAEA,cAAMM,KAAK,GAAGjB,iBAAiB,IAAIA,iBAAiB,CAACqB,aAAlB,CAAgC;AAACX,UAAAA;AAAD,SAAhC,CAAnC;;AACA,YAAIO,KAAJ,EAAW;AACTpB,UAAAA,UAAU,CAACsB,OAAX,CAAmBF,KAAnB;AACD;AACF,OAPD,CAOE,OAAOtC,KAAP,EAAc;AACdkB,QAAAA,UAAU,CAACsB,OAAX,CAAmBxC,KAAnB;AACD;;AAEDkB,MAAAA,UAAU,CAACyB,KAAX;AACD;;AA1FY,GAAf;;AA6FAvC,qBAAK1B,KAAL,CAAWsC,aAAX,EAA0BO,MAA1B,EAAkCqB,8BAAlC;;AAIA,SAAO1B,UAAP;AACD;;AAOD,SAAS1B,WAAT,CAAqBqB,GAArB,EAA6C;AAC3C,SAAOA,GAAG,IAAIA,GAAG,CAACgC,KAAJ,CAAWC,KAAD,IAAW,OAAOA,KAAP,KAAiB,QAAtC,CAAd;AACD;;AAOD,SAASvD,YAAT,CAAsBH,OAAtB,EAA8C;AAC5C,QAAMe,MAAM,GAAGC,mBAAK1B,KAAL,CAAWU,OAAX,EAAoB;AACjCQ,IAAAA,QAAQ,EAAE,KADuB;AAEjC9B,IAAAA,aAAa,EAAE,IAFkB;AAGjCiF,IAAAA,OAAO,EAAE;AAHwB,GAApB,CAAf;;AAKA,SAAO5C,MAAM,CAACE,IAAP,CAAY,CAAZ,CAAP;AACD;;AAQD,SAASP,0BAAT,GAAsC;AACpC,QAAMkD,eAAe,GAAG,IAAIC,GAAJ,EAAxB;AACA,SAAQC,GAAD,IAAS;AACd,QAAIC,OAAO,GAAGD,GAAd;AACA,QAAIE,OAAO,GAAG,CAAd;;AACA,WAAOJ,eAAe,CAACK,GAAhB,CAAoBF,OAApB,CAAP,EAAqC;AACnCA,MAAAA,OAAO,aAAMD,GAAN,cAAaE,OAAb,CAAP;AACAA,MAAAA,OAAO;AACR;;AACDJ,IAAAA,eAAe,CAACM,GAAhB,CAAoBH,OAApB;AACA,WAAOA,OAAP;AACD,GATD;AAUD;;AAQD,SAASzC,cAAT,CAAwB/C,YAAxB,EAA8C4F,KAAa,GAAG,CAA9D,EAA2E;AACzE,QAAMC,OAAiB,GAAG,EAA1B;;AACA,OAAK,IAAIC,CAAC,GAAG,CAAb,EAAgBA,CAAC,GAAGF,KAApB,EAA2BE,CAAC,EAA5B,EAAgC;AAC9BD,IAAAA,OAAO,CAACE,IAAR,WAAgB/F,YAAhB,SAA+B8F,CAAC,GAAG,CAAnC;AACD;;AACD,SAAOD,OAAP;AACD;;AAED,SAASvB,YAAT,CAAsBpB,GAAtB,EAA2BN,SAA3B,EAAsC;AACpC,QAAMe,MAAM,GAAGf,SAAS,GAAG,EAAH,GAAQ,EAAhC;;AACA,OAAK,IAAIkD,CAAC,GAAG,CAAb,EAAgBA,CAAC,GAAG5C,GAAG,CAACF,MAAxB,EAAgC8C,CAAC,EAAjC,EAAqC;AACnC,UAAME,UAAU,GAAIpD,SAAS,IAAIA,SAAS,CAACkD,CAAD,CAAvB,IAA+BA,CAAlD;AACA,UAAMX,KAAK,GAAGjC,GAAG,CAAC4C,CAAD,CAAjB;;AACA,YAAQ,OAAOX,KAAf;AACE,WAAK,QAAL;AACA,WAAK,SAAL;AAEExB,QAAAA,MAAM,CAACqC,UAAD,CAAN,GAAqB;AAACtF,UAAAA,IAAI,EAAEuF,MAAM,CAACD,UAAD,CAAb;AAA2BE,UAAAA,KAAK,EAAEJ,CAAlC;AAAqCK,UAAAA,IAAI,EAAEC;AAA3C,SAArB;AACA;;AACF,WAAK,QAAL;AACA;AACEzC,QAAAA,MAAM,CAACqC,UAAD,CAAN,GAAqB;AAACtF,UAAAA,IAAI,EAAEuF,MAAM,CAACD,UAAD,CAAb;AAA2BE,UAAAA,KAAK,EAAEJ,CAAlC;AAAqCK,UAAAA,IAAI,EAAEhD;AAA3C,SAArB;AARJ;AAYD;;AACD,SAAOQ,MAAP;AACD;;AAEM,MAAM0C,mBAAqC,GAAG9F,SAA9C","sourcesContent":["import type {LoaderWithParser, LoaderOptions} from '@loaders.gl/loader-utils';\nimport type {Batch} from '@loaders.gl/schema';\ntype Schema = any;\n\nimport {\n AsyncQueue,\n TableBatchBuilder,\n convertToArrayRow,\n convertToObjectRow\n} from '@loaders.gl/schema';\nimport Papa from './libs/papaparse';\nimport AsyncIteratorStreamer from './lib/async-iterator-streamer';\n\n// __VERSION__ is injected by babel-plugin-version-inline\n// @ts-ignore TS2304: Cannot find name '__VERSION__'.\nconst VERSION = typeof __VERSION__ !== 'undefined' ? __VERSION__ : 'latest';\n\nexport type CSVLoaderOptions = LoaderOptions & {\n csv?: {\n // loaders.gl options\n shape?: 'array-row-table' | 'object-row-table' | 'columnar-table';\n /** optimizes memory usage but increases parsing time. */\n optimizeMemoryUsage?: boolean;\n columnPrefix?: string;\n header?: 'auto';\n\n // CSV options (papaparse)\n // delimiter: auto\n // newline: auto\n quoteChar?: string;\n escapeChar?: string;\n // Convert numbers and boolean values in rows from strings\n dynamicTyping?: boolean;\n comments?: boolean;\n skipEmptyLines?: boolean | 'greedy';\n // transform: null?\n delimitersToGuess?: string[];\n // fastMode: auto\n };\n};\n\nconst DEFAULT_CSV_LOADER_OPTIONS = {\n csv: {\n shape: 'object-row-table',\n optimizeMemoryUsage: false,\n // CSV options\n header: 'auto',\n columnPrefix: 'column',\n // delimiter: auto\n // newline: auto\n quoteChar: '\"',\n escapeChar: '\"',\n dynamicTyping: true,\n comments: false,\n skipEmptyLines: true,\n // transform: null?\n delimitersToGuess: [',', '\\t', '|', ';']\n // fastMode: auto\n }\n};\n\nexport const CSVLoader = {\n id: 'csv',\n module: 'csv',\n name: 'CSV',\n version: VERSION,\n extensions: ['csv', 'tsv', 'dsv'],\n mimeTypes: ['text/csv', 'text/tab-separated-values', 'text/dsv'],\n category: 'table',\n parse: async (arrayBuffer: ArrayBuffer, options?: CSVLoaderOptions) =>\n parseCSV(new TextDecoder().decode(arrayBuffer), options),\n parseText: (text: string, options?: CSVLoaderOptions) => parseCSV(text, options),\n parseInBatches: parseCSVInBatches,\n // @ts-ignore\n // testText: null,\n options: DEFAULT_CSV_LOADER_OPTIONS as CSVLoaderOptions\n};\n\nasync function parseCSV(csvText: string, options?: CSVLoaderOptions) {\n // Apps can call the parse method directly, we so apply default options here\n const csvOptions = {...DEFAULT_CSV_LOADER_OPTIONS.csv, ...options?.csv};\n\n const firstRow = readFirstRow(csvText);\n const header: boolean =\n csvOptions.header === 'auto' ? isHeaderRow(firstRow) : Boolean(csvOptions.header);\n\n const parseWithHeader = header;\n\n const papaparseConfig = {\n // dynamicTyping: true,\n ...csvOptions,\n header: parseWithHeader,\n download: false, // We handle loading, no need for papaparse to do it for us\n transformHeader: parseWithHeader ? duplicateColumnTransformer() : undefined,\n error: (e) => {\n throw new Error(e);\n }\n };\n\n const result = Papa.parse(csvText, papaparseConfig);\n let {data: rows} = result;\n\n const headerRow = result.meta.fields || generateHeader(csvOptions.columnPrefix, firstRow.length);\n\n switch (csvOptions.shape) {\n case 'object-row-table':\n rows = rows.map((row) => (Array.isArray(row) ? convertToObjectRow(row, headerRow) : row));\n break;\n case 'array-row-table':\n rows = rows.map((row) => (Array.isArray(row) ? row : convertToArrayRow(row, headerRow)));\n break;\n default:\n }\n\n /*\n if (!header && shape === 'object-row-table') {\n // If the dataset has no header, transform the array result into an object shape with an\n // autogenerated header\n return result.data.map((row) =>\n row.reduce((acc, value, i) => {\n acc[headerRow[i]] = value;\n return acc;\n }, {})\n );\n }\n */\n return rows;\n}\n\n// TODO - support batch size 0 = no batching/single batch?\nfunction parseCSVInBatches(\n asyncIterator: AsyncIterable<ArrayBuffer> | Iterable<ArrayBuffer>,\n options?: CSVLoaderOptions\n): AsyncIterable<Batch> {\n // Papaparse does not support standard batch size handling\n // TODO - investigate papaparse chunks mode\n options = {...options};\n if (options.batchSize === 'auto') {\n options.batchSize = 4000;\n }\n\n // Apps can call the parse method directly, we so apply default options here\n const csvOptions = {...DEFAULT_CSV_LOADER_OPTIONS.csv, ...options?.csv};\n\n const asyncQueue = new AsyncQueue<Batch>();\n\n let isFirstRow: boolean = true;\n let headerRow: string[] | null = null;\n let tableBatchBuilder: TableBatchBuilder | null = null;\n let schema: Schema | null = null;\n\n const config = {\n // dynamicTyping: true, // Convert numbers and boolean values in rows from strings,\n ...csvOptions,\n header: false, // Unfortunately, header detection is not automatic and does not infer shapes\n download: false, // We handle loading, no need for papaparse to do it for us\n // chunkSize is set to 5MB explicitly (same as Papaparse default) due to a bug where the\n // streaming parser gets stuck if skipEmptyLines and a step callback are both supplied.\n // See https://github.com/mholt/PapaParse/issues/465\n chunkSize: 1024 * 1024 * 5,\n // skipEmptyLines is set to a boolean value if supplied. Greedy is set to true\n // skipEmptyLines is handled manually given two bugs where the streaming parser gets stuck if\n // both of the skipEmptyLines and step callback options are provided:\n // - true doesn't work unless chunkSize is set: https://github.com/mholt/PapaParse/issues/465\n // - greedy doesn't work: https://github.com/mholt/PapaParse/issues/825\n skipEmptyLines: false,\n\n // step is called on every row\n // eslint-disable-next-line complexity\n step(results) {\n let row = results.data;\n\n if (csvOptions.skipEmptyLines) {\n // Manually reject lines that are empty\n const collapsedRow = row.flat().join('').trim();\n if (collapsedRow === '') {\n return;\n }\n }\n const bytesUsed = results.meta.cursor;\n\n // Check if we need to save a header row\n if (isFirstRow && !headerRow) {\n // Auto detects or can be forced with csvOptions.header\n const header = csvOptions.header === 'auto' ? isHeaderRow(row) : Boolean(csvOptions.header);\n if (header) {\n headerRow = row.map(duplicateColumnTransformer());\n return;\n }\n }\n\n // If first data row, we can deduce the schema\n if (isFirstRow) {\n isFirstRow = false;\n if (!headerRow) {\n headerRow = generateHeader(csvOptions.columnPrefix, row.length);\n }\n schema = deduceSchema(row, headerRow);\n }\n\n if (csvOptions.optimizeMemoryUsage) {\n // A workaround to allocate new strings and don't retain pointers to original strings.\n // https://bugs.chromium.org/p/v8/issues/detail?id=2869\n row = JSON.parse(JSON.stringify(row));\n }\n\n // Add the row\n tableBatchBuilder =\n tableBatchBuilder ||\n new TableBatchBuilder(schema, {\n // @ts-expect-error\n shape: csvOptions.shape || 'array-row-table',\n ...options\n });\n\n try {\n tableBatchBuilder.addRow(row);\n // If a batch has been completed, emit it\n const batch = tableBatchBuilder && tableBatchBuilder.getFullBatch({bytesUsed});\n if (batch) {\n asyncQueue.enqueue(batch);\n }\n } catch (error) {\n asyncQueue.enqueue(error as Error);\n }\n },\n\n // complete is called when all rows have been read\n complete(results) {\n try {\n const bytesUsed = results.meta.cursor;\n // Ensure any final (partial) batch gets emitted\n const batch = tableBatchBuilder && tableBatchBuilder.getFinalBatch({bytesUsed});\n if (batch) {\n asyncQueue.enqueue(batch);\n }\n } catch (error) {\n asyncQueue.enqueue(error as Error);\n }\n\n asyncQueue.close();\n }\n };\n\n Papa.parse(asyncIterator, config, AsyncIteratorStreamer);\n\n // TODO - Does it matter if we return asyncIterable or asyncIterator\n // return asyncQueue[Symbol.asyncIterator]();\n return asyncQueue;\n}\n\n/**\n * Checks if a certain row is a header row\n * @param row the row to check\n * @returns true if the row looks like a header\n */\nfunction isHeaderRow(row: string[]): boolean {\n return row && row.every((value) => typeof value === 'string');\n}\n\n/**\n * Reads, parses, and returns the first row of a CSV text\n * @param csvText the csv text to parse\n * @returns the first row\n */\nfunction readFirstRow(csvText: string): any[] {\n const result = Papa.parse(csvText, {\n download: false,\n dynamicTyping: true,\n preview: 1\n });\n return result.data[0];\n}\n\n/**\n * Creates a transformer that renames duplicate columns. This is needed as Papaparse doesn't handle\n * duplicate header columns and would use the latest occurrence by default.\n * See the header option in https://www.papaparse.com/docs#config\n * @returns a transform function that returns sanitized names for duplicate fields\n */\nfunction duplicateColumnTransformer() {\n const observedColumns = new Set();\n return (col) => {\n let colName = col;\n let counter = 1;\n while (observedColumns.has(colName)) {\n colName = `${col}.${counter}`;\n counter++;\n }\n observedColumns.add(colName);\n return colName;\n };\n}\n\n/**\n * Generates the header of a CSV given a prefix and a column count\n * @param columnPrefix the columnPrefix to use\n * @param count the count of column names to generate\n * @returns an array of column names\n */\nfunction generateHeader(columnPrefix: string, count: number = 0): string[] {\n const headers: string[] = [];\n for (let i = 0; i < count; i++) {\n headers.push(`${columnPrefix}${i + 1}`);\n }\n return headers;\n}\n\nfunction deduceSchema(row, headerRow) {\n const schema = headerRow ? {} : [];\n for (let i = 0; i < row.length; i++) {\n const columnName = (headerRow && headerRow[i]) || i;\n const value = row[i];\n switch (typeof value) {\n case 'number':\n case 'boolean':\n // TODO - booleans could be handled differently...\n schema[columnName] = {name: String(columnName), index: i, type: Float32Array};\n break;\n case 'string':\n default:\n schema[columnName] = {name: String(columnName), index: i, type: Array};\n // We currently only handle numeric rows\n // TODO we could offer a function to map strings to numbers?\n }\n }\n return schema;\n}\n\nexport const _typecheckCSVLoader: LoaderWithParser = CSVLoader;\n"],"file":"csv-loader.js"}
|
package/dist/es5/index.js
CHANGED
|
@@ -7,124 +7,31 @@ Object.defineProperty(exports, "__esModule", {
|
|
|
7
7
|
});
|
|
8
8
|
exports.default = AsyncIteratorStreamer;
|
|
9
9
|
|
|
10
|
-
var _regenerator = _interopRequireDefault(require("@babel/runtime/regenerator"));
|
|
11
|
-
|
|
12
|
-
var _asyncToGenerator2 = _interopRequireDefault(require("@babel/runtime/helpers/asyncToGenerator"));
|
|
13
|
-
|
|
14
|
-
var _asyncIterator2 = _interopRequireDefault(require("@babel/runtime/helpers/asyncIterator"));
|
|
15
|
-
|
|
16
10
|
var _papaparse = _interopRequireDefault(require("../libs/papaparse"));
|
|
17
11
|
|
|
18
|
-
|
|
12
|
+
const {
|
|
13
|
+
ChunkStreamer
|
|
14
|
+
} = _papaparse.default;
|
|
19
15
|
|
|
20
16
|
function AsyncIteratorStreamer(config) {
|
|
21
17
|
config = config || {};
|
|
22
18
|
ChunkStreamer.call(this, config);
|
|
23
19
|
this.textDecoder = new TextDecoder(this._config.encoding);
|
|
24
20
|
|
|
25
|
-
this.stream = function () {
|
|
26
|
-
|
|
27
|
-
var _iteratorNormalCompletion, _didIteratorError, _iteratorError, _iterator, _step, _value, chunk;
|
|
28
|
-
|
|
29
|
-
return _regenerator.default.wrap(function _callee$(_context) {
|
|
30
|
-
while (1) {
|
|
31
|
-
switch (_context.prev = _context.next) {
|
|
32
|
-
case 0:
|
|
33
|
-
this._input = asyncIterator;
|
|
34
|
-
_context.prev = 1;
|
|
35
|
-
_iteratorNormalCompletion = true;
|
|
36
|
-
_didIteratorError = false;
|
|
37
|
-
_context.prev = 4;
|
|
38
|
-
_iterator = (0, _asyncIterator2.default)(asyncIterator);
|
|
39
|
-
|
|
40
|
-
case 6:
|
|
41
|
-
_context.next = 8;
|
|
42
|
-
return _iterator.next();
|
|
43
|
-
|
|
44
|
-
case 8:
|
|
45
|
-
_step = _context.sent;
|
|
46
|
-
_iteratorNormalCompletion = _step.done;
|
|
47
|
-
_context.next = 12;
|
|
48
|
-
return _step.value;
|
|
49
|
-
|
|
50
|
-
case 12:
|
|
51
|
-
_value = _context.sent;
|
|
52
|
-
|
|
53
|
-
if (_iteratorNormalCompletion) {
|
|
54
|
-
_context.next = 19;
|
|
55
|
-
break;
|
|
56
|
-
}
|
|
57
|
-
|
|
58
|
-
chunk = _value;
|
|
59
|
-
this.parseChunk(this.getStringChunk(chunk));
|
|
60
|
-
|
|
61
|
-
case 16:
|
|
62
|
-
_iteratorNormalCompletion = true;
|
|
63
|
-
_context.next = 6;
|
|
64
|
-
break;
|
|
65
|
-
|
|
66
|
-
case 19:
|
|
67
|
-
_context.next = 25;
|
|
68
|
-
break;
|
|
69
|
-
|
|
70
|
-
case 21:
|
|
71
|
-
_context.prev = 21;
|
|
72
|
-
_context.t0 = _context["catch"](4);
|
|
73
|
-
_didIteratorError = true;
|
|
74
|
-
_iteratorError = _context.t0;
|
|
21
|
+
this.stream = async function (asyncIterator) {
|
|
22
|
+
this._input = asyncIterator;
|
|
75
23
|
|
|
76
|
-
|
|
77
|
-
|
|
78
|
-
|
|
24
|
+
try {
|
|
25
|
+
for await (const chunk of asyncIterator) {
|
|
26
|
+
this.parseChunk(this.getStringChunk(chunk));
|
|
27
|
+
}
|
|
79
28
|
|
|
80
|
-
|
|
81
|
-
|
|
82
|
-
|
|
83
|
-
|
|
84
|
-
|
|
85
|
-
|
|
86
|
-
return _iterator.return();
|
|
87
|
-
|
|
88
|
-
case 30:
|
|
89
|
-
_context.prev = 30;
|
|
90
|
-
|
|
91
|
-
if (!_didIteratorError) {
|
|
92
|
-
_context.next = 33;
|
|
93
|
-
break;
|
|
94
|
-
}
|
|
95
|
-
|
|
96
|
-
throw _iteratorError;
|
|
97
|
-
|
|
98
|
-
case 33:
|
|
99
|
-
return _context.finish(30);
|
|
100
|
-
|
|
101
|
-
case 34:
|
|
102
|
-
return _context.finish(25);
|
|
103
|
-
|
|
104
|
-
case 35:
|
|
105
|
-
this._finished = true;
|
|
106
|
-
this.parseChunk('');
|
|
107
|
-
_context.next = 42;
|
|
108
|
-
break;
|
|
109
|
-
|
|
110
|
-
case 39:
|
|
111
|
-
_context.prev = 39;
|
|
112
|
-
_context.t1 = _context["catch"](1);
|
|
113
|
-
|
|
114
|
-
this._sendError(_context.t1);
|
|
115
|
-
|
|
116
|
-
case 42:
|
|
117
|
-
case "end":
|
|
118
|
-
return _context.stop();
|
|
119
|
-
}
|
|
120
|
-
}
|
|
121
|
-
}, _callee, this, [[1, 39], [4, 21, 25, 35], [26,, 30, 34]]);
|
|
122
|
-
}));
|
|
123
|
-
|
|
124
|
-
return function (_x) {
|
|
125
|
-
return _ref.apply(this, arguments);
|
|
126
|
-
};
|
|
127
|
-
}();
|
|
29
|
+
this._finished = true;
|
|
30
|
+
this.parseChunk('');
|
|
31
|
+
} catch (error) {
|
|
32
|
+
this._sendError(error);
|
|
33
|
+
}
|
|
34
|
+
};
|
|
128
35
|
|
|
129
36
|
this._nextChunk = function nextChunk() {};
|
|
130
37
|
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"sources":["../../../src/lib/async-iterator-streamer.ts"],"names":["ChunkStreamer","Papa","AsyncIteratorStreamer","config","call","textDecoder","TextDecoder","_config","encoding","stream","asyncIterator","_input","chunk","parseChunk","getStringChunk","_finished","_sendError","_nextChunk","nextChunk","decode","prototype","Object","create","constructor"],"mappings":"
|
|
1
|
+
{"version":3,"sources":["../../../src/lib/async-iterator-streamer.ts"],"names":["ChunkStreamer","Papa","AsyncIteratorStreamer","config","call","textDecoder","TextDecoder","_config","encoding","stream","asyncIterator","_input","chunk","parseChunk","getStringChunk","_finished","error","_sendError","_nextChunk","nextChunk","decode","prototype","Object","create","constructor"],"mappings":";;;;;;;;;AAQA;;AACA,MAAM;AAACA,EAAAA;AAAD,IAAkBC,kBAAxB;;AAEe,SAASC,qBAAT,CAA+BC,MAA/B,EAAuC;AACpDA,EAAAA,MAAM,GAAGA,MAAM,IAAI,EAAnB;AAEAH,EAAAA,aAAa,CAACI,IAAd,CAAmB,IAAnB,EAAyBD,MAAzB;AAEA,OAAKE,WAAL,GAAmB,IAAIC,WAAJ,CAAgB,KAAKC,OAAL,CAAaC,QAA7B,CAAnB;;AAaA,OAAKC,MAAL,GAAc,gBAAgBC,aAAhB,EAA+B;AAC3C,SAAKC,MAAL,GAAcD,aAAd;;AAEA,QAAI;AAGF,iBAAW,MAAME,KAAjB,IAA0BF,aAA1B,EAAyC;AACvC,aAAKG,UAAL,CAAgB,KAAKC,cAAL,CAAoBF,KAApB,CAAhB;AACD;;AAcD,WAAKG,SAAL,GAAiB,IAAjB;AACA,WAAKF,UAAL,CAAgB,EAAhB;AACD,KArBD,CAqBE,OAAOG,KAAP,EAAc;AAEd,WAAKC,UAAL,CAAgBD,KAAhB;AACD;AACF,GA5BD;;AA8BA,OAAKE,UAAL,GAAkB,SAASC,SAAT,GAAqB,CAEtC,CAFD;;AAKA,OAAKL,cAAL,GAAsB,UAAUF,KAAV,EAAiB;AACrC,WAAO,OAAOA,KAAP,KAAiB,QAAjB,GAA4BA,KAA5B,GAAoC,KAAKP,WAAL,CAAiBe,MAAjB,CAAwBR,KAAxB,EAA+B;AAACH,MAAAA,MAAM,EAAE;AAAT,KAA/B,CAA3C;AACD,GAFD;AAGD;;AAEDP,qBAAqB,CAACmB,SAAtB,GAAkCC,MAAM,CAACC,MAAP,CAAcvB,aAAa,CAACqB,SAA5B,CAAlC;AACAnB,qBAAqB,CAACmB,SAAtB,CAAgCG,WAAhC,GAA8CtB,qBAA9C","sourcesContent":["// A custom papaparse `Streamer` for async iterators\n// Ideally this can be contributed back to papaparse\n// Or papaparse can expose Streamer API so we can extend without forking.\n\n// @ts-nocheck\n/* eslint-disable no-invalid-this */\n\n// Note: papaparse is not an ES6 module\nimport Papa from '../libs/papaparse';\nconst {ChunkStreamer} = Papa;\n\nexport default function AsyncIteratorStreamer(config) {\n config = config || {};\n\n ChunkStreamer.call(this, config);\n\n this.textDecoder = new TextDecoder(this._config.encoding);\n\n // Implement ChunkStreamer base class methods\n\n // this.pause = function() {\n // ChunkStreamer.prototype.pause.apply(this, arguments);\n // };\n\n // this.resume = function() {\n // ChunkStreamer.prototype.resume.apply(this, arguments);\n // this._input.resume();\n // };\n\n this.stream = async function (asyncIterator) {\n this._input = asyncIterator;\n\n try {\n // ES2018 version\n // TODO - check for pause and abort flags?\n for await (const chunk of asyncIterator) {\n this.parseChunk(this.getStringChunk(chunk));\n }\n\n // ES5 VERSION\n // while (true) {\n // asyncIterator.next().then(function(value) {\n // if (value.done) {\n // // finalize iterator?\n // }\n // }\n // const = await ;\n // if (done) return total;\n // total += value.length;\n // }\n\n this._finished = true;\n this.parseChunk('');\n } catch (error) {\n // Inform ChunkStreamer base class of error\n this._sendError(error);\n }\n };\n\n this._nextChunk = function nextChunk() {\n // Left empty, as async iterator automatically pulls next chunk\n };\n\n // HELPER METHODS\n this.getStringChunk = function (chunk) {\n return typeof chunk === 'string' ? chunk : this.textDecoder.decode(chunk, {stream: true});\n };\n}\n\nAsyncIteratorStreamer.prototype = Object.create(ChunkStreamer.prototype);\nAsyncIteratorStreamer.prototype.constructor = AsyncIteratorStreamer;\n"],"file":"async-iterator-streamer.js"}
|
|
@@ -7,124 +7,31 @@ Object.defineProperty(exports, "__esModule", {
|
|
|
7
7
|
});
|
|
8
8
|
exports.default = AsyncIteratorStreamer;
|
|
9
9
|
|
|
10
|
-
var _regenerator = _interopRequireDefault(require("@babel/runtime/regenerator"));
|
|
11
|
-
|
|
12
|
-
var _asyncToGenerator2 = _interopRequireDefault(require("@babel/runtime/helpers/asyncToGenerator"));
|
|
13
|
-
|
|
14
|
-
var _asyncIterator2 = _interopRequireDefault(require("@babel/runtime/helpers/asyncIterator"));
|
|
15
|
-
|
|
16
10
|
var _papaparse = _interopRequireDefault(require("../libs/papaparse"));
|
|
17
11
|
|
|
18
|
-
|
|
12
|
+
const {
|
|
13
|
+
ChunkStreamer
|
|
14
|
+
} = _papaparse.default;
|
|
19
15
|
|
|
20
16
|
function AsyncIteratorStreamer(config) {
|
|
21
17
|
config = config || {};
|
|
22
18
|
ChunkStreamer.call(this, config);
|
|
23
19
|
this.textDecoder = new TextDecoder(this._config.encoding);
|
|
24
20
|
|
|
25
|
-
this.stream = function () {
|
|
26
|
-
|
|
27
|
-
var _iteratorNormalCompletion, _didIteratorError, _iteratorError, _iterator, _step, _value, chunk;
|
|
28
|
-
|
|
29
|
-
return _regenerator.default.wrap(function _callee$(_context) {
|
|
30
|
-
while (1) {
|
|
31
|
-
switch (_context.prev = _context.next) {
|
|
32
|
-
case 0:
|
|
33
|
-
this._input = asyncIterator;
|
|
34
|
-
_context.prev = 1;
|
|
35
|
-
_iteratorNormalCompletion = true;
|
|
36
|
-
_didIteratorError = false;
|
|
37
|
-
_context.prev = 4;
|
|
38
|
-
_iterator = (0, _asyncIterator2.default)(asyncIterator);
|
|
39
|
-
|
|
40
|
-
case 6:
|
|
41
|
-
_context.next = 8;
|
|
42
|
-
return _iterator.next();
|
|
43
|
-
|
|
44
|
-
case 8:
|
|
45
|
-
_step = _context.sent;
|
|
46
|
-
_iteratorNormalCompletion = _step.done;
|
|
47
|
-
_context.next = 12;
|
|
48
|
-
return _step.value;
|
|
49
|
-
|
|
50
|
-
case 12:
|
|
51
|
-
_value = _context.sent;
|
|
52
|
-
|
|
53
|
-
if (_iteratorNormalCompletion) {
|
|
54
|
-
_context.next = 19;
|
|
55
|
-
break;
|
|
56
|
-
}
|
|
57
|
-
|
|
58
|
-
chunk = _value;
|
|
59
|
-
this.parseChunk(this.getStringChunk(chunk));
|
|
60
|
-
|
|
61
|
-
case 16:
|
|
62
|
-
_iteratorNormalCompletion = true;
|
|
63
|
-
_context.next = 6;
|
|
64
|
-
break;
|
|
65
|
-
|
|
66
|
-
case 19:
|
|
67
|
-
_context.next = 25;
|
|
68
|
-
break;
|
|
69
|
-
|
|
70
|
-
case 21:
|
|
71
|
-
_context.prev = 21;
|
|
72
|
-
_context.t0 = _context["catch"](4);
|
|
73
|
-
_didIteratorError = true;
|
|
74
|
-
_iteratorError = _context.t0;
|
|
21
|
+
this.stream = async function (asyncIterator) {
|
|
22
|
+
this._input = asyncIterator;
|
|
75
23
|
|
|
76
|
-
|
|
77
|
-
|
|
78
|
-
|
|
24
|
+
try {
|
|
25
|
+
for await (const chunk of asyncIterator) {
|
|
26
|
+
this.parseChunk(this.getStringChunk(chunk));
|
|
27
|
+
}
|
|
79
28
|
|
|
80
|
-
|
|
81
|
-
|
|
82
|
-
|
|
83
|
-
|
|
84
|
-
|
|
85
|
-
|
|
86
|
-
return _iterator.return();
|
|
87
|
-
|
|
88
|
-
case 30:
|
|
89
|
-
_context.prev = 30;
|
|
90
|
-
|
|
91
|
-
if (!_didIteratorError) {
|
|
92
|
-
_context.next = 33;
|
|
93
|
-
break;
|
|
94
|
-
}
|
|
95
|
-
|
|
96
|
-
throw _iteratorError;
|
|
97
|
-
|
|
98
|
-
case 33:
|
|
99
|
-
return _context.finish(30);
|
|
100
|
-
|
|
101
|
-
case 34:
|
|
102
|
-
return _context.finish(25);
|
|
103
|
-
|
|
104
|
-
case 35:
|
|
105
|
-
this._finished = true;
|
|
106
|
-
this.parseChunk('');
|
|
107
|
-
_context.next = 42;
|
|
108
|
-
break;
|
|
109
|
-
|
|
110
|
-
case 39:
|
|
111
|
-
_context.prev = 39;
|
|
112
|
-
_context.t1 = _context["catch"](1);
|
|
113
|
-
|
|
114
|
-
this._sendError(_context.t1);
|
|
115
|
-
|
|
116
|
-
case 42:
|
|
117
|
-
case "end":
|
|
118
|
-
return _context.stop();
|
|
119
|
-
}
|
|
120
|
-
}
|
|
121
|
-
}, _callee, this, [[1, 39], [4, 21, 25, 35], [26,, 30, 34]]);
|
|
122
|
-
}));
|
|
123
|
-
|
|
124
|
-
return function (_x) {
|
|
125
|
-
return _ref.apply(this, arguments);
|
|
126
|
-
};
|
|
127
|
-
}();
|
|
29
|
+
this._finished = true;
|
|
30
|
+
this.parseChunk('');
|
|
31
|
+
} catch (error) {
|
|
32
|
+
this._sendError(error);
|
|
33
|
+
}
|
|
34
|
+
};
|
|
128
35
|
|
|
129
36
|
this._nextChunk = function nextChunk() {};
|
|
130
37
|
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"sources":["../../../src/papaparse/async-iterator-streamer.js"],"names":["ChunkStreamer","Papa","AsyncIteratorStreamer","config","call","textDecoder","TextDecoder","_config","encoding","stream","asyncIterator","_input","chunk","parseChunk","getStringChunk","_finished","_sendError","_nextChunk","nextChunk","decode","prototype","Object","create","constructor"],"mappings":"
|
|
1
|
+
{"version":3,"sources":["../../../src/papaparse/async-iterator-streamer.js"],"names":["ChunkStreamer","Papa","AsyncIteratorStreamer","config","call","textDecoder","TextDecoder","_config","encoding","stream","asyncIterator","_input","chunk","parseChunk","getStringChunk","_finished","error","_sendError","_nextChunk","nextChunk","decode","prototype","Object","create","constructor"],"mappings":";;;;;;;;;AAQA;;AACA,MAAM;AAACA,EAAAA;AAAD,IAAkBC,kBAAxB;;AAEe,SAASC,qBAAT,CAA+BC,MAA/B,EAAuC;AACpDA,EAAAA,MAAM,GAAGA,MAAM,IAAI,EAAnB;AAEAH,EAAAA,aAAa,CAACI,IAAd,CAAmB,IAAnB,EAAyBD,MAAzB;AAEA,OAAKE,WAAL,GAAmB,IAAIC,WAAJ,CAAgB,KAAKC,OAAL,CAAaC,QAA7B,CAAnB;;AAaA,OAAKC,MAAL,GAAc,gBAAgBC,aAAhB,EAA+B;AAC3C,SAAKC,MAAL,GAAcD,aAAd;;AAEA,QAAI;AAGF,iBAAW,MAAME,KAAjB,IAA0BF,aAA1B,EAAyC;AACvC,aAAKG,UAAL,CAAgB,KAAKC,cAAL,CAAoBF,KAApB,CAAhB;AACD;;AAcD,WAAKG,SAAL,GAAiB,IAAjB;AACA,WAAKF,UAAL,CAAgB,EAAhB;AACD,KArBD,CAqBE,OAAOG,KAAP,EAAc;AAEd,WAAKC,UAAL,CAAgBD,KAAhB;AACD;AACF,GA5BD;;AA8BA,OAAKE,UAAL,GAAkB,SAASC,SAAT,GAAqB,CAEtC,CAFD;;AAKA,OAAKL,cAAL,GAAsB,UAAUF,KAAV,EAAiB;AACrC,WAAO,OAAOA,KAAP,KAAiB,QAAjB,GAA4BA,KAA5B,GAAoC,KAAKP,WAAL,CAAiBe,MAAjB,CAAwBR,KAAxB,EAA+B;AAACH,MAAAA,MAAM,EAAE;AAAT,KAA/B,CAA3C;AACD,GAFD;AAGD;;AAEDP,qBAAqB,CAACmB,SAAtB,GAAkCC,MAAM,CAACC,MAAP,CAAcvB,aAAa,CAACqB,SAA5B,CAAlC;AACAnB,qBAAqB,CAACmB,SAAtB,CAAgCG,WAAhC,GAA8CtB,qBAA9C","sourcesContent":["// A custom papaparse `Streamer` for async iterators\n// Ideally this can be contributed back to papaparse\n// Or papaparse can expose Streamer API so we can extend without forking.\n\n// @ts-nocheck\n/* eslint-disable no-invalid-this */\n\n// Note: papaparse is not an ES6 module\nimport Papa from '../libs/papaparse';\nconst {ChunkStreamer} = Papa;\n\nexport default function AsyncIteratorStreamer(config) {\n config = config || {};\n\n ChunkStreamer.call(this, config);\n\n this.textDecoder = new TextDecoder(this._config.encoding);\n\n // Implement ChunkStreamer base class methods\n\n // this.pause = function() {\n // ChunkStreamer.prototype.pause.apply(this, arguments);\n // };\n\n // this.resume = function() {\n // ChunkStreamer.prototype.resume.apply(this, arguments);\n // this._input.resume();\n // };\n\n this.stream = async function (asyncIterator) {\n this._input = asyncIterator;\n\n try {\n // ES2018 version\n // TODO - check for pause and abort flags?\n for await (const chunk of asyncIterator) {\n this.parseChunk(this.getStringChunk(chunk));\n }\n\n // ES5 VERSION\n // while (true) {\n // asyncIterator.next().then(function(value) {\n // if (value.done) {\n // // finalize iterator?\n // }\n // }\n // const = await ;\n // if (done) return total;\n // total += value.length;\n // }\n\n this._finished = true;\n this.parseChunk('');\n } catch (error) {\n // Inform ChunkStreamer base class of error\n this._sendError(error);\n }\n };\n\n this._nextChunk = function nextChunk() {\n // Left empty, as async iterator automatically pulls next chunk\n };\n\n // HELPER METHODS\n this.getStringChunk = function (chunk) {\n return typeof chunk === 'string' ? chunk : this.textDecoder.decode(chunk, {stream: true});\n };\n}\n\nAsyncIteratorStreamer.prototype = Object.create(ChunkStreamer.prototype);\nAsyncIteratorStreamer.prototype.constructor = AsyncIteratorStreamer;\n"],"file":"async-iterator-streamer.js"}
|
package/dist/esm/csv-loader.js
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
import { AsyncQueue, TableBatchBuilder, convertToArrayRow, convertToObjectRow } from '@loaders.gl/schema';
|
|
2
2
|
import Papa from './libs/papaparse';
|
|
3
3
|
import AsyncIteratorStreamer from './lib/async-iterator-streamer';
|
|
4
|
-
const VERSION = typeof "3.1.0-alpha.
|
|
4
|
+
const VERSION = typeof "3.1.0-alpha.5" !== 'undefined' ? "3.1.0-alpha.5" : 'latest';
|
|
5
5
|
const DEFAULT_CSV_LOADER_OPTIONS = {
|
|
6
6
|
csv: {
|
|
7
7
|
shape: 'object-row-table',
|
|
@@ -187,7 +187,7 @@ function duplicateColumnTransformer() {
|
|
|
187
187
|
let counter = 1;
|
|
188
188
|
|
|
189
189
|
while (observedColumns.has(colName)) {
|
|
190
|
-
colName =
|
|
190
|
+
colName = "".concat(col, ".").concat(counter);
|
|
191
191
|
counter++;
|
|
192
192
|
}
|
|
193
193
|
|
|
@@ -200,7 +200,7 @@ function generateHeader(columnPrefix, count = 0) {
|
|
|
200
200
|
const headers = [];
|
|
201
201
|
|
|
202
202
|
for (let i = 0; i < count; i++) {
|
|
203
|
-
headers.push(
|
|
203
|
+
headers.push("".concat(columnPrefix).concat(i + 1));
|
|
204
204
|
}
|
|
205
205
|
|
|
206
206
|
return headers;
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"sources":["../../src/csv-loader.ts"],"names":["AsyncQueue","TableBatchBuilder","convertToArrayRow","convertToObjectRow","Papa","AsyncIteratorStreamer","VERSION","DEFAULT_CSV_LOADER_OPTIONS","csv","shape","optimizeMemoryUsage","header","columnPrefix","quoteChar","escapeChar","dynamicTyping","comments","skipEmptyLines","delimitersToGuess","CSVLoader","id","module","name","version","extensions","mimeTypes","category","parse","arrayBuffer","options","parseCSV","TextDecoder","decode","parseText","text","parseInBatches","parseCSVInBatches","csvText","csvOptions","firstRow","readFirstRow","isHeaderRow","Boolean","parseWithHeader","papaparseConfig","download","transformHeader","duplicateColumnTransformer","undefined","error","e","Error","result","data","rows","headerRow","meta","fields","generateHeader","length","map","row","Array","isArray","asyncIterator","batchSize","asyncQueue","isFirstRow","tableBatchBuilder","schema","config","chunkSize","step","results","collapsedRow","flat","join","trim","bytesUsed","cursor","deduceSchema","JSON","stringify","addRow","batch","getFullBatch","enqueue","complete","getFinalBatch","close","every","value","preview","observedColumns","Set","col","colName","counter","has","add","count","headers","i","push","columnName","String","index","type","Float32Array","_typecheckCSVLoader"],"mappings":"AAIA,SACEA,UADF,EAEEC,iBAFF,EAGEC,iBAHF,EAIEC,kBAJF,QAKO,oBALP;AAMA,OAAOC,IAAP,MAAiB,kBAAjB;AACA,OAAOC,qBAAP,MAAkC,+BAAlC;AAIA,MAAMC,OAAO,GAAG,2BAAuB,WAAvB,qBAAmD,QAAnE;AA0BA,MAAMC,0BAA0B,GAAG;AACjCC,EAAAA,GAAG,EAAE;AACHC,IAAAA,KAAK,EAAE,kBADJ;AAEHC,IAAAA,mBAAmB,EAAE,KAFlB;AAIHC,IAAAA,MAAM,EAAE,MAJL;AAKHC,IAAAA,YAAY,EAAE,QALX;AAQHC,IAAAA,SAAS,EAAE,GARR;AASHC,IAAAA,UAAU,EAAE,GATT;AAUHC,IAAAA,aAAa,EAAE,IAVZ;AAWHC,IAAAA,QAAQ,EAAE,KAXP;AAYHC,IAAAA,cAAc,EAAE,IAZb;AAcHC,IAAAA,iBAAiB,EAAE,CAAC,GAAD,EAAM,IAAN,EAAY,GAAZ,EAAiB,GAAjB;AAdhB;AAD4B,CAAnC;AAoBA,OAAO,MAAMC,SAAS,GAAG;AACvBC,EAAAA,EAAE,EAAE,KADmB;AAEvBC,EAAAA,MAAM,EAAE,KAFe;AAGvBC,EAAAA,IAAI,EAAE,KAHiB;AAIvBC,EAAAA,OAAO,EAAEjB,OAJc;AAKvBkB,EAAAA,UAAU,EAAE,CAAC,KAAD,EAAQ,KAAR,EAAe,KAAf,CALW;AAMvBC,EAAAA,SAAS,EAAE,CAAC,UAAD,EAAa,2BAAb,EAA0C,UAA1C,CANY;AAOvBC,EAAAA,QAAQ,EAAE,OAPa;AAQvBC,EAAAA,KAAK,EAAE,OAAOC,WAAP,EAAiCC,OAAjC,KACLC,QAAQ,CAAC,IAAIC,WAAJ,GAAkBC,MAAlB,CAAyBJ,WAAzB,CAAD,EAAwCC,OAAxC,CATa;AAUvBI,EAAAA,SAAS,EAAE,CAACC,IAAD,EAAeL,OAAf,KAA8CC,QAAQ,CAACI,IAAD,EAAOL,OAAP,CAV1C;AAWvBM,EAAAA,cAAc,EAAEC,iBAXO;AAcvBP,EAAAA,OAAO,EAAEtB;AAdc,CAAlB;;AAiBP,eAAeuB,QAAf,CAAwBO,OAAxB,EAAyCR,OAAzC,EAAqE;AAEnE,QAAMS,UAAU,GAAG,EAAC,GAAG/B,0BAA0B,CAACC,GAA/B;AAAoC,QAAGqB,OAAH,aAAGA,OAAH,uBAAGA,OAAO,CAAErB,GAAZ;AAApC,GAAnB;AAEA,QAAM+B,QAAQ,GAAGC,YAAY,CAACH,OAAD,CAA7B;AACA,QAAM1B,MAAe,GACnB2B,UAAU,CAAC3B,MAAX,KAAsB,MAAtB,GAA+B8B,WAAW,CAACF,QAAD,CAA1C,GAAuDG,OAAO,CAACJ,UAAU,CAAC3B,MAAZ,CADhE;AAGA,QAAMgC,eAAe,GAAGhC,MAAxB;AAEA,QAAMiC,eAAe,GAAG,EAEtB,GAAGN,UAFmB;AAGtB3B,IAAAA,MAAM,EAAEgC,eAHc;AAItBE,IAAAA,QAAQ,EAAE,KAJY;AAKtBC,IAAAA,eAAe,EAAEH,eAAe,GAAGI,0BAA0B,EAA7B,GAAkCC,SAL5C;AAMtBC,IAAAA,KAAK,EAAGC,CAAD,IAAO;AACZ,YAAM,IAAIC,KAAJ,CAAUD,CAAV,CAAN;AACD;AARqB,GAAxB;AAWA,QAAME,MAAM,GAAGhD,IAAI,CAACuB,KAAL,CAAWU,OAAX,EAAoBO,eAApB,CAAf;AACA,MAAI;AAACS,IAAAA,IAAI,EAAEC;AAAP,MAAeF,MAAnB;AAEA,QAAMG,SAAS,GAAGH,MAAM,CAACI,IAAP,CAAYC,MAAZ,IAAsBC,cAAc,CAACpB,UAAU,CAAC1B,YAAZ,EAA0B2B,QAAQ,CAACoB,MAAnC,CAAtD;;AAEA,UAAQrB,UAAU,CAAC7B,KAAnB;AACE,SAAK,kBAAL;AACE6C,MAAAA,IAAI,GAAGA,IAAI,CAACM,GAAL,CAAUC,GAAD,IAAUC,KAAK,CAACC,OAAN,CAAcF,GAAd,IAAqB1D,kBAAkB,CAAC0D,GAAD,EAAMN,SAAN,CAAvC,GAA0DM,GAA7E,CAAP;AACA;;AACF,SAAK,iBAAL;AACEP,MAAAA,IAAI,GAAGA,IAAI,CAACM,GAAL,CAAUC,GAAD,IAAUC,KAAK,CAACC,OAAN,CAAcF,GAAd,IAAqBA,GAArB,GAA2B3D,iBAAiB,CAAC2D,GAAD,EAAMN,SAAN,CAA/D,CAAP;AACA;;AACF;AAPF;;AAsBA,SAAOD,IAAP;AACD;;AAGD,SAASlB,iBAAT,CACE4B,aADF,EAEEnC,OAFF,EAGwB;AAAA;;AAGtBA,EAAAA,OAAO,GAAG,EAAC,GAAGA;AAAJ,GAAV;;AACA,MAAIA,OAAO,CAACoC,SAAR,KAAsB,MAA1B,EAAkC;AAChCpC,IAAAA,OAAO,CAACoC,SAAR,GAAoB,IAApB;AACD;;AAGD,QAAM3B,UAAU,GAAG,EAAC,GAAG/B,0BAA0B,CAACC,GAA/B;AAAoC,oBAAGqB,OAAH,6CAAG,SAASrB,GAAZ;AAApC,GAAnB;AAEA,QAAM0D,UAAU,GAAG,IAAIlE,UAAJ,EAAnB;AAEA,MAAImE,UAAmB,GAAG,IAA1B;AACA,MAAIZ,SAA0B,GAAG,IAAjC;AACA,MAAIa,iBAA2C,GAAG,IAAlD;AACA,MAAIC,MAAqB,GAAG,IAA5B;AAEA,QAAMC,MAAM,GAAG,EAEb,GAAGhC,UAFU;AAGb3B,IAAAA,MAAM,EAAE,KAHK;AAIbkC,IAAAA,QAAQ,EAAE,KAJG;AAQb0B,IAAAA,SAAS,EAAE,OAAO,IAAP,GAAc,CARZ;AAcbtD,IAAAA,cAAc,EAAE,KAdH;;AAkBbuD,IAAAA,IAAI,CAACC,OAAD,EAAU;AACZ,UAAIZ,GAAG,GAAGY,OAAO,CAACpB,IAAlB;;AAEA,UAAIf,UAAU,CAACrB,cAAf,EAA+B;AAE7B,cAAMyD,YAAY,GAAGb,GAAG,CAACc,IAAJ,GAAWC,IAAX,CAAgB,EAAhB,EAAoBC,IAApB,EAArB;;AACA,YAAIH,YAAY,KAAK,EAArB,EAAyB;AACvB;AACD;AACF;;AACD,YAAMI,SAAS,GAAGL,OAAO,CAACjB,IAAR,CAAauB,MAA/B;;AAGA,UAAIZ,UAAU,IAAI,CAACZ,SAAnB,EAA8B;AAE5B,cAAM5C,MAAM,GAAG2B,UAAU,CAAC3B,MAAX,KAAsB,MAAtB,GAA+B8B,WAAW,CAACoB,GAAD,CAA1C,GAAkDnB,OAAO,CAACJ,UAAU,CAAC3B,MAAZ,CAAxE;;AACA,YAAIA,MAAJ,EAAY;AACV4C,UAAAA,SAAS,GAAGM,GAAG,CAACD,GAAJ,CAAQb,0BAA0B,EAAlC,CAAZ;AACA;AACD;AACF;;AAGD,UAAIoB,UAAJ,EAAgB;AACdA,QAAAA,UAAU,GAAG,KAAb;;AACA,YAAI,CAACZ,SAAL,EAAgB;AACdA,UAAAA,SAAS,GAAGG,cAAc,CAACpB,UAAU,CAAC1B,YAAZ,EAA0BiD,GAAG,CAACF,MAA9B,CAA1B;AACD;;AACDU,QAAAA,MAAM,GAAGW,YAAY,CAACnB,GAAD,EAAMN,SAAN,CAArB;AACD;;AAED,UAAIjB,UAAU,CAAC5B,mBAAf,EAAoC;AAGlCmD,QAAAA,GAAG,GAAGoB,IAAI,CAACtD,KAAL,CAAWsD,IAAI,CAACC,SAAL,CAAerB,GAAf,CAAX,CAAN;AACD;;AAGDO,MAAAA,iBAAiB,GACfA,iBAAiB,IACjB,IAAInE,iBAAJ,CAAsBoE,MAAtB,EAA8B;AAE5B5D,QAAAA,KAAK,EAAE6B,UAAU,CAAC7B,KAAX,IAAoB,iBAFC;AAG5B,WAAGoB;AAHyB,OAA9B,CAFF;;AAQA,UAAI;AACFuC,QAAAA,iBAAiB,CAACe,MAAlB,CAAyBtB,GAAzB;AAEA,cAAMuB,KAAK,GAAGhB,iBAAiB,IAAIA,iBAAiB,CAACiB,YAAlB,CAA+B;AAACP,UAAAA;AAAD,SAA/B,CAAnC;;AACA,YAAIM,KAAJ,EAAW;AACTlB,UAAAA,UAAU,CAACoB,OAAX,CAAmBF,KAAnB;AACD;AACF,OAPD,CAOE,OAAOnC,KAAP,EAAc;AACdiB,QAAAA,UAAU,CAACoB,OAAX,CAAmBrC,KAAnB;AACD;AACF,KA1EY;;AA6EbsC,IAAAA,QAAQ,CAACd,OAAD,EAAU;AAChB,UAAI;AACF,cAAMK,SAAS,GAAGL,OAAO,CAACjB,IAAR,CAAauB,MAA/B;AAEA,cAAMK,KAAK,GAAGhB,iBAAiB,IAAIA,iBAAiB,CAACoB,aAAlB,CAAgC;AAACV,UAAAA;AAAD,SAAhC,CAAnC;;AACA,YAAIM,KAAJ,EAAW;AACTlB,UAAAA,UAAU,CAACoB,OAAX,CAAmBF,KAAnB;AACD;AACF,OAPD,CAOE,OAAOnC,KAAP,EAAc;AACdiB,QAAAA,UAAU,CAACoB,OAAX,CAAmBrC,KAAnB;AACD;;AAEDiB,MAAAA,UAAU,CAACuB,KAAX;AACD;;AA1FY,GAAf;AA6FArF,EAAAA,IAAI,CAACuB,KAAL,CAAWqC,aAAX,EAA0BM,MAA1B,EAAkCjE,qBAAlC;AAIA,SAAO6D,UAAP;AACD;;AAOD,SAASzB,WAAT,CAAqBoB,GAArB,EAA6C;AAC3C,SAAOA,GAAG,IAAIA,GAAG,CAAC6B,KAAJ,CAAWC,KAAD,IAAW,OAAOA,KAAP,KAAiB,QAAtC,CAAd;AACD;;AAOD,SAASnD,YAAT,CAAsBH,OAAtB,EAA8C;AAC5C,QAAMe,MAAM,GAAGhD,IAAI,CAACuB,KAAL,CAAWU,OAAX,EAAoB;AACjCQ,IAAAA,QAAQ,EAAE,KADuB;AAEjC9B,IAAAA,aAAa,EAAE,IAFkB;AAGjC6E,IAAAA,OAAO,EAAE;AAHwB,GAApB,CAAf;AAKA,SAAOxC,MAAM,CAACC,IAAP,CAAY,CAAZ,CAAP;AACD;;AAQD,SAASN,0BAAT,GAAsC;AACpC,QAAM8C,eAAe,GAAG,IAAIC,GAAJ,EAAxB;AACA,SAAQC,GAAD,IAAS;AACd,QAAIC,OAAO,GAAGD,GAAd;AACA,QAAIE,OAAO,GAAG,CAAd;;AACA,WAAOJ,eAAe,CAACK,GAAhB,CAAoBF,OAApB,CAAP,EAAqC;AACnCA,MAAAA,OAAO,GAAI,GAAED,GAAI,IAAGE,OAAQ,EAA5B;AACAA,MAAAA,OAAO;AACR;;AACDJ,IAAAA,eAAe,CAACM,GAAhB,CAAoBH,OAApB;AACA,WAAOA,OAAP;AACD,GATD;AAUD;;AAQD,SAAStC,cAAT,CAAwB9C,YAAxB,EAA8CwF,KAAa,GAAG,CAA9D,EAA2E;AACzE,QAAMC,OAAiB,GAAG,EAA1B;;AACA,OAAK,IAAIC,CAAC,GAAG,CAAb,EAAgBA,CAAC,GAAGF,KAApB,EAA2BE,CAAC,EAA5B,EAAgC;AAC9BD,IAAAA,OAAO,CAACE,IAAR,CAAc,GAAE3F,YAAa,GAAE0F,CAAC,GAAG,CAAE,EAArC;AACD;;AACD,SAAOD,OAAP;AACD;;AAED,SAASrB,YAAT,CAAsBnB,GAAtB,EAA2BN,SAA3B,EAAsC;AACpC,QAAMc,MAAM,GAAGd,SAAS,GAAG,EAAH,GAAQ,EAAhC;;AACA,OAAK,IAAI+C,CAAC,GAAG,CAAb,EAAgBA,CAAC,GAAGzC,GAAG,CAACF,MAAxB,EAAgC2C,CAAC,EAAjC,EAAqC;AACnC,UAAME,UAAU,GAAIjD,SAAS,IAAIA,SAAS,CAAC+C,CAAD,CAAvB,IAA+BA,CAAlD;AACA,UAAMX,KAAK,GAAG9B,GAAG,CAACyC,CAAD,CAAjB;;AACA,YAAQ,OAAOX,KAAf;AACE,WAAK,QAAL;AACA,WAAK,SAAL;AAEEtB,QAAAA,MAAM,CAACmC,UAAD,CAAN,GAAqB;AAAClF,UAAAA,IAAI,EAAEmF,MAAM,CAACD,UAAD,CAAb;AAA2BE,UAAAA,KAAK,EAAEJ,CAAlC;AAAqCK,UAAAA,IAAI,EAAEC;AAA3C,SAArB;AACA;;AACF,WAAK,QAAL;AACA;AACEvC,QAAAA,MAAM,CAACmC,UAAD,CAAN,GAAqB;AAAClF,UAAAA,IAAI,EAAEmF,MAAM,CAACD,UAAD,CAAb;AAA2BE,UAAAA,KAAK,EAAEJ,CAAlC;AAAqCK,UAAAA,IAAI,EAAE7C;AAA3C,SAArB;AARJ;AAYD;;AACD,SAAOO,MAAP;AACD;;AAED,OAAO,MAAMwC,mBAAqC,GAAG1F,SAA9C","sourcesContent":["import type {LoaderWithParser, LoaderOptions} from '@loaders.gl/loader-utils';\nimport type {Batch} from '@loaders.gl/schema';\ntype Schema = any;\n\nimport {\n AsyncQueue,\n TableBatchBuilder,\n convertToArrayRow,\n convertToObjectRow\n} from '@loaders.gl/schema';\nimport Papa from './libs/papaparse';\nimport AsyncIteratorStreamer from './lib/async-iterator-streamer';\n\n// __VERSION__ is injected by babel-plugin-version-inline\n// @ts-ignore TS2304: Cannot find name '__VERSION__'.\nconst VERSION = typeof __VERSION__ !== 'undefined' ? __VERSION__ : 'latest';\n\nexport type CSVLoaderOptions = LoaderOptions & {\n csv?: {\n // loaders.gl options\n shape?: 'array-row-table' | 'object-row-table' | 'columnar-table';\n /** optimizes memory usage but increases parsing time. */\n optimizeMemoryUsage?: boolean;\n columnPrefix?: string;\n header?: 'auto';\n\n // CSV options (papaparse)\n // delimiter: auto\n // newline: auto\n quoteChar?: string;\n escapeChar?: string;\n // Convert numbers and boolean values in rows from strings\n dynamicTyping?: boolean;\n comments?: boolean;\n skipEmptyLines?: boolean | 'greedy';\n // transform: null?\n delimitersToGuess?: string[];\n // fastMode: auto\n };\n};\n\nconst DEFAULT_CSV_LOADER_OPTIONS = {\n csv: {\n shape: 'object-row-table',\n optimizeMemoryUsage: false,\n // CSV options\n header: 'auto',\n columnPrefix: 'column',\n // delimiter: auto\n // newline: auto\n quoteChar: '\"',\n escapeChar: '\"',\n dynamicTyping: true,\n comments: false,\n skipEmptyLines: true,\n // transform: null?\n delimitersToGuess: [',', '\\t', '|', ';']\n // fastMode: auto\n }\n};\n\nexport const CSVLoader = {\n id: 'csv',\n module: 'csv',\n name: 'CSV',\n version: VERSION,\n extensions: ['csv', 'tsv', 'dsv'],\n mimeTypes: ['text/csv', 'text/tab-separated-values', 'text/dsv'],\n category: 'table',\n parse: async (arrayBuffer: ArrayBuffer, options?: CSVLoaderOptions) =>\n parseCSV(new TextDecoder().decode(arrayBuffer), options),\n parseText: (text: string, options?: CSVLoaderOptions) => parseCSV(text, options),\n parseInBatches: parseCSVInBatches,\n // @ts-ignore\n // testText: null,\n options: DEFAULT_CSV_LOADER_OPTIONS as CSVLoaderOptions\n};\n\nasync function parseCSV(csvText: string, options?: CSVLoaderOptions) {\n // Apps can call the parse method directly, we so apply default options here\n const csvOptions = {...DEFAULT_CSV_LOADER_OPTIONS.csv, ...options?.csv};\n\n const firstRow = readFirstRow(csvText);\n const header: boolean =\n csvOptions.header === 'auto' ? isHeaderRow(firstRow) : Boolean(csvOptions.header);\n\n const parseWithHeader = header;\n\n const papaparseConfig = {\n // dynamicTyping: true,\n ...csvOptions,\n header: parseWithHeader,\n download: false, // We handle loading, no need for papaparse to do it for us\n transformHeader: parseWithHeader ? duplicateColumnTransformer() : undefined,\n error: (e) => {\n throw new Error(e);\n }\n };\n\n const result = Papa.parse(csvText, papaparseConfig);\n let {data: rows} = result;\n\n const headerRow = result.meta.fields || generateHeader(csvOptions.columnPrefix, firstRow.length);\n\n switch (csvOptions.shape) {\n case 'object-row-table':\n rows = rows.map((row) => (Array.isArray(row) ? convertToObjectRow(row, headerRow) : row));\n break;\n case 'array-row-table':\n rows = rows.map((row) => (Array.isArray(row) ? row : convertToArrayRow(row, headerRow)));\n break;\n default:\n }\n\n /*\n if (!header && shape === 'object-row-table') {\n // If the dataset has no header, transform the array result into an object shape with an\n // autogenerated header\n return result.data.map((row) =>\n row.reduce((acc, value, i) => {\n acc[headerRow[i]] = value;\n return acc;\n }, {})\n );\n }\n */\n return rows;\n}\n\n// TODO - support batch size 0 = no batching/single batch?\nfunction parseCSVInBatches(\n asyncIterator: AsyncIterable<ArrayBuffer> | Iterable<ArrayBuffer>,\n options?: CSVLoaderOptions\n): AsyncIterable<Batch> {\n // Papaparse does not support standard batch size handling\n // TODO - investigate papaparse chunks mode\n options = {...options};\n if (options.batchSize === 'auto') {\n options.batchSize = 4000;\n }\n\n // Apps can call the parse method directly, we so apply default options here\n const csvOptions = {...DEFAULT_CSV_LOADER_OPTIONS.csv, ...options?.csv};\n\n const asyncQueue = new AsyncQueue<Batch>();\n\n let isFirstRow: boolean = true;\n let headerRow: string[] | null = null;\n let tableBatchBuilder: TableBatchBuilder | null = null;\n let schema: Schema | null = null;\n\n const config = {\n // dynamicTyping: true, // Convert numbers and boolean values in rows from strings,\n ...csvOptions,\n header: false, // Unfortunately, header detection is not automatic and does not infer shapes\n download: false, // We handle loading, no need for papaparse to do it for us\n // chunkSize is set to 5MB explicitly (same as Papaparse default) due to a bug where the\n // streaming parser gets stuck if skipEmptyLines and a step callback are both supplied.\n // See https://github.com/mholt/PapaParse/issues/465\n chunkSize: 1024 * 1024 * 5,\n // skipEmptyLines is set to a boolean value if supplied. Greedy is set to true\n // skipEmptyLines is handled manually given two bugs where the streaming parser gets stuck if\n // both of the skipEmptyLines and step callback options are provided:\n // - true doesn't work unless chunkSize is set: https://github.com/mholt/PapaParse/issues/465\n // - greedy doesn't work: https://github.com/mholt/PapaParse/issues/825\n skipEmptyLines: false,\n\n // step is called on every row\n // eslint-disable-next-line complexity\n step(results) {\n let row = results.data;\n\n if (csvOptions.skipEmptyLines) {\n // Manually reject lines that are empty\n const collapsedRow = row.flat().join('').trim();\n if (collapsedRow === '') {\n return;\n }\n }\n const bytesUsed = results.meta.cursor;\n\n // Check if we need to save a header row\n if (isFirstRow && !headerRow) {\n // Auto detects or can be forced with csvOptions.header\n const header = csvOptions.header === 'auto' ? isHeaderRow(row) : Boolean(csvOptions.header);\n if (header) {\n headerRow = row.map(duplicateColumnTransformer());\n return;\n }\n }\n\n // If first data row, we can deduce the schema\n if (isFirstRow) {\n isFirstRow = false;\n if (!headerRow) {\n headerRow = generateHeader(csvOptions.columnPrefix, row.length);\n }\n schema = deduceSchema(row, headerRow);\n }\n\n if (csvOptions.optimizeMemoryUsage) {\n // A workaround to allocate new strings and don't retain pointers to original strings.\n // https://bugs.chromium.org/p/v8/issues/detail?id=2869\n row = JSON.parse(JSON.stringify(row));\n }\n\n // Add the row\n tableBatchBuilder =\n tableBatchBuilder ||\n new TableBatchBuilder(schema, {\n // @ts-expect-error\n shape: csvOptions.shape || 'array-row-table',\n ...options\n });\n\n try {\n tableBatchBuilder.addRow(row);\n // If a batch has been completed, emit it\n const batch = tableBatchBuilder && tableBatchBuilder.getFullBatch({bytesUsed});\n if (batch) {\n asyncQueue.enqueue(batch);\n }\n } catch (error) {\n asyncQueue.enqueue(error as Error);\n }\n },\n\n // complete is called when all rows have been read\n complete(results) {\n try {\n const bytesUsed = results.meta.cursor;\n // Ensure any final (partial) batch gets emitted\n const batch = tableBatchBuilder && tableBatchBuilder.getFinalBatch({bytesUsed});\n if (batch) {\n asyncQueue.enqueue(batch);\n }\n } catch (error) {\n asyncQueue.enqueue(error as Error);\n }\n\n asyncQueue.close();\n }\n };\n\n Papa.parse(asyncIterator, config, AsyncIteratorStreamer);\n\n // TODO - Does it matter if we return asyncIterable or asyncIterator\n // return asyncQueue[Symbol.asyncIterator]();\n return asyncQueue;\n}\n\n/**\n * Checks if a certain row is a header row\n * @param row the row to check\n * @returns true if the row looks like a header\n */\nfunction isHeaderRow(row: string[]): boolean {\n return row && row.every((value) => typeof value === 'string');\n}\n\n/**\n * Reads, parses, and returns the first row of a CSV text\n * @param csvText the csv text to parse\n * @returns the first row\n */\nfunction readFirstRow(csvText: string): any[] {\n const result = Papa.parse(csvText, {\n download: false,\n dynamicTyping: true,\n preview: 1\n });\n return result.data[0];\n}\n\n/**\n * Creates a transformer that renames duplicate columns. This is needed as Papaparse doesn't handle\n * duplicate header columns and would use the latest occurrence by default.\n * See the header option in https://www.papaparse.com/docs#config\n * @returns a transform function that returns sanitized names for duplicate fields\n */\nfunction duplicateColumnTransformer() {\n const observedColumns = new Set();\n return (col) => {\n let colName = col;\n let counter = 1;\n while (observedColumns.has(colName)) {\n colName = `${col}.${counter}`;\n counter++;\n }\n observedColumns.add(colName);\n return colName;\n };\n}\n\n/**\n * Generates the header of a CSV given a prefix and a column count\n * @param columnPrefix the columnPrefix to use\n * @param count the count of column names to generate\n * @returns an array of column names\n */\nfunction generateHeader(columnPrefix: string, count: number = 0): string[] {\n const headers: string[] = [];\n for (let i = 0; i < count; i++) {\n headers.push(`${columnPrefix}${i + 1}`);\n }\n return headers;\n}\n\nfunction deduceSchema(row, headerRow) {\n const schema = headerRow ? {} : [];\n for (let i = 0; i < row.length; i++) {\n const columnName = (headerRow && headerRow[i]) || i;\n const value = row[i];\n switch (typeof value) {\n case 'number':\n case 'boolean':\n // TODO - booleans could be handled differently...\n schema[columnName] = {name: String(columnName), index: i, type: Float32Array};\n break;\n case 'string':\n default:\n schema[columnName] = {name: String(columnName), index: i, type: Array};\n // We currently only handle numeric rows\n // TODO we could offer a function to map strings to numbers?\n }\n }\n return schema;\n}\n\nexport const _typecheckCSVLoader: LoaderWithParser = CSVLoader;\n"],"file":"csv-loader.js"}
|
|
1
|
+
{"version":3,"sources":["../../src/csv-loader.ts"],"names":["AsyncQueue","TableBatchBuilder","convertToArrayRow","convertToObjectRow","Papa","AsyncIteratorStreamer","VERSION","DEFAULT_CSV_LOADER_OPTIONS","csv","shape","optimizeMemoryUsage","header","columnPrefix","quoteChar","escapeChar","dynamicTyping","comments","skipEmptyLines","delimitersToGuess","CSVLoader","id","module","name","version","extensions","mimeTypes","category","parse","arrayBuffer","options","parseCSV","TextDecoder","decode","parseText","text","parseInBatches","parseCSVInBatches","csvText","csvOptions","firstRow","readFirstRow","isHeaderRow","Boolean","parseWithHeader","papaparseConfig","download","transformHeader","duplicateColumnTransformer","undefined","error","e","Error","result","data","rows","headerRow","meta","fields","generateHeader","length","map","row","Array","isArray","asyncIterator","batchSize","asyncQueue","isFirstRow","tableBatchBuilder","schema","config","chunkSize","step","results","collapsedRow","flat","join","trim","bytesUsed","cursor","deduceSchema","JSON","stringify","addRow","batch","getFullBatch","enqueue","complete","getFinalBatch","close","every","value","preview","observedColumns","Set","col","colName","counter","has","add","count","headers","i","push","columnName","String","index","type","Float32Array","_typecheckCSVLoader"],"mappings":"AAIA,SACEA,UADF,EAEEC,iBAFF,EAGEC,iBAHF,EAIEC,kBAJF,QAKO,oBALP;AAMA,OAAOC,IAAP,MAAiB,kBAAjB;AACA,OAAOC,qBAAP,MAAkC,+BAAlC;AAIA,MAAMC,OAAO,GAAG,2BAAuB,WAAvB,qBAAmD,QAAnE;AA0BA,MAAMC,0BAA0B,GAAG;AACjCC,EAAAA,GAAG,EAAE;AACHC,IAAAA,KAAK,EAAE,kBADJ;AAEHC,IAAAA,mBAAmB,EAAE,KAFlB;AAIHC,IAAAA,MAAM,EAAE,MAJL;AAKHC,IAAAA,YAAY,EAAE,QALX;AAQHC,IAAAA,SAAS,EAAE,GARR;AASHC,IAAAA,UAAU,EAAE,GATT;AAUHC,IAAAA,aAAa,EAAE,IAVZ;AAWHC,IAAAA,QAAQ,EAAE,KAXP;AAYHC,IAAAA,cAAc,EAAE,IAZb;AAcHC,IAAAA,iBAAiB,EAAE,CAAC,GAAD,EAAM,IAAN,EAAY,GAAZ,EAAiB,GAAjB;AAdhB;AAD4B,CAAnC;AAoBA,OAAO,MAAMC,SAAS,GAAG;AACvBC,EAAAA,EAAE,EAAE,KADmB;AAEvBC,EAAAA,MAAM,EAAE,KAFe;AAGvBC,EAAAA,IAAI,EAAE,KAHiB;AAIvBC,EAAAA,OAAO,EAAEjB,OAJc;AAKvBkB,EAAAA,UAAU,EAAE,CAAC,KAAD,EAAQ,KAAR,EAAe,KAAf,CALW;AAMvBC,EAAAA,SAAS,EAAE,CAAC,UAAD,EAAa,2BAAb,EAA0C,UAA1C,CANY;AAOvBC,EAAAA,QAAQ,EAAE,OAPa;AAQvBC,EAAAA,KAAK,EAAE,OAAOC,WAAP,EAAiCC,OAAjC,KACLC,QAAQ,CAAC,IAAIC,WAAJ,GAAkBC,MAAlB,CAAyBJ,WAAzB,CAAD,EAAwCC,OAAxC,CATa;AAUvBI,EAAAA,SAAS,EAAE,CAACC,IAAD,EAAeL,OAAf,KAA8CC,QAAQ,CAACI,IAAD,EAAOL,OAAP,CAV1C;AAWvBM,EAAAA,cAAc,EAAEC,iBAXO;AAcvBP,EAAAA,OAAO,EAAEtB;AAdc,CAAlB;;AAiBP,eAAeuB,QAAf,CAAwBO,OAAxB,EAAyCR,OAAzC,EAAqE;AAEnE,QAAMS,UAAU,GAAG,EAAC,GAAG/B,0BAA0B,CAACC,GAA/B;AAAoC,QAAGqB,OAAH,aAAGA,OAAH,uBAAGA,OAAO,CAAErB,GAAZ;AAApC,GAAnB;AAEA,QAAM+B,QAAQ,GAAGC,YAAY,CAACH,OAAD,CAA7B;AACA,QAAM1B,MAAe,GACnB2B,UAAU,CAAC3B,MAAX,KAAsB,MAAtB,GAA+B8B,WAAW,CAACF,QAAD,CAA1C,GAAuDG,OAAO,CAACJ,UAAU,CAAC3B,MAAZ,CADhE;AAGA,QAAMgC,eAAe,GAAGhC,MAAxB;AAEA,QAAMiC,eAAe,GAAG,EAEtB,GAAGN,UAFmB;AAGtB3B,IAAAA,MAAM,EAAEgC,eAHc;AAItBE,IAAAA,QAAQ,EAAE,KAJY;AAKtBC,IAAAA,eAAe,EAAEH,eAAe,GAAGI,0BAA0B,EAA7B,GAAkCC,SAL5C;AAMtBC,IAAAA,KAAK,EAAGC,CAAD,IAAO;AACZ,YAAM,IAAIC,KAAJ,CAAUD,CAAV,CAAN;AACD;AARqB,GAAxB;AAWA,QAAME,MAAM,GAAGhD,IAAI,CAACuB,KAAL,CAAWU,OAAX,EAAoBO,eAApB,CAAf;AACA,MAAI;AAACS,IAAAA,IAAI,EAAEC;AAAP,MAAeF,MAAnB;AAEA,QAAMG,SAAS,GAAGH,MAAM,CAACI,IAAP,CAAYC,MAAZ,IAAsBC,cAAc,CAACpB,UAAU,CAAC1B,YAAZ,EAA0B2B,QAAQ,CAACoB,MAAnC,CAAtD;;AAEA,UAAQrB,UAAU,CAAC7B,KAAnB;AACE,SAAK,kBAAL;AACE6C,MAAAA,IAAI,GAAGA,IAAI,CAACM,GAAL,CAAUC,GAAD,IAAUC,KAAK,CAACC,OAAN,CAAcF,GAAd,IAAqB1D,kBAAkB,CAAC0D,GAAD,EAAMN,SAAN,CAAvC,GAA0DM,GAA7E,CAAP;AACA;;AACF,SAAK,iBAAL;AACEP,MAAAA,IAAI,GAAGA,IAAI,CAACM,GAAL,CAAUC,GAAD,IAAUC,KAAK,CAACC,OAAN,CAAcF,GAAd,IAAqBA,GAArB,GAA2B3D,iBAAiB,CAAC2D,GAAD,EAAMN,SAAN,CAA/D,CAAP;AACA;;AACF;AAPF;;AAsBA,SAAOD,IAAP;AACD;;AAGD,SAASlB,iBAAT,CACE4B,aADF,EAEEnC,OAFF,EAGwB;AAAA;;AAGtBA,EAAAA,OAAO,GAAG,EAAC,GAAGA;AAAJ,GAAV;;AACA,MAAIA,OAAO,CAACoC,SAAR,KAAsB,MAA1B,EAAkC;AAChCpC,IAAAA,OAAO,CAACoC,SAAR,GAAoB,IAApB;AACD;;AAGD,QAAM3B,UAAU,GAAG,EAAC,GAAG/B,0BAA0B,CAACC,GAA/B;AAAoC,oBAAGqB,OAAH,6CAAG,SAASrB,GAAZ;AAApC,GAAnB;AAEA,QAAM0D,UAAU,GAAG,IAAIlE,UAAJ,EAAnB;AAEA,MAAImE,UAAmB,GAAG,IAA1B;AACA,MAAIZ,SAA0B,GAAG,IAAjC;AACA,MAAIa,iBAA2C,GAAG,IAAlD;AACA,MAAIC,MAAqB,GAAG,IAA5B;AAEA,QAAMC,MAAM,GAAG,EAEb,GAAGhC,UAFU;AAGb3B,IAAAA,MAAM,EAAE,KAHK;AAIbkC,IAAAA,QAAQ,EAAE,KAJG;AAQb0B,IAAAA,SAAS,EAAE,OAAO,IAAP,GAAc,CARZ;AAcbtD,IAAAA,cAAc,EAAE,KAdH;;AAkBbuD,IAAAA,IAAI,CAACC,OAAD,EAAU;AACZ,UAAIZ,GAAG,GAAGY,OAAO,CAACpB,IAAlB;;AAEA,UAAIf,UAAU,CAACrB,cAAf,EAA+B;AAE7B,cAAMyD,YAAY,GAAGb,GAAG,CAACc,IAAJ,GAAWC,IAAX,CAAgB,EAAhB,EAAoBC,IAApB,EAArB;;AACA,YAAIH,YAAY,KAAK,EAArB,EAAyB;AACvB;AACD;AACF;;AACD,YAAMI,SAAS,GAAGL,OAAO,CAACjB,IAAR,CAAauB,MAA/B;;AAGA,UAAIZ,UAAU,IAAI,CAACZ,SAAnB,EAA8B;AAE5B,cAAM5C,MAAM,GAAG2B,UAAU,CAAC3B,MAAX,KAAsB,MAAtB,GAA+B8B,WAAW,CAACoB,GAAD,CAA1C,GAAkDnB,OAAO,CAACJ,UAAU,CAAC3B,MAAZ,CAAxE;;AACA,YAAIA,MAAJ,EAAY;AACV4C,UAAAA,SAAS,GAAGM,GAAG,CAACD,GAAJ,CAAQb,0BAA0B,EAAlC,CAAZ;AACA;AACD;AACF;;AAGD,UAAIoB,UAAJ,EAAgB;AACdA,QAAAA,UAAU,GAAG,KAAb;;AACA,YAAI,CAACZ,SAAL,EAAgB;AACdA,UAAAA,SAAS,GAAGG,cAAc,CAACpB,UAAU,CAAC1B,YAAZ,EAA0BiD,GAAG,CAACF,MAA9B,CAA1B;AACD;;AACDU,QAAAA,MAAM,GAAGW,YAAY,CAACnB,GAAD,EAAMN,SAAN,CAArB;AACD;;AAED,UAAIjB,UAAU,CAAC5B,mBAAf,EAAoC;AAGlCmD,QAAAA,GAAG,GAAGoB,IAAI,CAACtD,KAAL,CAAWsD,IAAI,CAACC,SAAL,CAAerB,GAAf,CAAX,CAAN;AACD;;AAGDO,MAAAA,iBAAiB,GACfA,iBAAiB,IACjB,IAAInE,iBAAJ,CAAsBoE,MAAtB,EAA8B;AAE5B5D,QAAAA,KAAK,EAAE6B,UAAU,CAAC7B,KAAX,IAAoB,iBAFC;AAG5B,WAAGoB;AAHyB,OAA9B,CAFF;;AAQA,UAAI;AACFuC,QAAAA,iBAAiB,CAACe,MAAlB,CAAyBtB,GAAzB;AAEA,cAAMuB,KAAK,GAAGhB,iBAAiB,IAAIA,iBAAiB,CAACiB,YAAlB,CAA+B;AAACP,UAAAA;AAAD,SAA/B,CAAnC;;AACA,YAAIM,KAAJ,EAAW;AACTlB,UAAAA,UAAU,CAACoB,OAAX,CAAmBF,KAAnB;AACD;AACF,OAPD,CAOE,OAAOnC,KAAP,EAAc;AACdiB,QAAAA,UAAU,CAACoB,OAAX,CAAmBrC,KAAnB;AACD;AACF,KA1EY;;AA6EbsC,IAAAA,QAAQ,CAACd,OAAD,EAAU;AAChB,UAAI;AACF,cAAMK,SAAS,GAAGL,OAAO,CAACjB,IAAR,CAAauB,MAA/B;AAEA,cAAMK,KAAK,GAAGhB,iBAAiB,IAAIA,iBAAiB,CAACoB,aAAlB,CAAgC;AAACV,UAAAA;AAAD,SAAhC,CAAnC;;AACA,YAAIM,KAAJ,EAAW;AACTlB,UAAAA,UAAU,CAACoB,OAAX,CAAmBF,KAAnB;AACD;AACF,OAPD,CAOE,OAAOnC,KAAP,EAAc;AACdiB,QAAAA,UAAU,CAACoB,OAAX,CAAmBrC,KAAnB;AACD;;AAEDiB,MAAAA,UAAU,CAACuB,KAAX;AACD;;AA1FY,GAAf;AA6FArF,EAAAA,IAAI,CAACuB,KAAL,CAAWqC,aAAX,EAA0BM,MAA1B,EAAkCjE,qBAAlC;AAIA,SAAO6D,UAAP;AACD;;AAOD,SAASzB,WAAT,CAAqBoB,GAArB,EAA6C;AAC3C,SAAOA,GAAG,IAAIA,GAAG,CAAC6B,KAAJ,CAAWC,KAAD,IAAW,OAAOA,KAAP,KAAiB,QAAtC,CAAd;AACD;;AAOD,SAASnD,YAAT,CAAsBH,OAAtB,EAA8C;AAC5C,QAAMe,MAAM,GAAGhD,IAAI,CAACuB,KAAL,CAAWU,OAAX,EAAoB;AACjCQ,IAAAA,QAAQ,EAAE,KADuB;AAEjC9B,IAAAA,aAAa,EAAE,IAFkB;AAGjC6E,IAAAA,OAAO,EAAE;AAHwB,GAApB,CAAf;AAKA,SAAOxC,MAAM,CAACC,IAAP,CAAY,CAAZ,CAAP;AACD;;AAQD,SAASN,0BAAT,GAAsC;AACpC,QAAM8C,eAAe,GAAG,IAAIC,GAAJ,EAAxB;AACA,SAAQC,GAAD,IAAS;AACd,QAAIC,OAAO,GAAGD,GAAd;AACA,QAAIE,OAAO,GAAG,CAAd;;AACA,WAAOJ,eAAe,CAACK,GAAhB,CAAoBF,OAApB,CAAP,EAAqC;AACnCA,MAAAA,OAAO,aAAMD,GAAN,cAAaE,OAAb,CAAP;AACAA,MAAAA,OAAO;AACR;;AACDJ,IAAAA,eAAe,CAACM,GAAhB,CAAoBH,OAApB;AACA,WAAOA,OAAP;AACD,GATD;AAUD;;AAQD,SAAStC,cAAT,CAAwB9C,YAAxB,EAA8CwF,KAAa,GAAG,CAA9D,EAA2E;AACzE,QAAMC,OAAiB,GAAG,EAA1B;;AACA,OAAK,IAAIC,CAAC,GAAG,CAAb,EAAgBA,CAAC,GAAGF,KAApB,EAA2BE,CAAC,EAA5B,EAAgC;AAC9BD,IAAAA,OAAO,CAACE,IAAR,WAAgB3F,YAAhB,SAA+B0F,CAAC,GAAG,CAAnC;AACD;;AACD,SAAOD,OAAP;AACD;;AAED,SAASrB,YAAT,CAAsBnB,GAAtB,EAA2BN,SAA3B,EAAsC;AACpC,QAAMc,MAAM,GAAGd,SAAS,GAAG,EAAH,GAAQ,EAAhC;;AACA,OAAK,IAAI+C,CAAC,GAAG,CAAb,EAAgBA,CAAC,GAAGzC,GAAG,CAACF,MAAxB,EAAgC2C,CAAC,EAAjC,EAAqC;AACnC,UAAME,UAAU,GAAIjD,SAAS,IAAIA,SAAS,CAAC+C,CAAD,CAAvB,IAA+BA,CAAlD;AACA,UAAMX,KAAK,GAAG9B,GAAG,CAACyC,CAAD,CAAjB;;AACA,YAAQ,OAAOX,KAAf;AACE,WAAK,QAAL;AACA,WAAK,SAAL;AAEEtB,QAAAA,MAAM,CAACmC,UAAD,CAAN,GAAqB;AAAClF,UAAAA,IAAI,EAAEmF,MAAM,CAACD,UAAD,CAAb;AAA2BE,UAAAA,KAAK,EAAEJ,CAAlC;AAAqCK,UAAAA,IAAI,EAAEC;AAA3C,SAArB;AACA;;AACF,WAAK,QAAL;AACA;AACEvC,QAAAA,MAAM,CAACmC,UAAD,CAAN,GAAqB;AAAClF,UAAAA,IAAI,EAAEmF,MAAM,CAACD,UAAD,CAAb;AAA2BE,UAAAA,KAAK,EAAEJ,CAAlC;AAAqCK,UAAAA,IAAI,EAAE7C;AAA3C,SAArB;AARJ;AAYD;;AACD,SAAOO,MAAP;AACD;;AAED,OAAO,MAAMwC,mBAAqC,GAAG1F,SAA9C","sourcesContent":["import type {LoaderWithParser, LoaderOptions} from '@loaders.gl/loader-utils';\nimport type {Batch} from '@loaders.gl/schema';\ntype Schema = any;\n\nimport {\n AsyncQueue,\n TableBatchBuilder,\n convertToArrayRow,\n convertToObjectRow\n} from '@loaders.gl/schema';\nimport Papa from './libs/papaparse';\nimport AsyncIteratorStreamer from './lib/async-iterator-streamer';\n\n// __VERSION__ is injected by babel-plugin-version-inline\n// @ts-ignore TS2304: Cannot find name '__VERSION__'.\nconst VERSION = typeof __VERSION__ !== 'undefined' ? __VERSION__ : 'latest';\n\nexport type CSVLoaderOptions = LoaderOptions & {\n csv?: {\n // loaders.gl options\n shape?: 'array-row-table' | 'object-row-table' | 'columnar-table';\n /** optimizes memory usage but increases parsing time. */\n optimizeMemoryUsage?: boolean;\n columnPrefix?: string;\n header?: 'auto';\n\n // CSV options (papaparse)\n // delimiter: auto\n // newline: auto\n quoteChar?: string;\n escapeChar?: string;\n // Convert numbers and boolean values in rows from strings\n dynamicTyping?: boolean;\n comments?: boolean;\n skipEmptyLines?: boolean | 'greedy';\n // transform: null?\n delimitersToGuess?: string[];\n // fastMode: auto\n };\n};\n\nconst DEFAULT_CSV_LOADER_OPTIONS = {\n csv: {\n shape: 'object-row-table',\n optimizeMemoryUsage: false,\n // CSV options\n header: 'auto',\n columnPrefix: 'column',\n // delimiter: auto\n // newline: auto\n quoteChar: '\"',\n escapeChar: '\"',\n dynamicTyping: true,\n comments: false,\n skipEmptyLines: true,\n // transform: null?\n delimitersToGuess: [',', '\\t', '|', ';']\n // fastMode: auto\n }\n};\n\nexport const CSVLoader = {\n id: 'csv',\n module: 'csv',\n name: 'CSV',\n version: VERSION,\n extensions: ['csv', 'tsv', 'dsv'],\n mimeTypes: ['text/csv', 'text/tab-separated-values', 'text/dsv'],\n category: 'table',\n parse: async (arrayBuffer: ArrayBuffer, options?: CSVLoaderOptions) =>\n parseCSV(new TextDecoder().decode(arrayBuffer), options),\n parseText: (text: string, options?: CSVLoaderOptions) => parseCSV(text, options),\n parseInBatches: parseCSVInBatches,\n // @ts-ignore\n // testText: null,\n options: DEFAULT_CSV_LOADER_OPTIONS as CSVLoaderOptions\n};\n\nasync function parseCSV(csvText: string, options?: CSVLoaderOptions) {\n // Apps can call the parse method directly, we so apply default options here\n const csvOptions = {...DEFAULT_CSV_LOADER_OPTIONS.csv, ...options?.csv};\n\n const firstRow = readFirstRow(csvText);\n const header: boolean =\n csvOptions.header === 'auto' ? isHeaderRow(firstRow) : Boolean(csvOptions.header);\n\n const parseWithHeader = header;\n\n const papaparseConfig = {\n // dynamicTyping: true,\n ...csvOptions,\n header: parseWithHeader,\n download: false, // We handle loading, no need for papaparse to do it for us\n transformHeader: parseWithHeader ? duplicateColumnTransformer() : undefined,\n error: (e) => {\n throw new Error(e);\n }\n };\n\n const result = Papa.parse(csvText, papaparseConfig);\n let {data: rows} = result;\n\n const headerRow = result.meta.fields || generateHeader(csvOptions.columnPrefix, firstRow.length);\n\n switch (csvOptions.shape) {\n case 'object-row-table':\n rows = rows.map((row) => (Array.isArray(row) ? convertToObjectRow(row, headerRow) : row));\n break;\n case 'array-row-table':\n rows = rows.map((row) => (Array.isArray(row) ? row : convertToArrayRow(row, headerRow)));\n break;\n default:\n }\n\n /*\n if (!header && shape === 'object-row-table') {\n // If the dataset has no header, transform the array result into an object shape with an\n // autogenerated header\n return result.data.map((row) =>\n row.reduce((acc, value, i) => {\n acc[headerRow[i]] = value;\n return acc;\n }, {})\n );\n }\n */\n return rows;\n}\n\n// TODO - support batch size 0 = no batching/single batch?\nfunction parseCSVInBatches(\n asyncIterator: AsyncIterable<ArrayBuffer> | Iterable<ArrayBuffer>,\n options?: CSVLoaderOptions\n): AsyncIterable<Batch> {\n // Papaparse does not support standard batch size handling\n // TODO - investigate papaparse chunks mode\n options = {...options};\n if (options.batchSize === 'auto') {\n options.batchSize = 4000;\n }\n\n // Apps can call the parse method directly, we so apply default options here\n const csvOptions = {...DEFAULT_CSV_LOADER_OPTIONS.csv, ...options?.csv};\n\n const asyncQueue = new AsyncQueue<Batch>();\n\n let isFirstRow: boolean = true;\n let headerRow: string[] | null = null;\n let tableBatchBuilder: TableBatchBuilder | null = null;\n let schema: Schema | null = null;\n\n const config = {\n // dynamicTyping: true, // Convert numbers and boolean values in rows from strings,\n ...csvOptions,\n header: false, // Unfortunately, header detection is not automatic and does not infer shapes\n download: false, // We handle loading, no need for papaparse to do it for us\n // chunkSize is set to 5MB explicitly (same as Papaparse default) due to a bug where the\n // streaming parser gets stuck if skipEmptyLines and a step callback are both supplied.\n // See https://github.com/mholt/PapaParse/issues/465\n chunkSize: 1024 * 1024 * 5,\n // skipEmptyLines is set to a boolean value if supplied. Greedy is set to true\n // skipEmptyLines is handled manually given two bugs where the streaming parser gets stuck if\n // both of the skipEmptyLines and step callback options are provided:\n // - true doesn't work unless chunkSize is set: https://github.com/mholt/PapaParse/issues/465\n // - greedy doesn't work: https://github.com/mholt/PapaParse/issues/825\n skipEmptyLines: false,\n\n // step is called on every row\n // eslint-disable-next-line complexity\n step(results) {\n let row = results.data;\n\n if (csvOptions.skipEmptyLines) {\n // Manually reject lines that are empty\n const collapsedRow = row.flat().join('').trim();\n if (collapsedRow === '') {\n return;\n }\n }\n const bytesUsed = results.meta.cursor;\n\n // Check if we need to save a header row\n if (isFirstRow && !headerRow) {\n // Auto detects or can be forced with csvOptions.header\n const header = csvOptions.header === 'auto' ? isHeaderRow(row) : Boolean(csvOptions.header);\n if (header) {\n headerRow = row.map(duplicateColumnTransformer());\n return;\n }\n }\n\n // If first data row, we can deduce the schema\n if (isFirstRow) {\n isFirstRow = false;\n if (!headerRow) {\n headerRow = generateHeader(csvOptions.columnPrefix, row.length);\n }\n schema = deduceSchema(row, headerRow);\n }\n\n if (csvOptions.optimizeMemoryUsage) {\n // A workaround to allocate new strings and don't retain pointers to original strings.\n // https://bugs.chromium.org/p/v8/issues/detail?id=2869\n row = JSON.parse(JSON.stringify(row));\n }\n\n // Add the row\n tableBatchBuilder =\n tableBatchBuilder ||\n new TableBatchBuilder(schema, {\n // @ts-expect-error\n shape: csvOptions.shape || 'array-row-table',\n ...options\n });\n\n try {\n tableBatchBuilder.addRow(row);\n // If a batch has been completed, emit it\n const batch = tableBatchBuilder && tableBatchBuilder.getFullBatch({bytesUsed});\n if (batch) {\n asyncQueue.enqueue(batch);\n }\n } catch (error) {\n asyncQueue.enqueue(error as Error);\n }\n },\n\n // complete is called when all rows have been read\n complete(results) {\n try {\n const bytesUsed = results.meta.cursor;\n // Ensure any final (partial) batch gets emitted\n const batch = tableBatchBuilder && tableBatchBuilder.getFinalBatch({bytesUsed});\n if (batch) {\n asyncQueue.enqueue(batch);\n }\n } catch (error) {\n asyncQueue.enqueue(error as Error);\n }\n\n asyncQueue.close();\n }\n };\n\n Papa.parse(asyncIterator, config, AsyncIteratorStreamer);\n\n // TODO - Does it matter if we return asyncIterable or asyncIterator\n // return asyncQueue[Symbol.asyncIterator]();\n return asyncQueue;\n}\n\n/**\n * Checks if a certain row is a header row\n * @param row the row to check\n * @returns true if the row looks like a header\n */\nfunction isHeaderRow(row: string[]): boolean {\n return row && row.every((value) => typeof value === 'string');\n}\n\n/**\n * Reads, parses, and returns the first row of a CSV text\n * @param csvText the csv text to parse\n * @returns the first row\n */\nfunction readFirstRow(csvText: string): any[] {\n const result = Papa.parse(csvText, {\n download: false,\n dynamicTyping: true,\n preview: 1\n });\n return result.data[0];\n}\n\n/**\n * Creates a transformer that renames duplicate columns. This is needed as Papaparse doesn't handle\n * duplicate header columns and would use the latest occurrence by default.\n * See the header option in https://www.papaparse.com/docs#config\n * @returns a transform function that returns sanitized names for duplicate fields\n */\nfunction duplicateColumnTransformer() {\n const observedColumns = new Set();\n return (col) => {\n let colName = col;\n let counter = 1;\n while (observedColumns.has(colName)) {\n colName = `${col}.${counter}`;\n counter++;\n }\n observedColumns.add(colName);\n return colName;\n };\n}\n\n/**\n * Generates the header of a CSV given a prefix and a column count\n * @param columnPrefix the columnPrefix to use\n * @param count the count of column names to generate\n * @returns an array of column names\n */\nfunction generateHeader(columnPrefix: string, count: number = 0): string[] {\n const headers: string[] = [];\n for (let i = 0; i < count; i++) {\n headers.push(`${columnPrefix}${i + 1}`);\n }\n return headers;\n}\n\nfunction deduceSchema(row, headerRow) {\n const schema = headerRow ? {} : [];\n for (let i = 0; i < row.length; i++) {\n const columnName = (headerRow && headerRow[i]) || i;\n const value = row[i];\n switch (typeof value) {\n case 'number':\n case 'boolean':\n // TODO - booleans could be handled differently...\n schema[columnName] = {name: String(columnName), index: i, type: Float32Array};\n break;\n case 'string':\n default:\n schema[columnName] = {name: String(columnName), index: i, type: Array};\n // We currently only handle numeric rows\n // TODO we could offer a function to map strings to numbers?\n }\n }\n return schema;\n}\n\nexport const _typecheckCSVLoader: LoaderWithParser = CSVLoader;\n"],"file":"csv-loader.js"}
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@loaders.gl/csv",
|
|
3
|
-
"version": "3.1.0-alpha.
|
|
3
|
+
"version": "3.1.0-alpha.5",
|
|
4
4
|
"description": "Framework-independent loader for CSV and DSV table formats",
|
|
5
5
|
"license": "MIT",
|
|
6
6
|
"publishConfig": {
|
|
@@ -30,11 +30,11 @@
|
|
|
30
30
|
"build-bundle": "webpack --display=minimal --config ../../scripts/webpack/bundle.js"
|
|
31
31
|
},
|
|
32
32
|
"dependencies": {
|
|
33
|
-
"@loaders.gl/loader-utils": "3.1.0-alpha.
|
|
34
|
-
"@loaders.gl/schema": "3.1.0-alpha.
|
|
33
|
+
"@loaders.gl/loader-utils": "3.1.0-alpha.5",
|
|
34
|
+
"@loaders.gl/schema": "3.1.0-alpha.5"
|
|
35
35
|
},
|
|
36
36
|
"devDependencies": {
|
|
37
37
|
"d3-dsv": "^1.2.0"
|
|
38
38
|
},
|
|
39
|
-
"gitHead": "
|
|
39
|
+
"gitHead": "352241dd910a8c6307a235dadbe154ca915b885b"
|
|
40
40
|
}
|