fast-xml-parser 4.3.4 → 4.3.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,96 @@
1
+ const trimParser = require("../valueParsers/trim")
2
+ const booleanParser = require("../valueParsers/booleanParser")
3
+ const currencyParser = require("../valueParsers/currency")
4
+ const numberParser = require("../valueParsers/number")
5
+
6
+ const defaultOptions={
7
+ nameFor:{
8
+ text: "#text",
9
+ comment: "",
10
+ cdata: "",
11
+ },
12
+ // onTagClose: () => {},
13
+ // onAttribute: () => {},
14
+ piTag: false,
15
+ declaration: false, //"?xml"
16
+ tags: {
17
+ valueParsers: [
18
+ // "trim",
19
+ // "boolean",
20
+ // "number",
21
+ // "currency",
22
+ // "date",
23
+ ]
24
+ },
25
+ attributes:{
26
+ prefix: "@_",
27
+ suffix: "",
28
+ groupBy: "",
29
+
30
+ valueParsers: [
31
+ // "trim",
32
+ // "boolean",
33
+ // "number",
34
+ // "currency",
35
+ // "date",
36
+ ]
37
+ }
38
+ }
39
+
40
+ //TODO
41
+ const withJoin = ["trim","join", /*"entities",*/"number","boolean","currency"/*, "date"*/]
42
+ const withoutJoin = ["trim", /*"entities",*/"number","boolean","currency"/*, "date"*/]
43
+
44
+ function buildOptions(options){
45
+ //clone
46
+ const finalOptions = { ... defaultOptions};
47
+
48
+ //add config missed in cloning
49
+ finalOptions.tags.valueParsers.push(...withJoin)
50
+ if(!this.preserveOrder)
51
+ finalOptions.tags.valueParsers.push(...withoutJoin);
52
+
53
+ //add config missed in cloning
54
+ finalOptions.attributes.valueParsers.push(...withJoin)
55
+
56
+ //override configuration
57
+ copyProperties(finalOptions,options);
58
+ return finalOptions;
59
+ }
60
+
61
+ function copyProperties(target, source) {
62
+ for (let key in source) {
63
+ if (source.hasOwnProperty(key)) {
64
+ if (typeof source[key] === 'object' && !Array.isArray(source[key])) {
65
+ // Recursively copy nested properties
66
+ if (typeof target[key] === 'undefined') {
67
+ target[key] = {};
68
+ }
69
+ copyProperties(target[key], source[key]);
70
+ } else {
71
+ // Copy non-nested properties
72
+ target[key] = source[key];
73
+ }
74
+ }
75
+ }
76
+ }
77
+
78
+ function registerCommonValueParsers(){
79
+ return {
80
+ "trim": new trimParser(),
81
+ // "join": this.entityParser.parse,
82
+ "boolean": new booleanParser(),
83
+ "number": new numberParser({
84
+ hex: true,
85
+ leadingZeros: true,
86
+ eNotation: true
87
+ }),
88
+ "currency": new currencyParser(),
89
+ // "date": this.entityParser.parse,
90
+ }
91
+ }
92
+
93
+ module.exports = {
94
+ buildOptions : buildOptions,
95
+ registerCommonValueParsers: registerCommonValueParsers
96
+ }
File without changes
@@ -0,0 +1,81 @@
1
+ class TagPath{
2
+ constructor(pathStr){
3
+ let text = "";
4
+ let tName = "";
5
+ let pos;
6
+ let aName = "";
7
+ let aVal = "";
8
+ this.stack = []
9
+
10
+ for (let i = 0; i < pathStr.length; i++) {
11
+ let ch = pathStr[i];
12
+ if(ch === " ") {
13
+ if(text.length === 0) continue;
14
+ tName = text; text = "";
15
+ }else if(ch === "["){
16
+ if(tName.length === 0){
17
+ tName = text; text = "";
18
+ }
19
+ i++;
20
+ for (; i < pathStr.length; i++) {
21
+ ch = pathStr[i];
22
+ if(ch=== "=") continue;
23
+ else if(ch=== "]") {aName = text.trim(); text=""; break; i--;}
24
+ else if(ch === "'" || ch === '"'){
25
+ let attrEnd = pathStr.indexOf(ch,i+1);
26
+ aVal = pathStr.substring(i+1, attrEnd);
27
+ i = attrEnd;
28
+ }else{
29
+ text +=ch;
30
+ }
31
+ }
32
+ }else if(ch !== " " && text.length === 0 && tName.length > 0){//reading tagName
33
+ //save previous tag
34
+ this.stack.push(new TagPathNode(tName,pos,aName,aVal));
35
+ text = ch; tName = ""; aName = ""; aVal = "";
36
+ }else{
37
+ text+=ch;
38
+ }
39
+ }
40
+
41
+ //last tag in the path
42
+ if(tName.length >0 || text.length>0){
43
+ this.stack.push(new TagPathNode(text||tName,pos,aName,aVal));
44
+ }
45
+ }
46
+
47
+ match(tagStack,node){
48
+ if(this.stack[0].name !== "*"){
49
+ if(this.stack.length !== tagStack.length +1) return false;
50
+
51
+ //loop through tagPath and tagStack and match
52
+ for (let i = 0; i < this.tagStack.length; i++) {
53
+ if(!this.stack[i].match(tagStack[i])) return false;
54
+ }
55
+ }
56
+ if(!this.stack[this.stack.length - 1].match(node)) return false;
57
+ return true;
58
+ }
59
+ }
60
+
61
+ class TagPathNode{
62
+ constructor(name,position,attrName,attrVal){
63
+ this.name = name;
64
+ this.position = position;
65
+ this.attrName = attrName,
66
+ this.attrVal = attrVal;
67
+ }
68
+
69
+ match(node){
70
+ let matching = true;
71
+ matching = node.name === this.name;
72
+ if(this.position) matching = node.position === this.position;
73
+ if(this.attrName) matching = node.attrs[this.attrName !== undefined];
74
+ if(this.attrVal) matching = node.attrs[this.attrName !== this.attrVal];
75
+ return matching;
76
+ }
77
+ }
78
+
79
+ // console.log((new TagPath("* b[b]")).stack);
80
+ // console.log((new TagPath("a[a] b[b] c")).stack);
81
+ // console.log((new TagPath(" b [ b= 'cf sdadwa' ] a ")).stack);
@@ -0,0 +1,15 @@
1
+ const TagPath = require("./TagPath");
2
+
3
+ class TagPathMatcher{
4
+ constructor(stack,node){
5
+ this.stack = stack;
6
+ this.node= node;
7
+ }
8
+
9
+ match(path){
10
+ const tagPath = new TagPath(path);
11
+ return tagPath.match(this.stack, this.node);
12
+ }
13
+ }
14
+
15
+ module.exports = TagPathMatcher;
@@ -0,0 +1,85 @@
1
+ const { buildOptions} = require("./OptionsBuilder");
2
+ const Xml2JsParser = require("./Xml2JsParser");
3
+
4
+ class XMLParser{
5
+
6
+ constructor(options){
7
+ this.externalEntities = {};
8
+ this.options = buildOptions(options);
9
+ // console.log(this.options)
10
+ }
11
+ /**
12
+ * Parse XML data string to JS object
13
+ * @param {string|Buffer} xmlData
14
+ * @param {boolean|Object} validationOption
15
+ */
16
+ parse(xmlData){
17
+ if(Array.isArray(xmlData) && xmlData.byteLength !== undefined){
18
+ return this.parse(xmlData);
19
+ }else if( xmlData.toString){
20
+ xmlData = xmlData.toString();
21
+ }else{
22
+ throw new Error("XML data is accepted in String or Bytes[] form.")
23
+ }
24
+ // if( validationOption){
25
+ // if(validationOption === true) validationOption = {}; //validate with default options
26
+
27
+ // const result = validator.validate(xmlData, validationOption);
28
+ // if (result !== true) {
29
+ // throw Error( `${result.err.msg}:${result.err.line}:${result.err.col}` )
30
+ // }
31
+ // }
32
+ const parser = new Xml2JsParser(this.options);
33
+ parser.entityParser.addExternalEntities(this.externalEntities);
34
+ return parser.parse(xmlData);
35
+ }
36
+ /**
37
+ * Parse XML data buffer to JS object
38
+ * @param {string|Buffer} xmlData
39
+ * @param {boolean|Object} validationOption
40
+ */
41
+ parseBytesArr(xmlData){
42
+ if(Array.isArray(xmlData) && xmlData.byteLength !== undefined){
43
+ }else{
44
+ throw new Error("XML data is accepted in Bytes[] form.")
45
+ }
46
+ const parser = new Xml2JsParser(this.options);
47
+ parser.entityParser.addExternalEntities(this.externalEntities);
48
+ return parser.parseBytesArr(xmlData);
49
+ }
50
+ /**
51
+ * Parse XML data stream to JS object
52
+ * @param {fs.ReadableStream} xmlDataStream
53
+ */
54
+ parseStream(xmlDataStream){
55
+ if(!isStream(xmlDataStream)) throw new Error("FXP: Invalid stream input");
56
+
57
+ const orderedObjParser = new Xml2JsParser(this.options);
58
+ orderedObjParser.entityParser.addExternalEntities(this.externalEntities);
59
+ return orderedObjParser.parseStream(xmlDataStream);
60
+ }
61
+
62
+ /**
63
+ * Add Entity which is not by default supported by this library
64
+ * @param {string} key
65
+ * @param {string} value
66
+ */
67
+ addEntity(key, value){
68
+ if(value.indexOf("&") !== -1){
69
+ throw new Error("Entity value can't have '&'")
70
+ }else if(key.indexOf("&") !== -1 || key.indexOf(";") !== -1){
71
+ throw new Error("An entity must be set without '&' and ';'. Eg. use '#xD' for '&#xD;'")
72
+ }else if(value === "&"){
73
+ throw new Error("An entity with value '&' is not permitted");
74
+ }else{
75
+ this.externalEntities[key] = value;
76
+ }
77
+ }
78
+ }
79
+
80
+ function isStream(stream){
81
+ if(stream && typeof stream.read === "function" && typeof stream.on === "function" && typeof stream.readableEnded === "boolean") return true;
82
+ return false;
83
+ }
84
+
85
+ module.exports = XMLParser;
@@ -0,0 +1,237 @@
1
+ const StringSource = require("./inputSource/StringSource");
2
+ const BufferSource = require("./inputSource/BufferSource");
3
+ const {readTagExp,readClosingTagName} = require("./XmlPartReader");
4
+ const {readComment, readCdata,readDocType,readPiTag} = require("./XmlSpecialTagsReader");
5
+ const TagPath = require("./TagPath");
6
+ const TagPathMatcher = require("./TagPathMatcher");
7
+ const EntitiesParser = require('./EntitiesParser');
8
+
9
+ //To hold the data of current tag
10
+ //This is usually used to compare jpath expression against current tag
11
+ class TagDetail{
12
+ constructor(name){
13
+ this.name = name;
14
+ this.position = 0;
15
+ // this.attributes = {};
16
+ }
17
+ }
18
+
19
+ class Xml2JsParser {
20
+ constructor(options) {
21
+ this.options = options;
22
+
23
+ this.currentTagDetail = null;
24
+ this.tagTextData = "";
25
+ this.tagsStack = [];
26
+ this.entityParser = new EntitiesParser(options.htmlEntities);
27
+ this.stopNodes = [];
28
+ for (let i = 0; i < this.options.stopNodes.length; i++) {
29
+ this.stopNodes.push(new TagPath(this.options.stopNodes[i]));
30
+ }
31
+ }
32
+
33
+ parse(strData) {
34
+ this.source = new StringSource(strData);
35
+ this.parseXml();
36
+ return this.outputBuilder.getOutput();
37
+ }
38
+ parseBytesArr(data) {
39
+ this.source = new BufferSource(data );
40
+ this.parseXml();
41
+ return this.outputBuilder.getOutput();
42
+ }
43
+
44
+ parseXml() {
45
+ //TODO: Separate TagValueParser as separate class. So no scope issue in node builder class
46
+
47
+ //OutputBuilder should be set in XML Parser
48
+ this.outputBuilder = this.options.OutputBuilder.getInstance(this.options);
49
+ this.root = { root: true};
50
+ this.currentTagDetail = this.root;
51
+
52
+ while(this.source.canRead()){
53
+ let ch = this.source.readCh();
54
+ if (ch === "") break;
55
+
56
+ if(ch === "<"){//tagStart
57
+ let nextChar = this.source.readChAt(0);
58
+ if (nextChar === "" ) throw new Error("Unexpected end of source");
59
+
60
+
61
+ if(nextChar === "!" || nextChar === "?"){
62
+ this.source.updateBufferBoundary();
63
+ //previously collected text should be added to current node
64
+ this.addTextNode();
65
+
66
+ this.readSpecialTag(nextChar);// Read DOCTYPE, comment, CDATA, PI tag
67
+ }else if(nextChar === "/"){
68
+ this.source.updateBufferBoundary();
69
+ this.readClosingTag();
70
+ // console.log(this.source.buffer.length, this.source.readable);
71
+ // console.log(this.tagsStack.length);
72
+ }else{//opening tag
73
+ this.readOpeningTag();
74
+ }
75
+ }else{
76
+ this.tagTextData += ch;
77
+ }
78
+ }//End While loop
79
+ if(this.tagsStack.length > 0 || ( this.tagTextData !== "undefined" && this.tagTextData.trimEnd().length > 0) ) throw new Error("Unexpected data in the end of document");
80
+ }
81
+
82
+ /**
83
+ * read closing paired tag. Set parent tag in scope.
84
+ * skip a node on user's choice
85
+ */
86
+ readClosingTag(){
87
+ const tagName = this.processTagName(readClosingTagName(this.source));
88
+ // console.log(tagName, this.tagsStack.length);
89
+ this.validateClosingTag(tagName);
90
+ // All the text data collected, belongs to current tag.
91
+ if(!this.currentTagDetail.root) this.addTextNode();
92
+ this.outputBuilder.closeTag();
93
+ // Since the tag is closed now, parent tag comes in scope
94
+ this.currentTagDetail = this.tagsStack.pop();
95
+ }
96
+
97
+ validateClosingTag(tagName){
98
+ // This can't be unpaired tag, or a stop tag.
99
+ if(this.isUnpaired(tagName) || this.isStopNode(tagName)) throw new Error(`Unexpected closing tag '${tagName}'`);
100
+ // This must match with last opening tag
101
+ else if(tagName !== this.currentTagDetail.name)
102
+ throw new Error(`Unexpected closing tag '${tagName}' expecting '${this.currentTagDetail.name}'`)
103
+ }
104
+
105
+ /**
106
+ * Read paired, unpaired, self-closing, stop and special tags.
107
+ * Create a new node
108
+ * Push paired tag in stack.
109
+ */
110
+ readOpeningTag(){
111
+ //save previously collected text data to current node
112
+ this.addTextNode();
113
+
114
+ //create new tag
115
+ let tagExp = readTagExp(this, ">" );
116
+
117
+ // process and skip from tagsStack For unpaired tag, self closing tag, and stop node
118
+ const tagDetail = new TagDetail(tagExp.tagName);
119
+ if(this.isUnpaired(tagExp.tagName)) {
120
+ //TODO: this will lead 2 extra stack operation
121
+ this.outputBuilder.addTag(tagDetail);
122
+ this.outputBuilder.closeTag();
123
+ } else if(tagExp.selfClosing){
124
+ this.outputBuilder.addTag(tagDetail);
125
+ this.outputBuilder.closeTag();
126
+ } else if(this.isStopNode(this.currentTagDetail)){
127
+ // TODO: let's user set a stop node boundary detector for complex contents like script tag
128
+ //TODO: pass tag name only to avoid string operations
129
+ const content = source.readUptoCloseTag(`</${tagExp.tagName}`);
130
+ this.outputBuilder.addTag(tagDetail);
131
+ this.outputBuilder.addValue(content);
132
+ this.outputBuilder.closeTag();
133
+ }else{//paired tag
134
+ //set new nested tag in scope.
135
+ this.tagsStack.push(this.currentTagDetail);
136
+ this.outputBuilder.addTag(tagDetail);
137
+ this.currentTagDetail = tagDetail;
138
+ }
139
+ // console.log(tagExp.tagName,this.tagsStack.length);
140
+ // this.options.onClose()
141
+
142
+ }
143
+
144
+ readSpecialTag(startCh){
145
+ if(startCh == "!"){
146
+ let nextChar = this.source.readCh();
147
+ if (nextChar === null || nextChar === undefined) throw new Error("Unexpected ending of the source");
148
+
149
+ if(nextChar === "-"){//comment
150
+ readComment(this);
151
+ }else if(nextChar === "["){//CDATA
152
+ readCdata(this);
153
+ }else if(nextChar === "D"){//DOCTYPE
154
+ readDocType(this);
155
+ }
156
+ }else if(startCh === "?"){
157
+ readPiTag(this);
158
+ }else{
159
+ throw new Error(`Invalid tag '<${startCh}' at ${this.source.line}:${this.source.col}`)
160
+ }
161
+ }
162
+ addTextNode = function() {
163
+ // if(this.currentTagDetail){
164
+ //save text as child node
165
+ // if(this.currentTagDetail.tagname !== '!xml')
166
+ if (this.tagTextData !== undefined && this.tagTextData !== "") { //store previously collected data as textNode
167
+ if(this.tagTextData.trim().length > 0){
168
+ //TODO: shift parsing to output builder
169
+
170
+ this.outputBuilder.addValue(this.replaceEntities(this.tagTextData));
171
+ }
172
+ this.tagTextData = "";
173
+ }
174
+ // }
175
+ }
176
+
177
+ processAttrName(name){
178
+ if(name === "__proto__") name = "#__proto__";
179
+ name = resolveNameSpace(name, this.removeNSPrefix);
180
+ return name;
181
+ }
182
+
183
+ processTagName(name){
184
+ if(name === "__proto__") name = "#__proto__";
185
+ name = resolveNameSpace(name, this.removeNSPrefix);
186
+ return name;
187
+ }
188
+
189
+ /**
190
+ * Generate tags path from tagsStack
191
+ */
192
+ tagsPath(tagName){
193
+ //TODO: return TagPath Object. User can call match method with path
194
+ return "";
195
+ }
196
+
197
+ isUnpaired(tagName){
198
+ return this.options.tags.unpaired.indexOf(tagName) !== -1;
199
+ }
200
+
201
+ /**
202
+ * valid expressions are
203
+ * tag nested
204
+ * * nested
205
+ * tag nested[attribute]
206
+ * tag nested[attribute=""]
207
+ * tag nested[attribute!=""]
208
+ * tag nested:0 //for future
209
+ * @param {string} tagName
210
+ * @returns
211
+ */
212
+ isStopNode(node){
213
+ for (let i = 0; i < this.stopNodes.length; i++) {
214
+ const givenPath = this.stopNodes[i];
215
+ if(givenPath.match(this.tagsStack, node)) return true;
216
+ }
217
+ return false
218
+ }
219
+
220
+ replaceEntities(text){
221
+ //TODO: if option is set then replace entities
222
+ return this.entityParser.parse(text)
223
+ }
224
+ }
225
+
226
+ function resolveNameSpace(name, removeNSPrefix) {
227
+ if (removeNSPrefix) {
228
+ const parts = name.split(':');
229
+ if(parts.length === 2){
230
+ if (parts[0] === 'xmlns') return '';
231
+ else return parts[1];
232
+ }else reportError(`Multiple namespaces ${name}`)
233
+ }
234
+ return name;
235
+ }
236
+
237
+ module.exports = Xml2JsParser;