npm - @sap/cds-compiler - Versions diffs - 2.10.4 → 2.12.0 - Mend

@sap/cds-compiler 2.10.4 → 2.12.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (103) hide show

package/CHANGELOG.md +136 -0
package/bin/.eslintrc.json +1 -2
package/bin/cds_update_identifiers.js +10 -8
package/bin/cdsc.js +58 -35
package/bin/cdsse.js +1 -0
package/bin/cdsv2m.js +3 -2
package/doc/CHANGELOG_ARCHIVE.md +1 -1
package/doc/CHANGELOG_BETA.md +16 -0
package/lib/api/.eslintrc.json +2 -0
package/lib/api/main.js +10 -36
package/lib/api/options.js +17 -8
package/lib/api/validate.js +30 -3
package/lib/backends.js +12 -13
package/lib/base/dictionaries.js +2 -1
package/lib/base/keywords.js +3 -2
package/lib/base/message-registry.js +64 -11
package/lib/base/messages.js +38 -18
package/lib/base/model.js +6 -4
package/lib/base/optionProcessorHelper.js +148 -86
package/lib/checks/.eslintrc.json +2 -0
package/lib/checks/actionsFunctions.js +2 -1
package/lib/checks/emptyOrOnlyVirtual.js +2 -2
package/lib/checks/foreignKeys.js +4 -4
package/lib/checks/managedInType.js +4 -4
package/lib/checks/queryNoDbArtifacts.js +1 -3
package/lib/checks/selectItems.js +4 -0
package/lib/checks/sql-snippets.js +93 -0
package/lib/checks/unknownMagic.js +6 -3
package/lib/checks/validator.js +8 -0
package/lib/compiler/assert-consistency.js +14 -5
package/lib/compiler/base.js +64 -0
package/lib/compiler/builtins.js +62 -16
package/lib/compiler/checks.js +34 -10
package/lib/compiler/definer.js +91 -112
package/lib/compiler/index.js +30 -30
package/lib/compiler/propagator.js +8 -4
package/lib/compiler/resolver.js +279 -63
package/lib/compiler/shared.js +65 -230
package/lib/compiler/utils.js +191 -0
package/lib/edm/annotations/genericTranslation.js +35 -18
package/lib/edm/annotations/preprocessAnnotations.js +1 -1
package/lib/edm/csn2edm.js +4 -3
package/lib/edm/edm.js +8 -8
package/lib/edm/edmPreprocessor.js +61 -59
package/lib/edm/edmUtils.js +14 -15
package/lib/gen/Dictionary.json +82 -40
package/lib/gen/language.checksum +1 -1
package/lib/gen/language.interp +19 -1
package/lib/gen/language.tokens +80 -73
package/lib/gen/languageLexer.interp +27 -1
package/lib/gen/languageLexer.js +925 -826
package/lib/gen/languageLexer.tokens +72 -65
package/lib/gen/languageParser.js +4817 -4102
package/lib/json/from-csn.js +57 -26
package/lib/json/to-csn.js +244 -51
package/lib/language/antlrParser.js +12 -1
package/lib/language/docCommentParser.js +1 -1
package/lib/language/errorStrategy.js +26 -8
package/lib/language/genericAntlrParser.js +106 -30
package/lib/language/language.g4 +200 -70
package/lib/language/multiLineStringParser.js +536 -0
package/lib/main.d.ts +220 -21
package/lib/main.js +6 -3
package/lib/model/api.js +2 -2
package/lib/model/csnRefs.js +218 -86
package/lib/model/csnUtils.js +99 -178
package/lib/model/enrichCsn.js +84 -43
package/lib/model/revealInternalProperties.js +25 -8
package/lib/model/sortViews.js +8 -1
package/lib/modelCompare/compare.js +2 -1
package/lib/optionProcessor.js +33 -18
package/lib/render/.eslintrc.json +1 -2
package/lib/render/DuplicateChecker.js +2 -2
package/lib/render/manageConstraints.js +1 -1
package/lib/render/toCdl.js +202 -82
package/lib/render/toHdbcds.js +194 -135
package/lib/render/toRename.js +7 -10
package/lib/render/toSql.js +91 -51
package/lib/render/utils/common.js +24 -5
package/lib/render/utils/sql.js +6 -4
package/lib/transform/braceExpression.js +4 -2
package/lib/transform/db/applyTransformations.js +189 -0
package/lib/transform/db/associations.js +389 -0
package/lib/transform/db/cdsPersistence.js +150 -0
package/lib/transform/db/constraints.js +275 -119
package/lib/transform/db/draft.js +6 -4
package/lib/transform/db/expansion.js +10 -9
package/lib/transform/db/flattening.js +23 -8
package/lib/transform/db/temporal.js +236 -0
package/lib/transform/db/transformExists.js +106 -25
package/lib/transform/db/views.js +485 -0
package/lib/transform/forHanaNew.js +90 -1036
package/lib/transform/forOdataNew.js +11 -3
package/lib/transform/localized.js +5 -14
package/lib/transform/odata/generateForeignKeyElements.js +2 -2
package/lib/transform/transformUtilsNew.js +34 -20
package/lib/transform/translateAssocsToJoins.js +15 -23
package/lib/transform/universalCsnEnricher.js +217 -47
package/lib/utils/file.js +13 -6
package/lib/utils/term.js +65 -42
package/lib/utils/timetrace.js +55 -27
package/package.json +1 -1
package/lib/transform/db/helpers.js +0 -58

package/lib/language/multiLineStringParser.js ADDED Viewed

@@ -0,0 +1,536 @@
+'use strict';
+const whitespaceRegEx = /[\t\u{000B}\u{000C} \u{00A0}\u{FEFF}\p{Zs}]/u; // unanchored: matches if the input contains TAB, VT, FF, SP, NBSP, ZWNBSP or any other "Zs" code point
+const newLineRegEx = /\r\n?|\n|\u2028|\u2029/u; // one line break: CRLF, CR, LF, LS or PS; no global flag, so test() and split() carry no lastIndex state
+/**
+ * Returns true if the given string only contains whitespace characters.
+ *
+ * The check relies on the regular expression class `\s`.  In JavaScript that
+ * class also covers line terminators, so a string made up of line breaks
+ * counts as whitespace-only.  The empty string yields `true` as well.
+ *
+ * @todo Combine with function from docCommentParser
+ * @param {string} str String to test.
+ * @returns {boolean} `true` if `str` is empty or consists solely of `\s` characters.
+ */
+function isWhiteSpaceOnly(str) {
+  return /^\s*$/.test(str);
+}
+/**
+ * Check whether the given character is a white-space character as
+ * defined by §11.2 of the ECMAScript 2020 specification.
+ * See <https://262.ecma-international.org/11.0/#sec-white-space>.
+ *
+ * | Code Point          | Name                                           | Abbreviation |
+ * |:--------------------|:-----------------------------------------------|--------------|
+ * | U+0009              | CHARACTER TABULATION                           | `<TAB>`      |
+ * | U+000B              | LINE TABULATION                                | `<VT>`       |
+ * | U+000C              | FORM FEED (FF)                                 | `<FF>`       |
+ * | U+0020              | SPACE                                          | `<SP>`       |
+ * | U+00A0              | NO-BREAK SPACE                                 | `<NBSP>`     |
+ * | U+FEFF              | ZERO WIDTH NO-BREAK SPACE                      | `<ZWNBSP>`   |
+ * | Other category “Zs” | Any other Unicode “Space_Separator” code point | `<USP>`      |
+ *
+ * Line terminators are deliberately _not_ part of this set; they are matched
+ * by a separate expression in this file.
+ *
+ * Note: The underlying regular expression is not anchored.  The result is only
+ * meaningful for a single character; for a longer string, the function returns
+ * `true` as soon as any contained character is white-space.
+ *
+ * @param {string} char Single character to test.
+ * @returns {boolean} `true` if `char` is one of the characters listed above.
+ */
+function isWhitespaceCharacter(char) {
+  return whitespaceRegEx.test(char);
+}
+/**
+ * Strips and counts the indentation from the given string.
+ *
+ * The indentation to remove is the smallest number of leading white-space
+ * characters found on any considered line.  Whitespace-only lines are not
+ * considered, with one exception: the last line (the one that holds the
+ * closing delimiter) is always considered, even if it is blank.
+ *
+ * Special cases:
+ *  - An empty input returns `['', 0]`.
+ *  - If the input ends with a line break, nothing is stripped: the final line
+ *    break is dropped and the reported indentation is 0.
+ *  - If the last line is empty after stripping, it is removed from the result.
+ *
+ * In all cases the resulting lines are joined with `\n`, i.e. every kind of
+ * line break in the input (CRLF, CR, LF, LS, PS) becomes LF in the output.
+ *
+ * @example
+ *     |        hello
+ *     |          world
+ *     |        foo bar
+ *   becomes
+ *     | hello
+ *     |   world
+ *     | foo bar
+ *
+ * @param {string} str String prior to newline-normalization and escape parsing.
+ * @returns {[string, number]} The indentation-stripped string and the number
+ *                             of whitespace characters removed.
+ */
+function stripIndentation(str) {
+  if (str === '') {
+    return ['', 0];
+  }
+  // Note: We have to check all newline characters, as the string is not normalized, yet.
+  const lines = str.split(newLineRegEx);
+  const n = lines.length;
+  const hasTrailingLineBreak = newLineRegEx.test(str[str.length - 1]); // only the very last character is inspected
+  if (hasTrailingLineBreak) {
+    // Shortcut:
+    // If there is a trailing line break, it means that ``` is on a new line and
+    // therefore the indentation to remove is 0.
+    // Remove the last newline, which may be CRLF (split() left an empty last entry for it).
+    return [lines.slice(0, -1).join('\n'), 0];
+  }
+  const min = lines.reduce((min, line, index) => { // inner min is the running minimum and shadows the result name
+    // Note: Last line is the line containing ```.  There, we always count the indentation,
+    //       even if blank.  For all other lines, blank lines are ignored.
+    if (isWhiteSpaceOnly(line) && index !== (n-1))
+      return min;
+    let count = 0;
+    const length = Math.min(min, line.length); // never scan further than the current minimum
+    while (count < length && isWhitespaceCharacter(line[count])) {
+      count++;
+    }
+    return Math.min(min, count);
+  }, Number.MAX_SAFE_INTEGER);
+  for (let i = 0; i < n; ++i) {
+    // Note: Line may be empty and have fewer characters than `min`.
+    //       In that case, slice() returns an empty string.
+    lines[i] = lines[i].slice(min);
+  }
+  // Remove trailing last line, if there was nothing else in that line.
+  if (lines[n-1] === '')
+    lines.pop();
+  return [lines.join('\n'), min];
+}
+class MultiLineStringParser { // Parses the text of one back-tick string token (simple string or text block) into its string value
+  constructor(antlrParser, token) { // antlrParser: supplies message() and filename; token: supplies text, line and column
+    this.parser = antlrParser; // for message functions
+    this.token = token;
+    this.str = token.text; // Copy because .text is a getter
+    if (this.str[0] !== '`' || this.str[this.str.length-1] !== '`') {
+      throw new Error('Invalid multi-line string sequence: Require string to be surrounded by back-ticks!');
+    }
+    this.output = []; // collected output fragments, joined at the end of parse()
+    this.isTextBlock = this.str.startsWith('```');
+    this._indentation = 0; // number of stripped indentation characters, set by parse() for text blocks
+    // For message locations
+    this._lineInString = 0; // number of LF line breaks consumed so far
+    this._currentLineBreakIndex = 0; // cursor index of the most recently consumed LF
+    if (this.isTextBlock) {
+      this.i = 3; // cursor starts after the three opening back-ticks
+      this.end = this.str.length - 3; // index of the first closing back-tick
+    } else {
+      this.i = 1; // cursor starts after the single opening back-tick
+      this.end = this.str.length - 1; // index of the closing back-tick
+    }
+  }
+  /**
+   * Parse the token's text and return it.
+   *
+   * Steps:
+   *  1. A token of length 2 (two back-ticks) is the empty string.
+   *  2. For text blocks, a token without any line break is rejected with
+   *     `syntax-invalid-text-block` and `''` is returned.  Otherwise the first
+   *     line (optional language identifier) is skipped and the indentation is
+   *     stripped; `this.str`, the cursor and the end position are replaced by
+   *     values relative to the stripped string.
+   *  3. The remaining characters are copied to the output.  Every unescaped
+   *     line break is emitted as `\n`, a backslash starts an escape sequence,
+   *     and an unescaped `${` is reported via `syntax-missing-escape` while the
+   *     `$` is still copied to the output.
+   *
+   * Note: The case expressions calling `_matchLineBreakAtCurrentChar()` have
+   * side effects (cursor and line counters); the order of the cases matters.
+   *
+   * @returns {string} The parsed string value.
+   */
+  parse() {
+    if (this.str.length === 2) {
+      return ''; // Nothing to do: ``
+    }
+    if (this.isTextBlock) {
+      // If there are no line breaks, emit an error as normal single-back-tick
+      // strings should be used instead.  Because the first line is skipped,
+      // there is no text without at least one line break.
+      if (!newLineRegEx.test(this.str)) {
+        const loc = this._locationForCharacters(this.end, 1);
+        this.parser.message('syntax-invalid-text-block', loc);
+        return '';
+      }
+      this._skipOptionalLanguageIdentifierLine();
+      // Indentation needs to be stripped _before_ escape sequences are parsed and
+      // _after_ the first line is skipped, because otherwise `\n` in the string
+      // will interfere with calculating indentation and the language identifier
+      // is not part of the actual string.
+      // Because of message locations, we still need to keep track of indentation count
+      // and need to update the cursor and end position as well as the currentLineBreakIndex.
+      const [ str, indent ] = stripIndentation(this.str.slice(this.i, -3));
+      this.str = str;
+      this._indentation = indent;
+      this.i = 0;
+      this.end = this.str.length;
+      // this._lineInString is > 0, but having this._currentLineBreakIndex = 0 would be incorrect,
+      // as the line break isn't the first character in the indentation-stripped string
+      this._currentLineBreakIndex = -1;
+    }
+    // Note: Index is at first character of string
+    do {
+      switch(this._current()) {
+        case this._matchLineBreakAtCurrentChar():
+          this.output.push('\n');
+          break;
+        case '\\':
+          this._move();
+          this._innerEscape();
+          break;
+        case '$':
+          if (this._lookahead() === '{') {
+            const loc = this._locationForCharacters(this.i, 2);
+            this.parser.message('syntax-missing-escape', loc,
+              { '#': 'placeholder', code: '${', newcode: '\\${' });
+          }
+          this.output.push(this.str[this.i]);
+          break;
+        default:
+          this.output.push(this.str[this.i]);
+          break;
+      }
+    } while(this._move());
+    return this.output.join('');
+  }
+  /**
+   * Parse the escape sequence after the first '\'.
+   *
+   * The cursor is expected to be on the character that follows the backslash.
+   * Handled sequences:
+   *  - line break: nothing is emitted (line continuation),
+   *  - `b`, `f`, `v`, `r`, `n`, `t`: the corresponding control character,
+   *  - backslash, double quote, single quote, back-tick, `$`: the character itself,
+   *  - `x`: two hexadecimal digits,
+   *  - `u`: either four hexadecimal digits or a braced code point,
+   *  - `0` not followed by a digit: the NUL character.
+   *
+   * Everything else is copied to the output unchanged and reported:
+   * `syntax-invalid-escape` for whitespace and for digits (octal),
+   * `syntax-unknown-escape` for any other character.
+   *
+   * @private
+   */
+  _innerEscape() {
+    switch(this._current()) {
+      case this._matchLineBreakAtCurrentChar():
+        // Don't add to output -> line break is escaped
+        break;
+      case 'b': // backspace
+        this.output.push(`\b`);
+        break;
+      case 'f': // form feed
+        this.output.push(`\f`);
+        break;
+      case 'v': // vertical tabulator
+        this.output.push(`\v`);
+        break;
+      case 'r': // carriage return
+        this.output.push(`\r`);
+        break;
+      case 'n': // line feed
+        this.output.push(`\n`);
+        break;
+      case 't': // tab
+        this.output.push(`\t`);
+        break;
+      case '\\':
+      case '"':
+      case '\'':
+      case '`':
+      case '$':
+        this.output.push(this._current());
+        break;
+      case 'x':
+        this._parseHexEscape('x', 2);
+        break;
+      case 'u':
+        if (this._lookahead() === '{')
+          this._parseBracedUnicodeEscape();
+        else
+          this._parseHexEscape('u', 4);
+        break;
+      case '0': // null terminator
+        if (!/^\d$/.test(this._lookahead())) {
+          this.output.push(`\0`);
+          break;
+        }
+        // Let the default case handle octal representation.
+        // fallthrough
+      default: {
+        this.output.push(this._current());
+        const loc = this._locationForCharacters(this.i-1, 2); // covers the backslash and the escaped character
+        if (/\s/.test(this._current())) {
+          this.parser.message('syntax-invalid-escape', loc, { '#': 'whitespace' });
+        } else if (/\d/.test(this._current())) {
+          this.parser.message('syntax-invalid-escape', loc, { '#': 'octal' });
+        } else {
+          const code = this._makeCode('\\' + this._current());
+          this.parser.message('syntax-unknown-escape', loc,  { '#': 'std', code });
+        }
+        break;
+      }
+    }
+  }
+  /**
+   * Parse the given hexadecimal string to a unicode code-point.
+   *
+   * On success the resulting character is appended to the output.  If the
+   * string is not a hexadecimal number or does not denote a valid code point,
+   * nothing is appended and `syntax-invalid-escape` (variant `codepoint`) is
+   * reported instead.
+   *
+   * @param {string} codePoint Code-point represented as hexadecimal string, e.g. 'ABCD'.
+   * @private
+   */
+  _parseHexCodePoint(codePoint) {
+    // Notes:
+    // It isn't possible to get an invalid code point with the \u0000
+    // syntax variant as the first invalid code point is \u{110000}
+    // and an empty `codePoint` is only possible with the braced variant.
+    const reportInvalidCodePoint = () => {
+      const code = this._makeCode(`\\u{${codePoint}}`);
+      const loc = this._locationForCharacters(this.i-codePoint.length, codePoint.length);
+      this.parser.message('syntax-invalid-escape', loc, { '#': 'codepoint', code });
+    };
+    const n = Number.parseInt(codePoint, 16);
+    if (Number.isNaN(n)) {
+      reportInvalidCodePoint();
+      return;
+    }
+    try {
+      this.output.push(String.fromCodePoint(n));
+    } catch (e) {
+      // RangeError is thrown if number isn't a valid code point
+      reportInvalidCodePoint();
+    }
+  }
+  /**
+   * Parse a hex escape-sequence.  Useful for unicode escapes and hex escapes.
+   * Cursor is at the `x`: `\x00`
+   *                         ^
+   * or at the `u`: `\u0000`
+   *                  ^
+   * Digits are consumed one at a time via lookahead, so the cursor ends up on
+   * the last hexadecimal digit that was read.  If fewer than `count` digits
+   * are found, `syntax-invalid-escape` (variant `hex-count`) is reported for
+   * the character following the cursor and nothing is appended to the output.
+   *
+   * @param {string} mode  Either `x` or `u`. Used for error messages.
+   * @param {number} count Number of expected hexadecimal numbers
+   * @private
+   */
+  _parseHexEscape(mode, count) {
+    let codePoint = '';
+    for (let j = 0; j < count; ++j) {
+      if (!this._eos() && /^[0-9A-Fa-f]$/.test(this._lookahead())) {
+        this._move();
+        codePoint += this._current();
+      } else {
+        break;
+      }
+    }
+    if (codePoint.length === count) {
+      this._parseHexCodePoint(codePoint);
+    } else {
+      const loc = this._locationForCharacters(this.i+1, 1);
+      const code = this._eos(this.i+1) ? `\\${mode}${codePoint}` : `\\${mode}${codePoint}${this._lookahead()}`;
+      this.parser.message('syntax-invalid-escape', loc,
+        { '#': 'hex-count', number: count, code: this._makeCode(code) });
+    }
+  }
+  /**
+   * Parse a unicode escape-sequence with braces.
+   * Cursor is at the `u`: `\u{0000}`
+   *                         ^
+   * Hexadecimal digits are collected until the closing brace.  On success the
+   * cursor ends up on the closing brace and the collected digits are handed to
+   * `_parseHexCodePoint()`.  Reported problems (all `syntax-invalid-escape`):
+   *  - variant `unicode-hex`: a character that is neither a hexadecimal digit
+   *    nor the closing brace was found before the end of the string,
+   *  - variant `unicode-brace`: the closing brace is missing.
+   *
+   * @private
+   */
+  _parseBracedUnicodeEscape() {
+    let codePoint = '';
+    this._move(); // 'u'
+    while (!this._eos()) {
+      if (/^[0-9A-Fa-f]$/.test(this._lookahead())) {
+        this._move();
+        codePoint += this._current();
+      } else if (this._lookahead() === '}') {
+        break;
+      } else if (!this._eos(this.i+1)) {
+        const loc = this._locationForCharacters(this.i+1, 1); // Point to the exact character
+        const code = this._makeCode(`\\u{${codePoint}${this._lookahead()}…}`);
+        this.parser.message('syntax-invalid-escape', loc, { '#': 'unicode-hex', code });
+        return;
+      } else {
+        break;
+      }
+    }
+    if (this._lookahead() === '}') {
+      this._move();
+      this._parseHexCodePoint(codePoint);
+    } else {
+      const loc = this._locationForCharacters(this.i, 1);
+      this.parser.message('syntax-invalid-escape', loc, { '#': 'unicode-brace' });
+    }
+  }
+  /**
+   * This function skips the language identifier, i.e. until the next line.
+   * After this function, the cursor will be at the character _after_ the newline.
+   *
+   * A backslash inside the skipped line is reported with
+   * `syntax-invalid-escape` (variant `language-identifier`) and then skipped
+   * like any other character.  If no line break is found, the loop stops at
+   * the end of the string.
+   *
+   * @private
+   */
+  _skipOptionalLanguageIdentifierLine() {
+    while(!this._eos()) {
+      switch (this._current()) {
+        case this._matchLineBreakAtCurrentChar():
+          this._move();
+          return;
+        case '\\': {
+          // Do not allow an escape in the language identifier. If at the line's end, users
+          // may expect the identifier to span more than the first line, which is _not_ the case.
+          const loc = this._locationForCharacters(this.i, 1);
+          this.parser.message('syntax-invalid-escape', loc, { '#': 'language-identifier' });
+          this._move();
+          break;
+        }
+        default:
+          this._move();
+          break;
+      }
+    }
+  }
+  /**
+   * Consume a line-break character.  Because CDS is close to JavaScript, we
+   * also support LS and PS.  This function also ensures that CRLF (`\r\n`) is
+   * recognized as a single character.
+   * We increase the line number for LF (`\n`) for correct message locations.
+   *
+   * This function returns the input character, so that it can be used
+   * in a switch-case.
+   *
+   * Side effects: For CRLF, the cursor is advanced onto the `\n`.  For LF
+   * (alone or as part of CRLF), the line counter is increased and the index
+   * of the line break is remembered.  A lone CR, LS and PS leave the line
+   * counter untouched.
+   *
+   * @returns {string|null} `\r` for CR and CRLF, the character itself for
+   *                        LF, LS and PS, and `null` if the current character
+   *                        is not a line break.
+   * @private
+   */
+  _matchLineBreakAtCurrentChar() {
+    // Only increase line number for \n, because ANTLR does the same
+    switch(this._current()) {
+      case '\r':
+        if (this._lookahead() === '\n') {
+          this._move(); // \r\n is normalized
+          this._lineInString++;
+          this._currentLineBreakIndex = this.i;
+        }
+        return '\r';
+      case '\n':
+        this._lineInString++;
+        this._currentLineBreakIndex = this.i;
+      // fallthrough
+      case '\u2028': // LS
+      case '\u2029': // PS
+        return this._current();
+    }
+    return null;
+  }
+  /**
+   * Move the cursor to the next character _if_ we're not at the end.
+   *
+   * The cursor never moves beyond `this.end`.
+   *
+   * @private
+   * @returns {boolean} `true` if we're not at the end
+   */
+  _move() {
+    if (this.i < this.end) { // Don't move past last char and `
+      ++this.i;
+    }
+    return this.i < this.end;
+  }
+  /**
+   * Returns `true` if we're at the end of the string
+   *
+   * @param {Number} [i=this.i] Index to check for EOS
+   * @private
+   * @returns {boolean} `true` if `i` is at or behind `this.end`.
+   */
+  _eos(i = this.i) {
+    // end-of-string -> char before `
+    return i >= this.end;
+  }
+  /**
+   * Get the next character without increasing the cursor.
+   * @note Does not check for `eos()`
+   *
+   * @private
+   * @returns {string} The character at `i+1`; `undefined` if that index is
+   *                   outside of the string.
+   */
+  _lookahead() {
+    return this.str[this.i+1];
+  }
+  /**
+   * Get the current character without increasing the cursor.
+   *
+   * @private
+   * @returns {string} The character at the cursor; `undefined` if the cursor
+   *                   is outside of the string.
+   */
+  _current() {
+    return this.str[this.i];
+  }
+  /**
+   * Get the previous character without decreasing the cursor.
+   *
+   * Note: Not called by any other method of this class.
+   *
+   * @private
+   * @returns {string}
+   */
+  _previous() {
+    return this.str[this.i-1];
+  }
+  /**
+   * Get message location for the given cursor position inside the string.
+   *
+   * The location always lies on a single line: the token's line plus the
+   * number of LF line breaks consumed so far.  On the token's first line, the
+   * column is derived from the token's column; on later lines, it is the
+   * distance to the last consumed LF plus the stripped indentation.
+   *
+   * @param {Number} i Cursor position
+   * @param {Number} width Width of the location
+   * @private
+   * @returns {CSN.Location}
+   */
+  _locationForCharacters(i, width) {
+    return {
+      file: this.parser.filename,
+      line: this.token.line + this._lineInString,
+      endLine: this.token.line + this._lineInString,
+      col: this._lineInString > 0 ? i - this._currentLineBreakIndex + this._indentation : this.token.column + i + 1,
+      endCol: this._lineInString > 0 ? i - this._currentLineBreakIndex + width + this._indentation :  this.token.column + i + width + 1,
+    };
+  }
+  /**
+   * For text messages, escape the given string for $(CODE).
+   * Escaping is required to avoid line breaks in compiler messages, e.g.
+   * if \u000<LF> is the code, the line-feed must be escaped.
+   *
+   * Every character listed in the function body is replaced by U+23CE.
+   *
+   * @param {string} code
+   * @returns {string} `code` with all line-breaking characters replaced.
+   * @private
+   */
+  _makeCode(code) {
+    // For characters that may be rendered as newline,
+    // see <https://www.unicode.org/reports/tr14/tr14-32.html>.
+    //
+    // Note: Unicode class `General_Category=Line_Separator` does not work for '\n'.
+    //
+    // U+000A: Line Feed (short: LF)
+    // U+000B: Vertical Tab (short: VT)
+    // U+000C: Form Feed (short: FF)
+    // U+000D: Carriage Return (short: CR)
+    // U+0085: Next Line (short: NEL)
+    // U+2028: Line Separator (short: LS)
+    // U+2029: Paragraph Separator (short: PS)
+    //
+    // For Visualization, see <https://en.wikipedia.org/wiki/Newline#Unicode>
+    //   U+23CE: ⏎
+    const newLineRegEx = /[\u{000A}\u{000B}\u{000C}\u{000D}\u{0085}\u{2028}\u{2029}]/ug; // local, global variant; shadows the module-level newLineRegEx
+    return code.replace(newLineRegEx, '\u{23CE}');
+  }
+}
+/**
+ * Parse a back-tick string and return it.  This includes escape
+ * sequences, newlines, etc.
+ *
+ * Does _not_ modify the token's text.
+ *
+ * Note: The function passes its own `this` to the string parser, which uses
+ * it for `message()` and `filename`.  It therefore has to be invoked with a
+ * suitable receiver (presumably the ANTLR parser instance - verify against
+ * the call site); a plain call without receiver does not provide these.
+ *
+ * @param {object} token Token whose `text` is surrounded by back-ticks.
+ * @returns {string} The parsed string value.
+ * @throws {Error} If the token's text is not surrounded by back-ticks.
+ */
+function parseMultiLineStringLiteral(token) {
+  const p = new MultiLineStringParser(this, token);
+  return p.parse();
+}
+module.exports = {
+  parseMultiLineStringLiteral,
+};