npm - eyeling - Versions diffs - 1.5.25 → 1.5.27 - Mend

eyeling 1.5.25 → 1.5.27

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (3)

package/eyeling.js CHANGED Viewed

@@ -280,8 +280,41 @@ function lex(inputText) {
       continue;
     }
-    // String literal
+    // String literal: short "..." or long """..."""
     if (c === '"') {
+      // Long string literal """ ... """
+      if (peek(1) === '"' && peek(2) === '"') {
+        i += 3; // consume opening """
+        const sChars = [];
+        let closed = false;
+        while (i < n) {
+          // closing delimiter?
+          if (peek() === '"' && peek(1) === '"' && peek(2) === '"') {
+            i += 3; // consume closing """
+            closed = true;
+            break;
+          }
+          let cc = chars[i];
+          i++;
+          if (cc === "\\") {
+            // Preserve escapes verbatim (same behavior as short strings)
+            if (i < n) {
+              const esc = chars[i];
+              i++;
+              sChars.push("\\");
+              sChars.push(esc);
+            }
+            continue;
+          }
+          sChars.push(cc);
+        }
+        if (!closed) throw new Error('Unterminated long string literal """..."""');
+        const s = '"""' + sChars.join("") + '"""';
+        tokens.push(new Token("Literal", s));
+        continue;
+      }
+      // Short string literal " ... "
       i++; // consume opening "
       const sChars = [];
       while (i < n) {
@@ -318,9 +351,47 @@ function lex(inputText) {
       continue;
     }
-    // Directives: @prefix, @base
+    // Directives: @prefix, @base (and language tags after string literals)
     if (c === "@") {
-      i++;
+      const prevTok = tokens.length ? tokens[tokens.length - 1] : null;
+      const prevWasQuotedLiteral =
+        prevTok &&
+        prevTok.typ === "Literal" &&
+        typeof prevTok.value === "string" &&
+        prevTok.value.startsWith('"');
+      i++; // consume '@'
+      if (prevWasQuotedLiteral) {
+        // N3 grammar production LANGTAG:
+        //   "@" [a-zA-Z]+ ("-" [a-zA-Z0-9]+)*
+        const tagChars = [];
+        let cc = peek();
+        if (cc === null || !/[A-Za-z]/.test(cc)) {
+          throw new Error("Invalid language tag (expected [A-Za-z] after '@')");
+        }
+        while ((cc = peek()) !== null && /[A-Za-z]/.test(cc)) {
+          tagChars.push(cc);
+          i++;
+        }
+        while (peek() === "-") {
+          tagChars.push("-");
+          i++; // consume '-'
+          const segChars = [];
+          while ((cc = peek()) !== null && /[A-Za-z0-9]/.test(cc)) {
+            segChars.push(cc);
+            i++;
+          }
+          if (!segChars.length) {
+            throw new Error("Invalid language tag (expected [A-Za-z0-9]+ after '-')");
+          }
+          tagChars.push(...segChars);
+        }
+        tokens.push(new Token("LangTag", tagChars.join("")));
+        continue;
+      }
+      // Otherwise, treat as a directive (@prefix, @base)
       const wordChars = [];
       let cc;
       while ((cc = peek()) !== null && /[A-Za-z]/.test(cc)) {
@@ -684,6 +755,23 @@ class Parser {
     if (typ === "Literal") {
       let s = val || "";
+      // Optional language tag: "..."@en, per N3 LANGTAG production.
+      if (this.peek().typ === "LangTag") {
+        // Only quoted string literals can carry a language tag.
+        if (!(s.startsWith('"') && s.endsWith('"'))) {
+          throw new Error("Language tag is only allowed on quoted string literals");
+        }
+        const langTok = this.next();
+        const lang = langTok.value || "";
+        s = `${s}@${lang}`;
+        // N3/Turtle: language tags and datatypes are mutually exclusive.
+        if (this.peek().typ === "HatHat") {
+          throw new Error("A literal cannot have both a language tag (@...) and a datatype (^^...)");
+        }
+      }
       if (this.peek().typ === "HatHat") {
         this.next();
         const dtTok = this.next();
@@ -1594,19 +1682,40 @@ function composeSubst(outer, delta) {
 // ============================================================================
 function literalParts(lit) {
+  // Split a literal into lexical form and datatype IRI (if any).
+  // Also strip an optional language tag from the lexical form:
+  //   "\"hello\"@en"  -> "\"hello\""
+  //   "\"hello\"@en^^<...>" is rejected earlier in the parser.
   const idx = lit.indexOf("^^");
+  let lex = lit;
+  let dt = null;
   if (idx >= 0) {
-    let lex = lit.slice(0, idx);
-    let dt = lit.slice(idx + 2).trim();
+    lex = lit.slice(0, idx);
+    dt = lit.slice(idx + 2).trim();
     if (dt.startsWith("<") && dt.endsWith(">")) {
       dt = dt.slice(1, -1);
     }
-    return [lex, dt];
   }
-  return [lit, null];
+  // Strip LANGTAG from the lexical form when present.
+  if (lex.length >= 2 && lex[0] === '"') {
+    const lastQuote = lex.lastIndexOf('"');
+    if (lastQuote > 0 && lastQuote < lex.length - 1 && lex[lastQuote + 1] === "@") {
+      const lang = lex.slice(lastQuote + 2);
+      if (/^[A-Za-z]+(?:-[A-Za-z0-9]+)*$/.test(lang)) {
+        lex = lex.slice(0, lastQuote + 1);
+      }
+    }
+  }
+  return [lex, dt];
 }
 function stripQuotes(lex) {
+  if (lex.length >= 6 && lex.startsWith('"""') && lex.endsWith('"""')) {
+    return lex.slice(3, -3);
+  }
   if (lex.length >= 2 && lex[0] === '"' && lex[lex.length - 1] === '"') {
     return lex.slice(1, -1);
   }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "eyeling",
-  "version": "1.5.25",
+  "version": "1.5.27",
   "description": "A minimal Notation3 (N3) reasoner in JavaScript.",
   "main": "./index.js",
   "keywords": [

package/test/api.test.js CHANGED Viewed

@@ -621,6 +621,21 @@ ${U('s')} ${U('p')} ${U('o')}. # another trailing comment
       mustOccurExactly(out, reD, 1, 'diamond subclass should not duplicate x type D');
     },
   },
+  {
+    name: '42 literals: language tags are accepted and preserved',
+    opt: { proofComments: false },
+    input: ` { ?s ${U('p')} ?o } => { ?s ${U('q')} ?o }. ${U('s')} ${U('p')} "colour"@en-GB.`,
+    expect: [new RegExp(`${EX}s>\\s+<${EX}q>\\s+"colour"@en-GB\\s*\\.`)],
+  },
+  {
+    name: '43 literals: long """...""" strings are accepted (with lang tag)',
+    opt: { proofComments: false },
+    input: ` { ?s ${U('p')} ?o } => { ?s ${U('q')} ?o }. ${U('s')} ${U('p')} """Hello
+world"""@en.`,
+    expect: [new RegExp(`${EX}s>\\s+<${EX}q>\\s+(?:"""Hello[\\s\\S]*?world"""@en|"Hello\\\\nworld"@en)\\s*\\.`)],
+  },
 ];
 let passed = 0;