npm - katex - Versions diffs - 0.10.0-rc → 0.10.2 - Mend

katex 0.10.0-rc → 0.10.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (144)

package/CHANGELOG.md +214 -126
package/README.md +18 -17
package/cli.js +5 -1
package/contrib/auto-render/README.md +1 -1
package/contrib/auto-render/auto-render.js +4 -1
package/contrib/auto-render/test/auto-render-spec.js +17 -0
package/contrib/copy-tex/README.md +8 -2
package/contrib/copy-tex/copy-tex.js +0 -1
package/contrib/copy-tex/copy-tex.webpack.js +6 -0
package/contrib/mathtex-script-type/README.md +10 -6
package/contrib/mhchem/README.md +19 -0
package/contrib/mhchem/mhchem.js +1695 -0
package/contrib/mhchem/mhchem.patch +235 -0
package/dist/README.md +18 -17
package/dist/contrib/auto-render.js +179 -161
package/dist/contrib/auto-render.min.js +1 -1
package/dist/contrib/auto-render.mjs +215 -0
package/dist/contrib/copy-tex.js +84 -62
package/dist/contrib/copy-tex.min.css +1 -1
package/dist/contrib/copy-tex.min.js +1 -1
package/dist/contrib/copy-tex.mjs +85 -0
package/dist/contrib/mathtex-script-type.js +17 -14
package/dist/contrib/mathtex-script-type.mjs +24 -0
package/dist/contrib/mhchem.js +3241 -0
package/dist/contrib/mhchem.min.js +1 -0
package/dist/contrib/mhchem.mjs +3109 -0
package/dist/fonts/KaTeX_AMS-Regular.ttf +0 -0
package/dist/fonts/KaTeX_AMS-Regular.woff +0 -0
package/dist/fonts/KaTeX_AMS-Regular.woff2 +0 -0
package/dist/fonts/KaTeX_Caligraphic-Bold.ttf +0 -0
package/dist/fonts/KaTeX_Caligraphic-Bold.woff +0 -0
package/dist/fonts/KaTeX_Caligraphic-Bold.woff2 +0 -0
package/dist/fonts/KaTeX_Caligraphic-Regular.ttf +0 -0
package/dist/fonts/KaTeX_Caligraphic-Regular.woff +0 -0
package/dist/fonts/KaTeX_Caligraphic-Regular.woff2 +0 -0
package/dist/fonts/KaTeX_Fraktur-Bold.ttf +0 -0
package/dist/fonts/KaTeX_Fraktur-Bold.woff +0 -0
package/dist/fonts/KaTeX_Fraktur-Bold.woff2 +0 -0
package/dist/fonts/KaTeX_Fraktur-Regular.ttf +0 -0
package/dist/fonts/KaTeX_Fraktur-Regular.woff +0 -0
package/dist/fonts/KaTeX_Fraktur-Regular.woff2 +0 -0
package/dist/fonts/KaTeX_Main-Bold.ttf +0 -0
package/dist/fonts/KaTeX_Main-Bold.woff +0 -0
package/dist/fonts/KaTeX_Main-Bold.woff2 +0 -0
package/dist/fonts/KaTeX_Main-BoldItalic.ttf +0 -0
package/dist/fonts/KaTeX_Main-BoldItalic.woff +0 -0
package/dist/fonts/KaTeX_Main-BoldItalic.woff2 +0 -0
package/dist/fonts/KaTeX_Main-Italic.ttf +0 -0
package/dist/fonts/KaTeX_Main-Italic.woff +0 -0
package/dist/fonts/KaTeX_Main-Italic.woff2 +0 -0
package/dist/fonts/KaTeX_Main-Regular.ttf +0 -0
package/dist/fonts/KaTeX_Main-Regular.woff +0 -0
package/dist/fonts/KaTeX_Main-Regular.woff2 +0 -0
package/dist/fonts/KaTeX_Math-BoldItalic.ttf +0 -0
package/dist/fonts/KaTeX_Math-BoldItalic.woff +0 -0
package/dist/fonts/KaTeX_Math-BoldItalic.woff2 +0 -0
package/dist/fonts/KaTeX_Math-Italic.ttf +0 -0
package/dist/fonts/KaTeX_Math-Italic.woff +0 -0
package/dist/fonts/KaTeX_Math-Italic.woff2 +0 -0
package/dist/fonts/KaTeX_SansSerif-Bold.ttf +0 -0
package/dist/fonts/KaTeX_SansSerif-Bold.woff +0 -0
package/dist/fonts/KaTeX_SansSerif-Bold.woff2 +0 -0
package/dist/fonts/KaTeX_SansSerif-Italic.ttf +0 -0
package/dist/fonts/KaTeX_SansSerif-Italic.woff +0 -0
package/dist/fonts/KaTeX_SansSerif-Italic.woff2 +0 -0
package/dist/fonts/KaTeX_SansSerif-Regular.ttf +0 -0
package/dist/fonts/KaTeX_SansSerif-Regular.woff +0 -0
package/dist/fonts/KaTeX_SansSerif-Regular.woff2 +0 -0
package/dist/fonts/KaTeX_Script-Regular.ttf +0 -0
package/dist/fonts/KaTeX_Script-Regular.woff +0 -0
package/dist/fonts/KaTeX_Script-Regular.woff2 +0 -0
package/dist/fonts/KaTeX_Size1-Regular.ttf +0 -0
package/dist/fonts/KaTeX_Size1-Regular.woff +0 -0
package/dist/fonts/KaTeX_Size1-Regular.woff2 +0 -0
package/dist/fonts/KaTeX_Size2-Regular.ttf +0 -0
package/dist/fonts/KaTeX_Size2-Regular.woff +0 -0
package/dist/fonts/KaTeX_Size2-Regular.woff2 +0 -0
package/dist/fonts/KaTeX_Size3-Regular.ttf +0 -0
package/dist/fonts/KaTeX_Size3-Regular.woff +0 -0
package/dist/fonts/KaTeX_Size3-Regular.woff2 +0 -0
package/dist/fonts/KaTeX_Size4-Regular.ttf +0 -0
package/dist/fonts/KaTeX_Size4-Regular.woff +0 -0
package/dist/fonts/KaTeX_Size4-Regular.woff2 +0 -0
package/dist/fonts/KaTeX_Typewriter-Regular.ttf +0 -0
package/dist/fonts/KaTeX_Typewriter-Regular.woff +0 -0
package/dist/fonts/KaTeX_Typewriter-Regular.woff2 +0 -0
package/dist/katex.css +24 -9
package/dist/katex.js +13295 -12413
package/dist/katex.min.css +1 -1
package/dist/katex.min.js +1 -1
package/dist/katex.mjs +13388 -11826
package/katex.js +1 -2
package/package.json +60 -48
package/src/Lexer.js +25 -25
package/src/MacroExpander.js +0 -1
package/src/Options.js +11 -75
package/src/Parser.js +231 -313
package/src/Settings.js +6 -0
package/src/buildCommon.js +140 -103
package/src/buildHTML.js +125 -121
package/src/buildMathML.js +14 -4
package/src/buildTree.js +16 -10
package/src/delimiter.js +4 -3
package/src/domTree.js +91 -44
package/src/environments/array.js +120 -7
package/src/fontMetrics.js +3 -2
package/src/functions/arrow.js +21 -7
package/src/functions/color.js +2 -37
package/src/functions/delimsizing.js +18 -11
package/src/functions/enclose.js +19 -4
package/src/functions/environment.js +35 -4
package/src/functions/font.js +1 -2
package/src/functions/genfrac.js +35 -20
package/src/functions/href.js +5 -3
package/src/functions/includegraphics.js +146 -0
package/src/functions/mclass.js +1 -0
package/src/functions/op.js +21 -32
package/src/functions/operatorname.js +1 -2
package/src/functions/ordgroup.js +4 -0
package/src/functions/phantom.js +7 -3
package/src/functions/rule.js +20 -9
package/src/functions/sizing.js +2 -4
package/src/functions/smash.js +5 -2
package/src/functions/sqrt.js +1 -4
package/src/functions/styling.js +0 -1
package/src/functions/supsub.js +6 -2
package/src/functions/symbolsOp.js +4 -0
package/src/functions/symbolsSpacing.js +29 -6
package/src/functions/tag.js +20 -4
package/src/functions/text.js +6 -4
package/src/functions/verb.js +16 -4
package/src/functions.js +2 -0
package/src/katex.less +35 -12
package/src/macros.js +161 -36
package/src/mathMLTree.js +17 -19
package/src/parseNode.js +27 -1
package/src/stretchy.js +3 -1
package/src/svgGeometry.js +1 -1
package/src/symbols.js +39 -17
package/src/tree.js +0 -4
package/src/types.js +4 -3
package/src/unicodeMake.js +1 -1
package/src/utils.js +1 -62
package/src/wide-character.js +2 -2

package/src/Parser.js (changed)

@@ -1,21 +1,20 @@
 // @flow
 /* eslint no-constant-condition:0 */
 import functions from "./functions";
-import environments from "./environments";
-import MacroExpander from "./MacroExpander";
+import MacroExpander, {implicitCommands} from "./MacroExpander";
 import symbols, {ATOMS, extraLatin} from "./symbols";
 import {validUnit} from "./units";
 import {supportedCodepoint} from "./unicodeScripts";
 import unicodeAccents from "./unicodeAccents";
 import unicodeSymbols from "./unicodeSymbols";
 import utils from "./utils";
-import {assertNodeType, checkNodeType} from "./parseNode";
+import {checkNodeType} from "./parseNode";
 import ParseError from "./ParseError";
-import {combiningDiacriticalMarksEndRegex, urlFunctionRegex} from "./Lexer";
+import {combiningDiacriticalMarksEndRegex} from "./Lexer";
 import Settings from "./Settings";
 import SourceLocation from "./SourceLocation";
 import {Token} from "./Token";
-import type {AnyParseNode, SymbolParseNode} from "./parseNode";
+import type {ParseNode, AnyParseNode, SymbolParseNode} from "./parseNode";
 import type {Atom, Group} from "./symbols";
 import type {Mode, ArgType, BreakToken} from "./types";
 import type {FunctionContext, FunctionSpec} from "./defineFunction";
@@ -48,33 +47,9 @@ import type {EnvSpec} from "./defineEnvironment";
  * There are also extra `.handle...` functions, which pull out some reused
  * functionality into self-contained functions.
  *
- * The earlier functions return ParseNodes.
- * The later functions (which are called deeper in the parse) sometimes return
- * ParsedFuncOrArg, which contain a ParseNode as well as some data about
- * whether the parsed object is a function which is missing some arguments, or a
- * standalone object which can be used as an argument to another function.
+ * The functions return ParseNodes.
  */
-type ParsedFunc = {|
-    type: "fn",
-    result: string, // Function name defined via defineFunction (e.g. "\\frac").
-    token: Token,
-|};
-type ParsedArg = {|
-    type: "arg",
-    result: AnyParseNode,
-    token: Token,
-|};
-type ParsedFuncOrArg = ParsedFunc | ParsedArg;
-function newArgument(result: AnyParseNode, token: Token): ParsedArg {
-    return {type: "arg", result, token};
-}
-function newFunction(token: Token): ParsedFunc {
-    return {type: "fn", result: token.text, token};
-}
 export default class Parser {
     mode: Mode;
     gullet: MacroExpander;
@@ -153,7 +128,13 @@ export default class Parser {
         return parse;
     }
-    static endOfExpression = ["}", "\\end", "\\right", "&"];
+    static endOfExpression = ["}", "\\endgroup", "\\end", "\\right", "&"];
+    static endOfGroup = {
+        "[": "]",
+        "{": "}",
+        "\\begingroup": "\\endgroup",
+    }
     /**
      * Parses an "expression", which is a list of atoms.
@@ -190,12 +171,6 @@ export default class Parser {
             }
             const atom = this.parseAtom(breakOnTokenText);
             if (!atom) {
-                if (!this.settings.throwOnError && lex.text[0] === "\\") {
-                    const errorNode = this.handleUnsupportedCmd();
-                    body.push(errorNode);
-                    continue;
-                }
                 break;
             }
             body.push(atom);
@@ -275,33 +250,16 @@ export default class Parser {
         const symbol = symbolToken.text;
         this.consume();
         this.consumeSpaces(); // ignore spaces before sup/subscript argument
-        const group = this.parseGroup();
+        const group = this.parseGroup(name, false, Parser.SUPSUB_GREEDINESS);
         if (!group) {
-            if (!this.settings.throwOnError && this.nextToken.text[0] === "\\") {
-                return this.handleUnsupportedCmd();
-            } else {
-                throw new ParseError(
-                    "Expected group after '" + symbol + "'",
-                    symbolToken
-                );
-            }
+            throw new ParseError(
+                "Expected group after '" + symbol + "'",
+                symbolToken
+            );
         }
-        if (group.type === "fn") {
-            // ^ and _ have a greediness, so handle interactions with functions'
-            // greediness
-            const funcGreediness = functions[group.result].greediness;
-            if (funcGreediness > Parser.SUPSUB_GREEDINESS) {
-                return this.parseGivenFunction(group);
-            } else {
-                throw new ParseError(
-                    "Got function '" + group.result + "' with no arguments " +
-                        "as " + name, symbolToken);
-            }
-        } else {
-            return group.result;
-        }
+        return group;
     }
     /**
@@ -339,7 +297,7 @@ export default class Parser {
     parseAtom(breakOnTokenText?: BreakToken): ?AnyParseNode {
         // The body of an atom is an implicit group, so that things like
         // \left(x\right)^2 work correctly.
-        const base = this.parseImplicitGroup(breakOnTokenText);
+        const base = this.parseGroup("atom", false, null, breakOnTokenText);
         // In text mode, we don't have superscripts or subscripts
         if (this.mode === "text") {
@@ -429,115 +387,49 @@ export default class Parser {
     }
     /**
-     * Parses an implicit group, which is a group that starts at the end of a
-     * specified, and ends right before a higher explicit group ends, or at EOL. It
-     * is used for functions that appear to affect the current style, like \Large or
-     * \textrm, where instead of keeping a style we just pretend that there is an
-     * implicit grouping after it until the end of the group. E.g.
-     *   small text {\Large large text} small text again
+     * Parses an entire function, including its base and all of its arguments.
      */
-    parseImplicitGroup(breakOnTokenText?: BreakToken): ?AnyParseNode {
-        const start = this.parseSymbol();
-        if (start == null) {
-            // If we didn't get anything we handle, fall back to parseFunction
-            return this.parseFunction();
-        } else if (start.type === "arg") {
-            // Defer to parseGivenFunction if it's not a function we handle
-            return this.parseGivenFunction(start);
+    parseFunction(
+        breakOnTokenText?: BreakToken,
+        name?: string, // For error reporting.
+        greediness?: ?number,
+    ): ?AnyParseNode {
+        const token = this.nextToken;
+        const func = token.text;
+        const funcData = functions[func];
+        if (!funcData) {
+            return null;
         }
-        const func = start.result;
-        if (func === "\\begin") {
-            // begin...end is similar to left...right
-            const begin =
-                assertNodeType(this.parseGivenFunction(start), "environment");
-            const envName = begin.name;
-            if (!environments.hasOwnProperty(envName)) {
-                throw new ParseError(
-                    "No such environment: " + envName, begin.nameGroup);
-            }
-            // Build the environment object. Arguments and other information will
-            // be made available to the begin and end methods using properties.
-            const env = environments[envName];
-            const {args, optArgs} =
-                this.parseArguments("\\begin{" + envName + "}", env);
-            const context = {
-                mode: this.mode,
-                envName: envName,
-                parser: this,
-            };
-            const result = env.handler(context, args, optArgs);
-            this.expect("\\end", false);
-            const endNameToken = this.nextToken;
-            let end = this.parseFunction();
-            if (!end) {
-                throw new ParseError("failed to parse function after \\end");
-            }
-            end = assertNodeType(end, "environment");
-            if (end.name !== envName) {
-                throw new ParseError(
-                    `Mismatch: \\begin{${envName}} matched by \\end{${end.name}}`,
-                    endNameToken);
-            }
-            return result;
-        } else {
-            // Defer to parseGivenFunction if it's not a function we handle
-            return this.parseGivenFunction(start, breakOnTokenText);
+        if (greediness != null && funcData.greediness <= greediness) {
+            throw new ParseError(
+                "Got function '" + func + "' with no arguments" +
+                (name ? " as " + name : ""), token);
+        } else if (this.mode === "text" && !funcData.allowedInText) {
+            throw new ParseError(
+                "Can't use function '" + func + "' in text mode", token);
+        } else if (this.mode === "math" && funcData.allowedInMath === false) {
+            throw new ParseError(
+                "Can't use function '" + func + "' in math mode", token);
         }
-    }
-    /**
-     * Parses an entire function, including its base and all of its arguments.
-     * It also handles the case where the parsed node is not a function.
-     */
-    parseFunction(): ?AnyParseNode {
-        const baseGroup = this.parseGroup();
-        return baseGroup ? this.parseGivenFunction(baseGroup) : null;
-    }
-    /**
-     * Same as parseFunction(), except that the base is provided, guaranteeing a
-     * non-nullable result.
-     */
-    parseGivenFunction(
-        baseGroup: ParsedFuncOrArg,
-        breakOnTokenText?: BreakToken,
-    ): AnyParseNode {
-        if (baseGroup.type === "fn") {
-            const func = baseGroup.result;
-            const funcData = functions[func];
-            if (this.mode === "text" && !funcData.allowedInText) {
-                throw new ParseError(
-                    "Can't use function '" + func + "' in text mode",
-                    baseGroup.token);
-            } else if (this.mode === "math" &&
-                funcData.allowedInMath === false) {
-                throw new ParseError(
-                    "Can't use function '" + func + "' in math mode",
-                    baseGroup.token);
-            }
+        // hyperref package sets the catcode of % as an active character
+        if (funcData.argTypes && funcData.argTypes[0] === "url") {
+            this.gullet.lexer.setCatcode("%", 13);
+        }
-            // Consume the command token after possibly switching to the
-            // mode specified by the function (for instant mode switching),
-            // and then immediately switch back.
-            if (funcData.consumeMode) {
-                const oldMode = this.mode;
-                this.switchMode(funcData.consumeMode);
-                this.consume();
-                this.switchMode(oldMode);
-            } else {
-                this.consume();
-            }
-            const {args, optArgs} = this.parseArguments(func, funcData);
-            const token = baseGroup.token;
-            return this.callFunction(
-                func, args, optArgs, token, breakOnTokenText);
+        // Consume the command token after possibly switching to the
+        // mode specified by the function (for instant mode switching),
+        // and then immediately switch back.
+        if (funcData.consumeMode) {
+            const oldMode = this.mode;
+            this.switchMode(funcData.consumeMode);
+            this.consume();
+            this.switchMode(oldMode);
         } else {
-            return baseGroup.result;
+            this.consume();
         }
+        const {args, optArgs} = this.parseArguments(func, funcData);
+        return this.callFunction(func, args, optArgs, token, breakOnTokenText);
     }
     /**
@@ -603,37 +495,17 @@ export default class Parser {
                 this.consumeSpaces();
             }
             const nextToken = this.nextToken;
-            let arg = argType ?
-                this.parseGroupOfType(argType, isOptional) :
-                this.parseGroup(isOptional);
+            const arg = this.parseGroupOfType("argument to '" + func + "'",
+                argType, isOptional, baseGreediness);
             if (!arg) {
                 if (isOptional) {
                     optArgs.push(null);
                     continue;
                 }
-                if (!this.settings.throwOnError &&
-                    this.nextToken.text[0] === "\\") {
-                    arg = newArgument(this.handleUnsupportedCmd(), nextToken);
-                } else {
-                    throw new ParseError(
-                        "Expected group after '" + func + "'", nextToken);
-                }
-            }
-            let argNode: AnyParseNode;
-            if (arg.type === "fn") {
-                const argGreediness =
-                    functions[arg.result].greediness;
-                if (argGreediness > baseGreediness) {
-                    argNode = this.parseGivenFunction(arg);
-                } else {
-                    throw new ParseError(
-                        "Got function '" + arg.result + "' as " +
-                        "argument to '" + func + "'", nextToken);
-                }
-            } else {
-                argNode = arg.result;
+                throw new ParseError(
+                    "Expected group after '" + func + "'", nextToken);
             }
-            (isOptional ? optArgs : args).push(argNode);
+            (isOptional ? optArgs : args).push(arg);
         }
         return {args, optArgs};
@@ -643,29 +515,44 @@ export default class Parser {
      * Parses a group when the mode is changing.
      */
     parseGroupOfType(
-        type: ArgType,  // Used to describe the mode in error messages.
+        name: string,
+        type: ?ArgType,
         optional: boolean,
-    ): ?ParsedFuncOrArg {
-        // Handle `original` argTypes
-        if (type === "original") {
-            type = this.mode;
-        }
-        if (type === "color") {
-            return this.parseColorGroup(optional);
-        }
-        if (type === "size") {
-            return this.parseSizeGroup(optional);
-        }
-        if (type === "url") {
-            throw new ParseError(
-                "Internal bug: 'url' arguments should be handled by Lexer",
-                this.nextToken);
+        greediness: ?number,
+    ): ?AnyParseNode {
+        switch (type) {
+            case "color":
+                return this.parseColorGroup(optional);
+            case "size":
+                return this.parseSizeGroup(optional);
+            case "url":
+                return this.parseUrlGroup(optional);
+            case "math":
+            case "text":
+                return this.parseGroup(name, optional, greediness, undefined, type);
+            case "raw": {
+                if (optional && this.nextToken.text === "{") {
+                    return null;
+                }
+                const token = this.parseStringGroup("raw", optional, true);
+                if (token) {
+                    return {
+                        type: "raw",
+                        mode: "text",
+                        string: token.text,
+                    };
+                } else {
+                    throw new ParseError("Expected raw group", this.nextToken);
+                }
+            }
+            case "original":
+            case null:
+            case undefined:
+                return this.parseGroup(name, optional, greediness);
+            default:
+                throw new ParseError(
+                    "Unknown group type as " + name, this.nextToken);
         }
-        // By the time we get here, type is one of "text" or "math".
-        // Specify this as mode to parseGroup.
-        return this.parseGroup(optional, type);
     }
     consumeSpaces() {
@@ -681,28 +568,49 @@ export default class Parser {
     parseStringGroup(
         modeName: ArgType,  // Used to describe the mode in error messages.
         optional: boolean,
+        raw?: boolean,
     ): ?Token {
-        if (optional && this.nextToken.text !== "[") {
-            return null;
+        const groupBegin = optional ? "[" : "{";
+        const groupEnd = optional ? "]" : "}";
+        const nextToken = this.nextToken;
+        if (nextToken.text !== groupBegin) {
+            if (optional) {
+                return null;
+            } else if (raw && nextToken.text !== "EOF" &&
+                    /[^{}[\]]/.test(nextToken.text)) {
+                // allow a single character in raw string group
+                this.gullet.lexer.setCatcode("%", 14); // reset the catcode of %
+                this.consume();
+                return nextToken;
+            }
         }
         const outerMode = this.mode;
         this.mode = "text";
-        this.expect(optional ? "[" : "{");
+        this.expect(groupBegin);
         let str = "";
         const firstToken = this.nextToken;
+        let nested = 0; // allow nested braces in raw string group
         let lastToken = firstToken;
-        while (this.nextToken.text !== (optional ? "]" : "}")) {
-            if (this.nextToken.text === "EOF") {
-                throw new ParseError(
-                    "Unexpected end of input in " + modeName,
-                    firstToken.range(this.nextToken, str));
+        while ((raw && nested > 0) || this.nextToken.text !== groupEnd) {
+            switch (this.nextToken.text) {
+                case "EOF":
+                    throw new ParseError(
+                        "Unexpected end of input in " + modeName,
+                        firstToken.range(lastToken, str));
+                case groupBegin:
+                    nested++;
+                    break;
+                case groupEnd:
+                    nested--;
+                    break;
             }
             lastToken = this.nextToken;
             str += lastToken.text;
             this.consume();
         }
         this.mode = outerMode;
-        this.expect(optional ? "]" : "}");
+        this.gullet.lexer.setCatcode("%", 14); // reset the catcode of %
+        this.expect(groupEnd);
         return firstToken.range(lastToken, str);
     }
@@ -720,8 +628,8 @@ export default class Parser {
         const firstToken = this.nextToken;
         let lastToken = firstToken;
         let str = "";
-        while (this.nextToken.text !== "EOF"
-            && regex.test(str + this.nextToken.text)) {
+        while (this.nextToken.text !== "EOF" &&
+                regex.test(str + this.nextToken.text)) {
             lastToken = this.nextToken;
             str += lastToken.text;
             this.consume();
@@ -738,26 +646,33 @@ export default class Parser {
     /**
      * Parses a color description.
      */
-    parseColorGroup(optional: boolean): ?ParsedArg {
+    parseColorGroup(optional: boolean): ?ParseNode<"color-token"> {
         const res = this.parseStringGroup("color", optional);
         if (!res) {
             return null;
         }
-        const match = (/^(#[a-f0-9]{3}|#[a-f0-9]{6}|[a-z]+)$/i).exec(res.text);
+        const match = (/^(#[a-f0-9]{3}|#?[a-f0-9]{6}|[a-z]+)$/i).exec(res.text);
         if (!match) {
             throw new ParseError("Invalid color: '" + res.text + "'", res);
         }
-        return newArgument({
+        let color = match[0];
+        if (/^[0-9a-f]{6}$/i.test(color)) {
+            // We allow a 6-digit HTML color spec without a leading "#".
+            // This follows the xcolor package's HTML color model.
+            // Predefined color names are all missed by this RegEx pattern.
+            color = "#" + color;
+        }
+        return {
             type: "color-token",
             mode: this.mode,
-            color: match[0],
-        }, res);
+            color,
+        };
     }
     /**
      * Parses a size specification, consisting of magnitude and unit.
      */
-    parseSizeGroup(optional: boolean): ?ParsedArg {
+    parseSizeGroup(optional: boolean): ?ParseNode<"size"> {
         let res;
         let isBlank = false;
         if (!optional && this.nextToken.text !== "{") {
@@ -787,64 +702,120 @@ export default class Parser {
         if (!validUnit(data)) {
             throw new ParseError("Invalid unit: '" + data.unit + "'", res);
         }
-        return newArgument({
+        return {
             type: "size",
             mode: this.mode,
             value: data,
             isBlank,
-        }, res);
+        };
+    }
+    /**
+     * Parses an URL, checking escaped letters and allowed protocols.
+     */
+    parseUrlGroup(optional: boolean): ?ParseNode<"url"> {
+        const res = this.parseStringGroup("url", optional, true); // get raw string
+        if (!res) {
+            return null;
+        }
+        // hyperref package allows backslashes alone in href, but doesn't
+        // generate valid links in such cases; we interpret this as
+        // "undefined" behaviour, and keep them as-is. Some browser will
+        // replace backslashes with forward slashes.
+        const url = res.text.replace(/\\([#$%&~_^{}])/g, '$1');
+        let protocol = /^\s*([^\\/#]*?)(?::|&#0*58|&#x0*3a)/i.exec(url);
+        protocol = (protocol != null ? protocol[1] : "_relative");
+        const allowed = this.settings.allowedProtocols;
+        if (!utils.contains(allowed,  "*") &&
+            !utils.contains(allowed, protocol)) {
+            throw new ParseError(
+                `Forbidden protocol '${protocol}'`, res);
+        }
+        return {
+            type: "url",
+            mode: this.mode,
+            url,
+        };
     }
     /**
      * If `optional` is false or absent, this parses an ordinary group,
      * which is either a single nucleus (like "x") or an expression
-     * in braces (like "{x+y}").
+     * in braces (like "{x+y}") or an implicit group, a group that starts
+     * at the current position, and ends right before a higher explicit
+     * group ends, or at EOF.
      * If `optional` is true, it parses either a bracket-delimited expression
      * (like "[x+y]") or returns null to indicate the absence of a
      * bracket-enclosed group.
      * If `mode` is present, switches to that mode while parsing the group,
      * and switches back after.
      */
-    parseGroup(optional?: boolean, mode?: Mode): ?ParsedFuncOrArg {
+    parseGroup(
+        name: string, // For error reporting.
+        optional?: boolean,
+        greediness?: ?number,
+        breakOnTokenText?: BreakToken,
+        mode?: Mode,
+    ): ?AnyParseNode {
         const outerMode = this.mode;
         const firstToken = this.nextToken;
-        // Try to parse an open brace
-        if (this.nextToken.text === (optional ? "[" : "{")) {
-            // Switch to specified mode before we expand symbol after brace
-            if (mode) {
-                this.switchMode(mode);
-            }
+        const text = firstToken.text;
+        // Switch to specified mode
+        if (mode) {
+            this.switchMode(mode);
+        }
+        let groupEnd;
+        let result;
+        // Try to parse an open brace or \begingroup
+        if (optional ? text === "["  : text === "{" || text === "\\begingroup") {
+            groupEnd = Parser.endOfGroup[text];
             // Start a new group namespace
             this.gullet.beginGroup();
             // If we get a brace, parse an expression
             this.consume();
-            const expression = this.parseExpression(false, optional ? "]" : "}");
+            const expression = this.parseExpression(false, groupEnd);
             const lastToken = this.nextToken;
-            // Switch mode back before consuming symbol after close brace
-            if (mode) {
-                this.switchMode(outerMode);
-            }
             // End group namespace before consuming symbol after close brace
             this.gullet.endGroup();
-            // Make sure we get a close brace
-            this.expect(optional ? "]" : "}");
-            return newArgument({
+            result = {
                 type: "ordgroup",
                 mode: this.mode,
                 loc: SourceLocation.range(firstToken, lastToken),
                 body: expression,
-            }, firstToken.range(lastToken, firstToken.text));
+                // A group formed by \begingroup...\endgroup is a semi-simple group
+                // which doesn't affect spacing in math mode, i.e., is transparent.
+                // https://tex.stackexchange.com/questions/1930/when-should-one-
+                // use-begingroup-instead-of-bgroup
+                semisimple: text === "\\begingroup" || undefined,
+            };
+        } else if (optional) {
+            // Return nothing for an optional group
+            result = null;
         } else {
-            // Otherwise, just return a nucleus, or nothing for an optional group
-            if (mode) {
-                this.switchMode(mode);
-            }
-            const result = optional ? null : this.parseSymbol();
-            if (mode) {
-                this.switchMode(outerMode);
+            // If there exists a function with this name, parse the function.
+            // Otherwise, just return a nucleus
+            result = this.parseFunction(breakOnTokenText, name, greediness) ||
+                this.parseSymbol();
+            if (result == null && text[0] === "\\" &&
+                    !implicitCommands.hasOwnProperty(text)) {
+                if (this.settings.throwOnError) {
+                    throw new ParseError(
+                        "Undefined control sequence: " + text, firstToken);
+                }
+                result = this.handleUnsupportedCmd();
             }
-            return result;
         }
+        // Switch mode back
+        if (mode) {
+            this.switchMode(outerMode);
+        }
+        // Make sure we got a close brace
+        if (groupEnd) {
+            this.expect(groupEnd);
+        }
+        return result;
     }
     /**
@@ -893,67 +864,14 @@ export default class Parser {
     }
     /**
-     * Parse a single symbol out of the string. Here, we handle both the functions
-     * we have defined, as well as the single character symbols
+     * Parse a single symbol out of the string. Here, we handle single character
+     * symbols and special functions like verbatim
      */
-    parseSymbol(): ?ParsedFuncOrArg {
+    parseSymbol(): ?AnyParseNode {
         const nucleus = this.nextToken;
         let text = nucleus.text;
-        if (functions[text]) {
-            // If there exists a function with this name, we return the
-            // function and say that it is a function.
-            // The token will be consumed later in parseGivenFunction
-            // (after possibly switching modes).
-            return newFunction(nucleus);
-        } else if (/^\\(href|url)[^a-zA-Z]/.test(text)) {
-            const match = text.match(urlFunctionRegex);
-            if (!match) {
-                throw new ParseError(
-                    `Internal error: invalid URL token '${text}'`, nucleus);
-            }
-            const funcName = match[1];
-            // match[2] is the only one that can be an empty string,
-            // so it must be at the end of the following or chain:
-            const rawUrl = match[4] || match[3] || match[2];
-            // hyperref package allows backslashes alone in href, but doesn't
-            // generate valid links in such cases; we interpret this as
-            // "undefined" behaviour, and keep them as-is. Some browser will
-            // replace backslashes with forward slashes.
-            const url = rawUrl.replace(/\\([#$%&~_^{}])/g, '$1');
-            let protocol = /^\s*([^\\/#]*?)(?::|&#0*58|&#x0*3a)/i.exec(url);
-            protocol = (protocol != null ? protocol[1] : "_relative");
-            const allowed = this.settings.allowedProtocols;
-            if (!utils.contains(allowed,  "*") &&
-                !utils.contains(allowed, protocol)) {
-                throw new ParseError(
-                    `Forbidden protocol '${protocol}' in ${funcName}`, nucleus);
-            }
-            const urlArg = {
-                type: "url",
-                mode: this.mode,
-                url,
-            };
-            this.consume();
-            if (funcName === "\\href") {  // two arguments
-                this.consumeSpaces();  // ignore spaces between arguments
-                let description = this.parseGroupOfType("original", false);
-                if (description == null) {
-                    throw new ParseError(`${funcName} missing second argument`,
-                        nucleus);
-                }
-                if (description.type === "fn") {
-                    description = this.parseGivenFunction(description);
-                } else { // arg.type === "arg"
-                    description = description.result;
-                }
-                return newArgument(this.callFunction(
-                    funcName, [urlArg, description], []), nucleus);
-            } else {  // one argument (\url)
-                return newArgument(this.callFunction(
-                    funcName, [urlArg], []), nucleus);
-            }
-        } else if (/^\\verb[^a-zA-Z]/.test(text)) {
+        if (/^\\verb[^a-zA-Z]/.test(text)) {
             this.consume();
             let arg = text.slice(5);
             const star = (arg.charAt(0) === "*");
@@ -967,12 +885,12 @@ export default class Parser {
                     please report what input caused this bug`);
             }
             arg = arg.slice(1, -1);  // remove first and last char
-            return newArgument({
+            return {
                 type: "verb",
                 mode: "text",
                 body: arg,
                 star,
-            }, nucleus);
+            };
         }
         // At this point, we should have a symbol, possibly with accents.
         // First expand any accented base symbol according to unicodeSymbols.
@@ -1074,6 +992,6 @@ export default class Parser {
                 };
             }
         }
-        return newArgument(symbol, nucleus);
+        return symbol;
     }
 }