npm - @herb-tools/node - Versions diffs - 0.1.0 - Mend

@herb-tools/node 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (131) hide show

package/CHANGELOG.md +3 -0
package/README.md +9 -0
package/binding.gyp +98 -0
package/dist/herb-node.cjs +20 -0
package/dist/herb-node.cjs.map +1 -0
package/dist/herb-node.esm.js +33 -0
package/dist/herb-node.esm.js.map +1 -0
package/dist/types/index-cjs.d.cts +1 -0
package/dist/types/index-esm.d.mts +8 -0
package/dist/types/node-backend.d.ts +4 -0
package/dist/types/util.d.ts +2 -0
package/extension/error_helpers.cpp +340 -0
package/extension/error_helpers.h +26 -0
package/extension/extension_helpers.cpp +206 -0
package/extension/extension_helpers.h +22 -0
package/extension/herb.cpp +232 -0
package/extension/libherb/analyze.c +989 -0
package/extension/libherb/analyze_helpers.c +241 -0
package/extension/libherb/analyzed_ruby.c +35 -0
package/extension/libherb/array.c +137 -0
package/extension/libherb/ast_node.c +81 -0
package/extension/libherb/ast_nodes.c +866 -0
package/extension/libherb/ast_pretty_print.c +588 -0
package/extension/libherb/buffer.c +199 -0
package/extension/libherb/errors.c +740 -0
package/extension/libherb/extract.c +110 -0
package/extension/libherb/herb.c +103 -0
package/extension/libherb/html_util.c +143 -0
package/extension/libherb/include/analyze.h +36 -0
package/extension/libherb/include/analyze_helpers.h +43 -0
package/extension/libherb/include/analyzed_ruby.h +33 -0
package/extension/libherb/include/array.h +33 -0
package/extension/libherb/include/ast_node.h +35 -0
package/extension/libherb/include/ast_nodes.h +303 -0
package/extension/libherb/include/ast_pretty_print.h +17 -0
package/extension/libherb/include/buffer.h +36 -0
package/extension/libherb/include/errors.h +125 -0
package/extension/libherb/include/extract.h +20 -0
package/extension/libherb/include/herb.h +32 -0
package/extension/libherb/include/html_util.h +13 -0
package/extension/libherb/include/io.h +9 -0
package/extension/libherb/include/json.h +28 -0
package/extension/libherb/include/lexer.h +13 -0
package/extension/libherb/include/lexer_peek_helpers.h +23 -0
package/extension/libherb/include/lexer_struct.h +32 -0
package/extension/libherb/include/location.h +25 -0
package/extension/libherb/include/macros.h +10 -0
package/extension/libherb/include/memory.h +12 -0
package/extension/libherb/include/parser.h +22 -0
package/extension/libherb/include/parser_helpers.h +33 -0
package/extension/libherb/include/position.h +22 -0
package/extension/libherb/include/pretty_print.h +53 -0
package/extension/libherb/include/prism_helpers.h +18 -0
package/extension/libherb/include/range.h +23 -0
package/extension/libherb/include/ruby_parser.h +6 -0
package/extension/libherb/include/token.h +25 -0
package/extension/libherb/include/token_matchers.h +21 -0
package/extension/libherb/include/token_struct.h +51 -0
package/extension/libherb/include/util.h +25 -0
package/extension/libherb/include/version.h +6 -0
package/extension/libherb/include/visitor.h +11 -0
package/extension/libherb/io.c +30 -0
package/extension/libherb/json.c +205 -0
package/extension/libherb/lexer.c +284 -0
package/extension/libherb/lexer_peek_helpers.c +59 -0
package/extension/libherb/location.c +41 -0
package/extension/libherb/main.c +162 -0
package/extension/libherb/memory.c +53 -0
package/extension/libherb/parser.c +704 -0
package/extension/libherb/parser_helpers.c +161 -0
package/extension/libherb/position.c +33 -0
package/extension/libherb/pretty_print.c +242 -0
package/extension/libherb/prism_helpers.c +50 -0
package/extension/libherb/range.c +38 -0
package/extension/libherb/ruby_parser.c +47 -0
package/extension/libherb/token.c +194 -0
package/extension/libherb/token_matchers.c +32 -0
package/extension/libherb/util.c +128 -0
package/extension/libherb/visitor.c +321 -0
package/extension/nodes.cpp +1060 -0
package/extension/nodes.h +44 -0
package/extension/prism/include/prism/ast.h +7964 -0
package/extension/prism/include/prism/defines.h +260 -0
package/extension/prism/include/prism/diagnostic.h +451 -0
package/extension/prism/include/prism/encoding.h +283 -0
package/extension/prism/include/prism/node.h +129 -0
package/extension/prism/include/prism/options.h +442 -0
package/extension/prism/include/prism/pack.h +163 -0
package/extension/prism/include/prism/parser.h +933 -0
package/extension/prism/include/prism/prettyprint.h +34 -0
package/extension/prism/include/prism/regexp.h +43 -0
package/extension/prism/include/prism/static_literals.h +121 -0
package/extension/prism/include/prism/util/pm_buffer.h +228 -0
package/extension/prism/include/prism/util/pm_char.h +204 -0
package/extension/prism/include/prism/util/pm_constant_pool.h +218 -0
package/extension/prism/include/prism/util/pm_integer.h +126 -0
package/extension/prism/include/prism/util/pm_list.h +97 -0
package/extension/prism/include/prism/util/pm_memchr.h +29 -0
package/extension/prism/include/prism/util/pm_newline_list.h +113 -0
package/extension/prism/include/prism/util/pm_string.h +190 -0
package/extension/prism/include/prism/util/pm_strncasecmp.h +32 -0
package/extension/prism/include/prism/util/pm_strpbrk.h +46 -0
package/extension/prism/include/prism/version.h +29 -0
package/extension/prism/include/prism.h +383 -0
package/extension/prism/src/diagnostic.c +842 -0
package/extension/prism/src/encoding.c +5235 -0
package/extension/prism/src/node.c +8674 -0
package/extension/prism/src/options.c +328 -0
package/extension/prism/src/pack.c +509 -0
package/extension/prism/src/prettyprint.c +8939 -0
package/extension/prism/src/prism.c +23184 -0
package/extension/prism/src/regexp.c +790 -0
package/extension/prism/src/serialize.c +2266 -0
package/extension/prism/src/static_literals.c +617 -0
package/extension/prism/src/token_type.c +701 -0
package/extension/prism/src/util/pm_buffer.c +357 -0
package/extension/prism/src/util/pm_char.c +318 -0
package/extension/prism/src/util/pm_constant_pool.c +342 -0
package/extension/prism/src/util/pm_integer.c +670 -0
package/extension/prism/src/util/pm_list.c +49 -0
package/extension/prism/src/util/pm_memchr.c +35 -0
package/extension/prism/src/util/pm_newline_list.c +125 -0
package/extension/prism/src/util/pm_string.c +383 -0
package/extension/prism/src/util/pm_strncasecmp.c +36 -0
package/extension/prism/src/util/pm_strpbrk.c +206 -0
package/package.json +74 -0
package/src/index-cjs.cts +22 -0
package/src/index-esm.mts +28 -0
package/src/node-backend.ts +9 -0
package/src/types/global.d.ts +18 -0
package/src/util.ts +35 -0

package/extension/prism/src/util/pm_strpbrk.c ADDED Viewed

@@ -0,0 +1,206 @@
+#include "prism/util/pm_strpbrk.h"
+/**
+ * Add an invalid multibyte character error to the parser.
+ */
+static inline void
+pm_strpbrk_invalid_multibyte_character(pm_parser_t *parser, const uint8_t *start, const uint8_t *end) {
+    pm_diagnostic_list_append_format(&parser->error_list, start, end, PM_ERR_INVALID_MULTIBYTE_CHARACTER, *start);
+}
+/**
+ * Set the explicit encoding for the parser to the current encoding.
+ */
+static inline void
+pm_strpbrk_explicit_encoding_set(pm_parser_t *parser, const uint8_t *source, size_t width) {
+    if (parser->explicit_encoding != NULL) {
+        if (parser->explicit_encoding == parser->encoding) {
+            // Okay, we already locked to this encoding.
+        } else if (parser->explicit_encoding == PM_ENCODING_UTF_8_ENTRY) {
+            // Not okay, we already found a Unicode escape sequence and this
+            // conflicts.
+            pm_diagnostic_list_append_format(&parser->error_list, source, source + width, PM_ERR_MIXED_ENCODING, parser->encoding->name);
+        } else {
+            // Should not be anything else.
+            assert(false && "unreachable");
+        }
+    }
+    parser->explicit_encoding = parser->encoding;
+}
+/**
+ * This is the default path.
+ */
+static inline const uint8_t *
+pm_strpbrk_utf8(pm_parser_t *parser, const uint8_t *source, const uint8_t *charset, size_t maximum, bool validate) {
+    size_t index = 0;
+    while (index < maximum) {
+        if (strchr((const char *) charset, source[index]) != NULL) {
+            return source + index;
+        }
+        if (source[index] < 0x80) {
+            index++;
+        } else {
+            size_t width = pm_encoding_utf_8_char_width(source + index, (ptrdiff_t) (maximum - index));
+            if (width > 0) {
+                index += width;
+            } else if (!validate) {
+                index++;
+            } else {
+                // At this point we know we have an invalid multibyte character.
+                // We'll walk forward as far as we can until we find the next
+                // valid character so that we don't spam the user with a ton of
+                // the same kind of error.
+                const size_t start = index;
+                do {
+                    index++;
+                } while (index < maximum && pm_encoding_utf_8_char_width(source + index, (ptrdiff_t) (maximum - index)) == 0);
+                pm_strpbrk_invalid_multibyte_character(parser, source + start, source + index);
+            }
+        }
+    }
+    return NULL;
+}
+/**
+ * This is the path when the encoding is ASCII-8BIT.
+ */
+static inline const uint8_t *
+pm_strpbrk_ascii_8bit(pm_parser_t *parser, const uint8_t *source, const uint8_t *charset, size_t maximum, bool validate) {
+    size_t index = 0;
+    while (index < maximum) {
+        if (strchr((const char *) charset, source[index]) != NULL) {
+            return source + index;
+        }
+        if (validate && source[index] >= 0x80) pm_strpbrk_explicit_encoding_set(parser, source, 1);
+        index++;
+    }
+    return NULL;
+}
+/**
+ * This is the slow path that does care about the encoding.
+ */
+static inline const uint8_t *
+pm_strpbrk_multi_byte(pm_parser_t *parser, const uint8_t *source, const uint8_t *charset, size_t maximum, bool validate) {
+    size_t index = 0;
+    const pm_encoding_t *encoding = parser->encoding;
+    while (index < maximum) {
+        if (strchr((const char *) charset, source[index]) != NULL) {
+            return source + index;
+        }
+        if (source[index] < 0x80) {
+            index++;
+        } else {
+            size_t width = encoding->char_width(source + index, (ptrdiff_t) (maximum - index));
+            if (validate) pm_strpbrk_explicit_encoding_set(parser, source, width);
+            if (width > 0) {
+                index += width;
+            } else if (!validate) {
+                index++;
+            } else {
+                // At this point we know we have an invalid multibyte character.
+                // We'll walk forward as far as we can until we find the next
+                // valid character so that we don't spam the user with a ton of
+                // the same kind of error.
+                const size_t start = index;
+                do {
+                    index++;
+                } while (index < maximum && encoding->char_width(source + index, (ptrdiff_t) (maximum - index)) == 0);
+                pm_strpbrk_invalid_multibyte_character(parser, source + start, source + index);
+            }
+        }
+    }
+    return NULL;
+}
+/**
+ * This is the fast path that does not care about the encoding because we know
+ * the encoding only supports single-byte characters.
+ */
+static inline const uint8_t *
+pm_strpbrk_single_byte(pm_parser_t *parser, const uint8_t *source, const uint8_t *charset, size_t maximum, bool validate) {
+    size_t index = 0;
+    const pm_encoding_t *encoding = parser->encoding;
+    while (index < maximum) {
+        if (strchr((const char *) charset, source[index]) != NULL) {
+            return source + index;
+        }
+        if (source[index] < 0x80 || !validate) {
+            index++;
+        } else {
+            size_t width = encoding->char_width(source + index, (ptrdiff_t) (maximum - index));
+            pm_strpbrk_explicit_encoding_set(parser, source, width);
+            if (width > 0) {
+                index += width;
+            } else {
+                // At this point we know we have an invalid multibyte character.
+                // We'll walk forward as far as we can until we find the next
+                // valid character so that we don't spam the user with a ton of
+                // the same kind of error.
+                const size_t start = index;
+                do {
+                    index++;
+                } while (index < maximum && encoding->char_width(source + index, (ptrdiff_t) (maximum - index)) == 0);
+                pm_strpbrk_invalid_multibyte_character(parser, source + start, source + index);
+            }
+        }
+    }
+    return NULL;
+}
+/**
+ * Here we have rolled our own version of strpbrk. The standard library strpbrk
+ * has undefined behavior when the source string is not null-terminated. We want
+ * to support strings that are not null-terminated because pm_parse does not
+ * have the contract that the string is null-terminated. (This is desirable
+ * because it means the extension can call pm_parse with the result of a call to
+ * mmap).
+ *
+ * The standard library strpbrk also does not support passing a maximum length
+ * to search. We want to support this for the reason mentioned above, but we
+ * also don't want it to stop on null bytes. Ruby actually allows null bytes
+ * within strings, comments, regular expressions, etc. So we need to be able to
+ * skip past them.
+ *
+ * Finally, we want to support encodings wherein the charset could contain
+ * characters that are trailing bytes of multi-byte characters. For example, in
+ * Shift_JIS, the backslash character can be a trailing byte. In that case we
+ * need to take a slower path and iterate one multi-byte character at a time.
+ */
+const uint8_t *
+pm_strpbrk(pm_parser_t *parser, const uint8_t *source, const uint8_t *charset, ptrdiff_t length, bool validate) {
+    if (length <= 0) {
+        return NULL;
+    } else if (!parser->encoding_changed) {
+        return pm_strpbrk_utf8(parser, source, charset, (size_t) length, validate);
+    } else if (parser->encoding == PM_ENCODING_ASCII_8BIT_ENTRY) {
+        return pm_strpbrk_ascii_8bit(parser, source, charset, (size_t) length, validate);
+    } else if (parser->encoding->multibyte) {
+        return pm_strpbrk_multi_byte(parser, source, charset, (size_t) length, validate);
+    } else {
+        return pm_strpbrk_single_byte(parser, source, charset, (size_t) length, validate);
+    }
+}

package/package.json ADDED Viewed

@@ -0,0 +1,74 @@
+{
+  "name": "@herb-tools/node",
+  "version": "0.1.0",
+  "type": "module",
+  "license": "MIT",
+  "homepage": "https://herb-tools.dev",
+  "bugs": "https://github.com/marcoroth/herb/issues/new?title=Package%20%60@herb-tools/node%60:%20",
+  "repository": {
+    "type": "git",
+    "url": "https://github.com/marcoroth/herb.git",
+    "directory": "javascript/packages/node"
+  },
+  "gypfile": true,
+  "main": "./dist/herb-node.cjs",
+  "module": "./dist/herb-node.esm.js",
+  "types": "./dist/types/index-esm.d.mts",
+  "exports": {
+    "./package.json": "./package.json",
+    ".": {
+      "types": "./dist/types/index-esm.d.mts",
+      "import": "./dist/herb-node.esm.js",
+      "require": "./dist/herb-node.cjs",
+      "default": "./dist/herb-node.esm.js"
+    }
+  },
+  "scripts": {
+    "install": "yarn vendor:libherb && yarn vendor:prism && node-pre-gyp install --fallback-to-build",
+    "dev": "rollup -c -w",
+    "build": "yarn rebuild",
+    "build:javascript": "rollup -c",
+    "vendor:libherb": "yarn clean && rake templates && cp -r ../../../src ./extension/libherb",
+    "vendor:prism": "node ./bin/vendor-prism.cjs",
+    "rebuild": "yarn clean && yarn vendor:libherb && yarn vendor:prism && node-pre-gyp rebuild && yarn build:javascript",
+    "configure": "node-pre-gyp configure",
+    "package": "node-pre-gyp package",
+    "clean": "node-pre-gyp clean && rimraf dist/ && rimraf extension/libherb/ && rimraf build/",
+    "test": "vitest run",
+    "test:watch": "vitest --watch",
+    "prepublishOnly": "yarn clean && yarn build && yarn test"
+  },
+  "binary": {
+    "module_name": "herb",
+    "module_path": "./build/{configuration}/{node_abi}-{platform}-{arch}/",
+    "remote_path": "{version}",
+    "package_name": "{module_name}-v{version}-{node_abi}-{platform}-{arch}.tar.gz",
+    "host": "https://github.com/marcoroth/herb/releases/download/"
+  },
+  "dependencies": {
+    "@herb-tools/core": "0.1.0",
+    "@mapbox/node-pre-gyp": "^2.0.0"
+  },
+  "devDependencies": {
+    "@rollup/plugin-json": "^6.1.0",
+    "@rollup/plugin-node-resolve": "^16.0.1",
+    "@rollup/plugin-typescript": "^12.1.2",
+    "node-addon-api": "^5.1.0",
+    "node-pre-gyp-github": "^2.0.0",
+    "rimraf": "^6.0.1",
+    "rollup": "^4.35.0",
+    "tslib": "^2.8.1",
+    "typescript": "^5.8.2",
+    "vitest": "^3.0.0"
+  },
+  "files": [
+    "package.json",
+    "README.md",
+    "binding.gyp",
+    "dist/",
+    "src/",
+    "extension/**/*.c",
+    "extension/**/*.cpp",
+    "extension/**/*.h"
+  ]
+}

package/src/index-cjs.cts ADDED Viewed

@@ -0,0 +1,22 @@
+const path = require("path")
+const binary = require("@mapbox/node-pre-gyp")
+const { Visitor } = require("@herb-tools/core")
+const { HerbBackendNode } = require("./node-backend.js")
+const packagePath = path.resolve(__dirname, "../package.json")
+const libherbPath = binary.find(packagePath)
+const libHerbBinary = require(libherbPath)
+/**
+ * An instance of the `Herb` class using a Node.js backend.
+ * This loads `libherb` in a Node.js C++ native extension.
+ */
+const Herb = new HerbBackendNode(
+  new Promise((resolve, _reject) => resolve(libHerbBinary)),
+)
+module.exports = {
+  Herb: Herb,
+  Visitor: Visitor,
+}

package/src/index-esm.mts ADDED Viewed

@@ -0,0 +1,28 @@
+export * from "@herb-tools/core"
+import path from "path"
+import binary from "@mapbox/node-pre-gyp"
+import { createRequire } from "module"
+import { fileURLToPath } from "url"
+const __filename = fileURLToPath(import.meta.url)
+const __dirname = path.dirname(__filename)
+const require = createRequire(import.meta.url)
+const packagePath = path.resolve(__dirname, "../package.json")
+const libherbPath = binary.find(packagePath)
+const libHerbBinary = require(libherbPath)
+import { HerbBackendNode } from "./node-backend.js"
+/**
+ * An instance of the `Herb` class using a Node.js backend.
+ * This loads `libherb` in a Node.js C++ native extension.
+ */
+const Herb = new HerbBackendNode(
+  () => new Promise((resolve, _reject) => resolve(libHerbBinary)),
+)
+export { Herb, HerbBackendNode }

package/src/node-backend.ts ADDED Viewed

@@ -0,0 +1,9 @@
+import packageJSON from "../package.json" with { type: "json" }
+import { HerbBackend } from "@herb-tools/core"
+export class HerbBackendNode extends HerbBackend {
+  backendVersion(): string {
+    return `${packageJSON.name}@${packageJSON.version}`
+  }
+}

package/src/types/global.d.ts ADDED Viewed

@@ -0,0 +1,18 @@
+declare module "*.node" {
+  const content: any
+  export default content
+}
+declare module "@mapbox/node-pre-gyp" {
+  export interface FindOptions {
+    module_root?: string
+    [key: string]: any
+  }
+  export interface NodePreGyp {
+    find(packageJsonPath: string, opts?: FindOptions): string
+  }
+  declare const nodePreGyp: NodePreGyp
+  export default nodePreGyp
+}

package/src/util.ts ADDED Viewed

@@ -0,0 +1,35 @@
+import path from "path"
+import { stat as fileExists } from "node:fs/promises"
+import { ensureString } from "@herb-tools/core"
+export async function ensureFile(object: any): Promise<string> {
+  const string = ensureString(object)
+  if (await fileExists(string)) {
+    return string
+  }
+  throw new TypeError("Argument must be a string")
+}
+export function resolvePath(relativePath: string) {
+  let basePath
+  // Check if we"re in ESM or CJS context
+  if (typeof __dirname !== "undefined") {
+    // CommonJS environment
+    basePath = __dirname
+  } else {
+    // ESM environment - need to use import.meta.url
+    // This needs to be in a try/catch for bundlers and environments that don"t support it
+    try {
+      const { fileURLToPath } = require("url")
+      const currentFileUrl = import.meta.url
+      basePath = path.dirname(fileURLToPath(currentFileUrl))
+    } catch (error) {
+      // Fallback for environments where neither is available
+      basePath = process.cwd()
+    }
+  }
+  return path.join(basePath, relativePath)
+}