npm - bluera-knowledge - Versions diffs - 0.33.1 → 0.33.2 - Mend

bluera-knowledge 0.33.1 → 0.33.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16)

package/dist/{chunk-KDZDLJUY.js → chunk-OMXQBWCR.js} +21 -139
package/dist/chunk-OMXQBWCR.js.map +1 -0
package/dist/{chunk-YDTTD53Y.js → chunk-OPLZTNKK.js} +2 -2
package/dist/{chunk-3TB7TDVF.js → chunk-SROFPHRA.js} +1 -2
package/dist/chunk-SROFPHRA.js.map +1 -0
package/dist/index.js +18 -23
package/dist/index.js.map +1 -1
package/dist/mcp/server.js +2 -2
package/dist/workers/background-worker-cli.js +5 -8
package/dist/workers/background-worker-cli.js.map +1 -1
package/package.json +1 -1
package/scripts/validate-local.sh +0 -16
package/skills/crawl/SKILL.md +1 -7
package/dist/chunk-3TB7TDVF.js.map +0 -1
package/dist/chunk-KDZDLJUY.js.map +0 -1
package/dist/{chunk-YDTTD53Y.js.map → chunk-OPLZTNKK.js.map} +0 -0

package/dist/index.js CHANGED

@@ -3,11 +3,11 @@ import {
   ZilAdapter,
   runMCPServer,
   spawnBackgroundWorker
-} from "./chunk-YDTTD53Y.js";
+} from "./chunk-OPLZTNKK.js";
 import {
   IntelligentCrawler,
   getCrawlStrategy
-} from "./chunk-KDZDLJUY.js";
+} from "./chunk-OMXQBWCR.js";
 import {
   ASTParser,
   AdapterRegistry,
@@ -25,7 +25,7 @@ import {
   isRepoStoreDefinition,
   isWebStoreDefinition,
   ok
-} from "./chunk-3TB7TDVF.js";
+} from "./chunk-SROFPHRA.js";
 import {
   createDocumentId
 } from "./chunk-CLIMKLTW.js";
@@ -46,7 +46,7 @@ function createCrawlCommand(getOptions) {
   ).option(
     "--extract <instruction>",
     'Natural language instruction for what to extract (e.g., "extract API references")'
-  ).option("--simple", "Use simple BFS mode instead of intelligent crawling").option("--max-pages <number>", "Maximum number of pages to crawl", "50").option("--fast", "Use fast axios-only mode (may fail on JavaScript-heavy sites)").allowUnknownOption().action(
+  ).option("--max-pages <number>", "Maximum number of pages to crawl", "50").option("--fast", "Use fast axios-only mode (may fail on JavaScript-heavy sites)").allowUnknownOption().action(
     async (url, storeIdOrName, cmdOptions) => {
       const storeArg = process.argv.find((arg) => arg.startsWith("--store"));
       if (storeArg !== void 0) {
@@ -65,19 +65,16 @@ Example: bluera-knowledge crawl https://docs.example.com my-docs
       }
       const globalOpts = getOptions();
       const useHeadless = !(cmdOptions.fast ?? false);
-      let preComputedStrategy;
-      const useIntelligentMode = cmdOptions.simple !== true && cmdOptions.crawl !== void 0 && cmdOptions.crawl !== "";
-      if (useIntelligentMode && cmdOptions.crawl !== void 0) {
-        if (globalOpts.quiet !== true && globalOpts.format !== "json") {
-          console.log(`Crawling ${url}`);
-          console.log("Analyzing page structure with Claude...");
-        }
-        preComputedStrategy = await getCrawlStrategy(url, cmdOptions.crawl, useHeadless);
-        if (globalOpts.quiet !== true && globalOpts.format !== "json") {
-          console.log(
-            `Claude identified ${String(preComputedStrategy.urls.length)} URLs: ${preComputedStrategy.reasoning}`
-          );
-        }
+      const crawlInstruction = cmdOptions.crawl ?? "crawl all pages linked from this URL";
+      if (globalOpts.quiet !== true && globalOpts.format !== "json") {
+        console.log(`Crawling ${url}`);
+        console.log("Analyzing page structure with Claude...");
+      }
+      const preComputedStrategy = await getCrawlStrategy(url, crawlInstruction, useHeadless);
+      if (globalOpts.quiet !== true && globalOpts.format !== "json") {
+        console.log(
+          `Claude identified ${String(preComputedStrategy.urls.length)} URLs: ${preComputedStrategy.reasoning}`
+        );
       }
       const services = await createServices(
         globalOpts.config,
@@ -123,8 +120,7 @@ Example: bluera-knowledge crawl https://docs.example.com my-docs
       const isInteractive = process.stdout.isTTY && globalOpts.quiet !== true && globalOpts.format !== "json";
       let spinner;
       if (isInteractive) {
-        const mode = cmdOptions.simple === true ? "simple" : "intelligent";
-        spinner = ora(`Crawling ${url} (${mode} mode)`).start();
+        spinner = ora(`Crawling ${url} (intelligent mode)`).start();
       } else if (globalOpts.quiet !== true && globalOpts.format !== "json") {
         console.log(`Crawling ${url}`);
       }
@@ -154,12 +150,11 @@ Example: bluera-knowledge crawl https://docs.example.com my-docs
         await services.lance.initialize(store.id);
         const docs = [];
         for await (const result of crawler.crawl(url, {
-          ...cmdOptions.crawl !== void 0 && { crawlInstruction: cmdOptions.crawl },
+          crawlInstruction,
           ...cmdOptions.extract !== void 0 && { extractInstruction: cmdOptions.extract },
           maxPages,
-          ...cmdOptions.simple !== void 0 && { simple: cmdOptions.simple },
           useHeadless,
-          ...preComputedStrategy !== void 0 && { preComputedStrategy }
+          preComputedStrategy
         })) {
           const contentToProcess = result.extracted ?? result.markdown;
           const chunks = webChunker.chunk(contentToProcess, `${result.url}.md`);
@@ -205,7 +200,7 @@ Example: bluera-knowledge crawl https://docs.example.com my-docs
           url,
           pagesCrawled: pagesIndexed,
           chunksCreated,
-          mode: cmdOptions.simple === true ? "simple" : "intelligent",
+          mode: "intelligent",
           hadCrawlInstruction: cmdOptions.crawl !== void 0,
           hadExtractInstruction: cmdOptions.extract !== void 0
         };