npm - @apmantza/greedysearch-pi - Versions diffs - 1.8.2 → 1.8.4 - Mend

@apmantza/greedysearch-pi 1.8.2 → 1.8.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (27)

package/CHANGELOG.md +17 -0
package/README.md +10 -1
package/bin/launch.mjs +366 -366
package/bin/search.mjs +388 -388
package/extractors/common.mjs +291 -291
package/extractors/gemini.mjs +146 -146
package/extractors/google-ai.mjs +125 -125
package/extractors/perplexity.mjs +147 -145
package/extractors/selectors.mjs +54 -54
package/index.ts +256 -278
package/package.json +1 -1
package/src/github.mjs +237 -237
package/src/reddit.mjs +210 -0
package/src/search/chrome.mjs +222 -222
package/src/search/constants.mjs +37 -37
package/src/search/defaults.mjs +14 -14
package/src/search/engines.mjs +62 -62
package/src/search/fetch-source.mjs +35 -3
package/src/search/output.mjs +58 -58
package/src/search/sources.mjs +445 -445
package/src/search/synthesis-runner.mjs +63 -63
package/src/search/synthesis.mjs +223 -223
package/src/tools/deep-research-handler.ts +36 -36
package/src/tools/greedy-search-handler.ts +53 -57
package/src/tools/shared.ts +135 -130
package/src/types.ts +103 -103
package/test.mjs +423 -377

package/src/search/fetch-source.mjs CHANGED

@@ -8,9 +8,9 @@ import { tmpdir } from "node:os";
 import { join } from "node:path";
 import { fetchSourceHttp, shouldUseBrowser } from "../fetcher.mjs";
 import { fetchGitHubContent, parseGitHubUrl } from "../github.mjs";
+import { fetchRedditContent, parseRedditUrl } from "../reddit.mjs";
 import { trimContentHeadTail } from "../utils/content.mjs";
-import { cdp } from "./chrome.mjs";
-import { openNewTab, closeTab, closeTabs } from "./chrome.mjs";
+import { cdp, closeTab, closeTabs, openNewTab } from "./chrome.mjs";
 import { SOURCE_FETCH_CONCURRENCY } from "./constants.mjs";
 import { trimText } from "./sources.mjs";
@@ -50,6 +50,38 @@ export async function fetchSourceContent(url, maxChars = 8000) {
 		}
 	}
+	// Check if it's a Reddit URL (posts and comments)
+	const redditInfo = parseRedditUrl(url);
+	if (redditInfo?.type === "post") {
+		process.stderr.write(
+			`[greedysearch] Using Reddit JSON API for: ${url.slice(0, 60)}...\n`,
+		);
+		const redditResult = await fetchRedditContent(url, maxChars);
+		if (redditResult.ok) {
+			const content = trimContentHeadTail(redditResult.markdown, maxChars);
+			return {
+				url,
+				finalUrl: redditResult.finalUrl,
+				status: redditResult.status,
+				contentType: "text/markdown",
+				lastModified: redditResult.lastModified || "",
+				publishedTime: redditResult.publishedTime || "",
+				byline: redditResult.byline || "",
+				siteName: redditResult.siteName || "",
+				lang: redditResult.lang || "",
+				title: redditResult.title,
+				snippet: redditResult.excerpt,
+				content,
+				contentChars: content.length,
+				source: "reddit-api",
+				duration: Date.now() - start,
+			};
+		}
+		process.stderr.write(
+			`[greedysearch] Reddit API fetch failed, falling back to HTTP: ${redditResult.error}\n`,
+		);
+	}
 	// Try HTTP first
 	const httpResult = await fetchSourceHttp(url, { timeoutMs: 15000 });
@@ -227,4 +259,4 @@ export async function fetchTopSource(url) {
 	} finally {
 		await closeTab(tab);
 	}
-}
+}

package/src/search/output.mjs CHANGED

@@ -1,59 +1,59 @@
-// src/search/output.mjs — Output serialization for search results
-//
-// Extracted from search.mjs.
-import { existsSync, mkdirSync, writeFileSync } from "node:fs";
-import { join } from "node:path";
-import { tmpdir } from "node:os";
-const __dir = import.meta.dirname || new URL(".", import.meta.url).pathname.replace(/^\/([A-Z]:)/, "$1");
-export function slugify(query) {
-	return query
-		.toLowerCase()
-		.replace(/[^a-z0-9]+/g, "-")
-		.replace(/^-|-$/g, "")
-		.slice(0, 60);
-}
-export function resultsDir() {
-	const dir = join(__dir, "..", "..", "results");
-	mkdirSync(dir, { recursive: true });
-	return dir;
-}
-export function writeOutput(
-	data,
-	outFile,
-	{ inline = false, synthesize = false, query = "" } = {},
-) {
-	const json = `${JSON.stringify(data, null, 2)}\n`;
-	if (outFile) {
-		writeFileSync(outFile, json, "utf8");
-		process.stderr.write(`Results written to ${outFile}\n`);
-		return;
-	}
-	if (inline) {
-		process.stdout.write(json);
-		return;
-	}
-	const ts = new Date()
-		.toISOString()
-		.replace("T", "_")
-		.replace(/[:.]/g, "-")
-		.slice(0, 19);
-	const slug = slugify(query);
-	const base = join(resultsDir(), `${ts}_${slug}`);
-	writeFileSync(`${base}.json`, json, "utf8");
-	if (synthesize && data._synthesis?.answer) {
-		writeFileSync(`${base}-synthesis.md`, data._synthesis.answer, "utf8");
-		process.stdout.write(`${base}-synthesis.md\n`);
-	} else {
-		process.stdout.write(`${base}.json\n`);
-	}
+// src/search/output.mjs — Output serialization for search results
+//
+// Extracted from search.mjs.
+import { existsSync, mkdirSync, writeFileSync } from "node:fs";
+import { join } from "node:path";
+import { tmpdir } from "node:os";
+const __dir = import.meta.dirname || new URL(".", import.meta.url).pathname.replace(/^\/([A-Z]:)/, "$1");
+export function slugify(query) {
+	return query
+		.toLowerCase()
+		.replace(/[^a-z0-9]+/g, "-")
+		.replace(/^-|-$/g, "")
+		.slice(0, 60);
+}
+export function resultsDir() {
+	const dir = join(__dir, "..", "..", "results");
+	mkdirSync(dir, { recursive: true });
+	return dir;
+}
+export function writeOutput(
+	data,
+	outFile,
+	{ inline = false, synthesize = false, query = "" } = {},
+) {
+	const json = `${JSON.stringify(data, null, 2)}\n`;
+	if (outFile) {
+		writeFileSync(outFile, json, "utf8");
+		process.stderr.write(`Results written to ${outFile}\n`);
+		return;
+	}
+	if (inline) {
+		process.stdout.write(json);
+		return;
+	}
+	const ts = new Date()
+		.toISOString()
+		.replace("T", "_")
+		.replace(/[:.]/g, "-")
+		.slice(0, 19);
+	const slug = slugify(query);
+	const base = join(resultsDir(), `${ts}_${slug}`);
+	writeFileSync(`${base}.json`, json, "utf8");
+	if (synthesize && data._synthesis?.answer) {
+		writeFileSync(`${base}-synthesis.md`, data._synthesis.answer, "utf8");
+		process.stdout.write(`${base}-synthesis.md\n`);
+	} else {
+		process.stdout.write(`${base}.json\n`);
+	}
 }