@staticn0va/wigolo 0.3.1 → 0.5.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +57 -2
- package/SKILL.md +196 -0
- package/dist/agent/executor.d.ts +13 -0
- package/dist/agent/executor.d.ts.map +1 -0
- package/dist/agent/executor.js +128 -0
- package/dist/agent/executor.js.map +1 -0
- package/dist/agent/pipeline.d.ts +5 -0
- package/dist/agent/pipeline.d.ts.map +1 -0
- package/dist/agent/pipeline.js +198 -0
- package/dist/agent/pipeline.js.map +1 -0
- package/dist/agent/planner.d.ts +9 -0
- package/dist/agent/planner.d.ts.map +1 -0
- package/dist/agent/planner.js +190 -0
- package/dist/agent/planner.js.map +1 -0
- package/dist/cache/change-detector.d.ts +7 -0
- package/dist/cache/change-detector.d.ts.map +1 -0
- package/dist/cache/change-detector.js +43 -0
- package/dist/cache/change-detector.js.map +1 -0
- package/dist/cache/db.d.ts.map +1 -1
- package/dist/cache/db.js +32 -0
- package/dist/cache/db.js.map +1 -1
- package/dist/cache/diff-summary.d.ts +2 -0
- package/dist/cache/diff-summary.d.ts.map +1 -0
- package/dist/cache/diff-summary.js +87 -0
- package/dist/cache/diff-summary.js.map +1 -0
- package/dist/cache/store.d.ts +16 -0
- package/dist/cache/store.d.ts.map +1 -1
- package/dist/cache/store.js +79 -0
- package/dist/cache/store.js.map +1 -1
- package/dist/cli/auth.d.ts +2 -0
- package/dist/cli/auth.d.ts.map +1 -0
- package/dist/cli/auth.js +95 -0
- package/dist/cli/auth.js.map +1 -0
- package/dist/cli/daemon.d.ts +6 -1
- package/dist/cli/daemon.d.ts.map +1 -1
- package/dist/cli/daemon.js +56 -3
- package/dist/cli/daemon.js.map +1 -1
- package/dist/cli/health.d.ts +1 -1
- package/dist/cli/health.d.ts.map +1 -1
- package/dist/cli/health.js +41 -3
- package/dist/cli/health.js.map +1 -1
- package/dist/cli/index.d.ts +1 -1
- package/dist/cli/index.d.ts.map +1 -1
- package/dist/cli/index.js +1 -1
- package/dist/cli/index.js.map +1 -1
- package/dist/cli/plugin.d.ts +5 -0
- package/dist/cli/plugin.d.ts.map +1 -0
- package/dist/cli/plugin.js +188 -0
- package/dist/cli/plugin.js.map +1 -0
- package/dist/cli/shell.d.ts +2 -0
- package/dist/cli/shell.d.ts.map +1 -0
- package/dist/cli/shell.js +86 -0
- package/dist/cli/shell.js.map +1 -0
- package/dist/cli/warmup.d.ts +8 -0
- package/dist/cli/warmup.d.ts.map +1 -1
- package/dist/cli/warmup.js +106 -1
- package/dist/cli/warmup.js.map +1 -1
- package/dist/config.d.ts +15 -0
- package/dist/config.d.ts.map +1 -1
- package/dist/config.js +23 -0
- package/dist/config.js.map +1 -1
- package/dist/daemon/health-check.d.ts +16 -0
- package/dist/daemon/health-check.d.ts.map +1 -0
- package/dist/daemon/health-check.js +36 -0
- package/dist/daemon/health-check.js.map +1 -0
- package/dist/daemon/http-server.d.ts +26 -0
- package/dist/daemon/http-server.d.ts.map +1 -0
- package/dist/daemon/http-server.js +282 -0
- package/dist/daemon/http-server.js.map +1 -0
- package/dist/daemon/proxy.d.ts +10 -0
- package/dist/daemon/proxy.d.ts.map +1 -0
- package/dist/daemon/proxy.js +99 -0
- package/dist/daemon/proxy.js.map +1 -0
- package/dist/embedding/embed.d.ts +19 -0
- package/dist/embedding/embed.d.ts.map +1 -0
- package/dist/embedding/embed.js +131 -0
- package/dist/embedding/embed.js.map +1 -0
- package/dist/embedding/key-terms.d.ts +12 -0
- package/dist/embedding/key-terms.d.ts.map +1 -0
- package/dist/embedding/key-terms.js +138 -0
- package/dist/embedding/key-terms.js.map +1 -0
- package/dist/embedding/subprocess.d.ts +31 -0
- package/dist/embedding/subprocess.d.ts.map +1 -0
- package/dist/embedding/subprocess.js +213 -0
- package/dist/embedding/subprocess.js.map +1 -0
- package/dist/embedding/vector-index.d.ts +26 -0
- package/dist/embedding/vector-index.d.ts.map +1 -0
- package/dist/embedding/vector-index.js +78 -0
- package/dist/embedding/vector-index.js.map +1 -0
- package/dist/fetch/action-executor.d.ts +28 -0
- package/dist/fetch/action-executor.d.ts.map +1 -0
- package/dist/fetch/action-executor.js +86 -0
- package/dist/fetch/action-executor.js.map +1 -0
- package/dist/fetch/auth.d.ts +2 -1
- package/dist/fetch/auth.d.ts.map +1 -1
- package/dist/fetch/auth.js +30 -2
- package/dist/fetch/auth.js.map +1 -1
- package/dist/fetch/browser-pool.d.ts +30 -11
- package/dist/fetch/browser-pool.d.ts.map +1 -1
- package/dist/fetch/browser-pool.js +228 -51
- package/dist/fetch/browser-pool.js.map +1 -1
- package/dist/fetch/browser-selector.d.ts +17 -0
- package/dist/fetch/browser-selector.d.ts.map +1 -0
- package/dist/fetch/browser-selector.js +70 -0
- package/dist/fetch/browser-selector.js.map +1 -0
- package/dist/fetch/browser-types.d.ts +3 -0
- package/dist/fetch/browser-types.d.ts.map +1 -0
- package/dist/fetch/browser-types.js +45 -0
- package/dist/fetch/browser-types.js.map +1 -0
- package/dist/fetch/cdp-client.d.ts +9 -0
- package/dist/fetch/cdp-client.d.ts.map +1 -0
- package/dist/fetch/cdp-client.js +90 -0
- package/dist/fetch/cdp-client.js.map +1 -0
- package/dist/fetch/lightpanda.d.ts +28 -0
- package/dist/fetch/lightpanda.d.ts.map +1 -0
- package/dist/fetch/lightpanda.js +177 -0
- package/dist/fetch/lightpanda.js.map +1 -0
- package/dist/fetch/router.d.ts +4 -1
- package/dist/fetch/router.d.ts.map +1 -1
- package/dist/fetch/router.js +8 -2
- package/dist/fetch/router.js.map +1 -1
- package/dist/index.js +32 -3
- package/dist/index.js.map +1 -1
- package/dist/instructions.d.ts +29 -0
- package/dist/instructions.d.ts.map +1 -0
- package/dist/instructions.js +176 -0
- package/dist/instructions.js.map +1 -0
- package/dist/logger.d.ts +1 -1
- package/dist/logger.d.ts.map +1 -1
- package/dist/plugins/loader.d.ts +20 -0
- package/dist/plugins/loader.d.ts.map +1 -0
- package/dist/plugins/loader.js +162 -0
- package/dist/plugins/loader.js.map +1 -0
- package/dist/plugins/registry.d.ts +26 -0
- package/dist/plugins/registry.d.ts.map +1 -0
- package/dist/plugins/registry.js +68 -0
- package/dist/plugins/registry.js.map +1 -0
- package/dist/plugins/validate.d.ts +9 -0
- package/dist/plugins/validate.d.ts.map +1 -0
- package/dist/plugins/validate.js +70 -0
- package/dist/plugins/validate.js.map +1 -0
- package/dist/repl/commands/agent.d.ts +5 -0
- package/dist/repl/commands/agent.d.ts.map +1 -0
- package/dist/repl/commands/agent.js +48 -0
- package/dist/repl/commands/agent.js.map +1 -0
- package/dist/repl/commands/cache.d.ts +4 -0
- package/dist/repl/commands/cache.d.ts.map +1 -0
- package/dist/repl/commands/cache.js +44 -0
- package/dist/repl/commands/cache.js.map +1 -0
- package/dist/repl/commands/crawl.d.ts +7 -0
- package/dist/repl/commands/crawl.d.ts.map +1 -0
- package/dist/repl/commands/crawl.js +42 -0
- package/dist/repl/commands/crawl.js.map +1 -0
- package/dist/repl/commands/extract.d.ts +5 -0
- package/dist/repl/commands/extract.d.ts.map +1 -0
- package/dist/repl/commands/extract.js +37 -0
- package/dist/repl/commands/extract.js.map +1 -0
- package/dist/repl/commands/fetch.d.ts +5 -0
- package/dist/repl/commands/fetch.d.ts.map +1 -0
- package/dist/repl/commands/fetch.js +53 -0
- package/dist/repl/commands/fetch.js.map +1 -0
- package/dist/repl/commands/find-similar.d.ts +5 -0
- package/dist/repl/commands/find-similar.d.ts.map +1 -0
- package/dist/repl/commands/find-similar.js +61 -0
- package/dist/repl/commands/find-similar.js.map +1 -0
- package/dist/repl/commands/research.d.ts +5 -0
- package/dist/repl/commands/research.d.ts.map +1 -0
- package/dist/repl/commands/research.js +50 -0
- package/dist/repl/commands/research.js.map +1 -0
- package/dist/repl/commands/search.d.ts +5 -0
- package/dist/repl/commands/search.d.ts.map +1 -0
- package/dist/repl/commands/search.js +62 -0
- package/dist/repl/commands/search.js.map +1 -0
- package/dist/repl/commands/types.d.ts +9 -0
- package/dist/repl/commands/types.d.ts.map +1 -0
- package/dist/repl/commands/types.js +2 -0
- package/dist/repl/commands/types.js.map +1 -0
- package/dist/repl/formatters.d.ts +13 -0
- package/dist/repl/formatters.d.ts.map +1 -0
- package/dist/repl/formatters.js +282 -0
- package/dist/repl/formatters.js.map +1 -0
- package/dist/repl/parser.d.ts +9 -0
- package/dist/repl/parser.d.ts.map +1 -0
- package/dist/repl/parser.js +84 -0
- package/dist/repl/parser.js.map +1 -0
- package/dist/repl/shell.d.ts +8 -0
- package/dist/repl/shell.d.ts.map +1 -0
- package/dist/repl/shell.js +177 -0
- package/dist/repl/shell.js.map +1 -0
- package/dist/research/decompose.d.ts +7 -0
- package/dist/research/decompose.d.ts.map +1 -0
- package/dist/research/decompose.js +195 -0
- package/dist/research/decompose.js.map +1 -0
- package/dist/research/pipeline.d.ts +5 -0
- package/dist/research/pipeline.d.ts.map +1 -0
- package/dist/research/pipeline.js +135 -0
- package/dist/research/pipeline.js.map +1 -0
- package/dist/research/synthesize.d.ts +10 -0
- package/dist/research/synthesize.d.ts.map +1 -0
- package/dist/research/synthesize.js +119 -0
- package/dist/research/synthesize.js.map +1 -0
- package/dist/search/answer-synthesis.d.ts +13 -0
- package/dist/search/answer-synthesis.d.ts.map +1 -0
- package/dist/search/answer-synthesis.js +120 -0
- package/dist/search/answer-synthesis.js.map +1 -0
- package/dist/search/context-formatter.d.ts +3 -0
- package/dist/search/context-formatter.d.ts.map +1 -0
- package/dist/search/context-formatter.js +56 -0
- package/dist/search/context-formatter.js.map +1 -0
- package/dist/search/find-similar.d.ts +5 -0
- package/dist/search/find-similar.d.ts.map +1 -0
- package/dist/search/find-similar.js +329 -0
- package/dist/search/find-similar.js.map +1 -0
- package/dist/search/multi-query.d.ts +22 -0
- package/dist/search/multi-query.d.ts.map +1 -0
- package/dist/search/multi-query.js +157 -0
- package/dist/search/multi-query.js.map +1 -0
- package/dist/search/rrf.d.ts +17 -0
- package/dist/search/rrf.d.ts.map +1 -0
- package/dist/search/rrf.js +48 -0
- package/dist/search/rrf.js.map +1 -0
- package/dist/search/sampling.d.ts +25 -0
- package/dist/search/sampling.d.ts.map +1 -0
- package/dist/search/sampling.js +52 -0
- package/dist/search/sampling.js.map +1 -0
- package/dist/server.d.ts +17 -0
- package/dist/server.d.ts.map +1 -1
- package/dist/server.js +366 -105
- package/dist/server.js.map +1 -1
- package/dist/tools/agent.d.ts +5 -0
- package/dist/tools/agent.d.ts.map +1 -0
- package/dist/tools/agent.js +67 -0
- package/dist/tools/agent.js.map +1 -0
- package/dist/tools/cache.d.ts +2 -1
- package/dist/tools/cache.d.ts.map +1 -1
- package/dist/tools/cache.js +56 -1
- package/dist/tools/cache.js.map +1 -1
- package/dist/tools/fetch.d.ts.map +1 -1
- package/dist/tools/fetch.js +26 -1
- package/dist/tools/fetch.js.map +1 -1
- package/dist/tools/find-similar.d.ts +5 -0
- package/dist/tools/find-similar.d.ts.map +1 -0
- package/dist/tools/find-similar.js +48 -0
- package/dist/tools/find-similar.js.map +1 -0
- package/dist/tools/research.d.ts +5 -0
- package/dist/tools/research.d.ts.map +1 -0
- package/dist/tools/research.js +50 -0
- package/dist/tools/research.js.map +1 -0
- package/dist/tools/search.d.ts +2 -1
- package/dist/tools/search.d.ts.map +1 -1
- package/dist/tools/search.js +179 -13
- package/dist/tools/search.js.map +1 -1
- package/dist/types.d.ts +147 -2
- package/dist/types.d.ts.map +1 -1
- package/package.json +43 -4
|
@@ -0,0 +1,329 @@
|
|
|
1
|
+
import { extractKeyTerms, buildFTS5Query } from '../embedding/key-terms.js';
|
|
2
|
+
import { reciprocalRankFusion, sortByRRFScore } from './rrf.js';
|
|
3
|
+
import { searchCache, getCachedContent, normalizeUrl } from '../cache/store.js';
|
|
4
|
+
import { filterByDomains } from './filters.js';
|
|
5
|
+
import { handleSearch } from '../tools/search.js';
|
|
6
|
+
import { extractContent } from '../extraction/pipeline.js';
|
|
7
|
+
import { getEmbeddingService } from '../embedding/embed.js';
|
|
8
|
+
import { createLogger } from '../logger.js';
|
|
9
|
+
// Module logger, created with the 'search' label.
const log = createLogger('search');
|
|
10
|
+
// Result limit applied by findSimilar when input.max_results is null or undefined.
const DEFAULT_MAX_RESULTS = 10;
|
|
11
|
+
// Candidate cap that findSimilar passes to runFTS5Search as maxCandidates.
const MAX_FTS5_CANDIDATES = 20;
|
|
12
|
+
// Upper bound on the number of queries returned by generateSearchQueries.
const WEB_SEARCH_QUERY_COUNT = 3;
|
|
13
|
+
/**
 * Finds pages similar to a URL or a free-text concept.
 *
 * Flow: derive key terms from the input, query the local cache through FTS5,
 * top up with web search when the cache produced fewer than `max_results`
 * hits, then merge both rankings with reciprocal rank fusion.
 *
 * This function never throws: any failure is logged and reported through the
 * `error` field of an otherwise empty response.
 *
 * @param input - Request options. Reads `url`, `concept`, `max_results`
 *   (default DEFAULT_MAX_RESULTS), `include_cache` (default true),
 *   `include_web` (default true), `include_domains` and `exclude_domains`.
 * @param engines - Forwarded untouched to the web search fallback.
 * @param router - Fetch router used for signal extraction and web search.
 * @param backendStatus - Forwarded untouched to the web search fallback.
 * @returns An object with `results`, `method`, `cache_hits`, `search_hits`,
 *   `embedding_available` (always false here), `total_time_ms` and, on
 *   failure, `error`.
 */
export async function findSimilar(input, engines, router, backendStatus) {
    const startedAt = Date.now();
    // Shared shape for every "nothing to return" outcome.
    const emptyOutput = (error) => ({
        results: [],
        method: 'fts5',
        cache_hits: 0,
        search_hits: 0,
        embedding_available: false,
        error,
        total_time_ms: Date.now() - startedAt,
    });
    try {
        const url = input.url?.trim();
        const concept = input.concept?.trim();
        if (!url && !concept) {
            return emptyOutput('Either url or concept must be provided');
        }
        const maxResults = input.max_results ?? DEFAULT_MAX_RESULTS;
        const includeCache = input.include_cache ?? true;
        const includeWeb = input.include_web ?? true;
        const signal = await prepareSignal(url, concept, router);
        const hasTerms = signal.terms.length > 0;
        if (!hasTerms) {
            log.warn('no key terms extracted, falling back to web search');
            if (!includeWeb) {
                return emptyOutput('Could not extract key terms from input and web search is disabled');
            }
        }
        // Stage 1: full-text search over cached pages.
        const fts5RankMap = new Map();
        let cacheResults = [];
        if (includeCache && hasTerms) {
            cacheResults = runFTS5Search(signal.terms, signal.inputNormalizedUrl, input.include_domains, input.exclude_domains, MAX_FTS5_CANDIDATES, fts5RankMap);
            log.debug('FTS5 search complete', { hits: cacheResults.length });
        }
        // Stage 2: web search, only when the cache alone cannot fill the quota.
        const searchRankMap = new Map();
        let searchResults = [];
        if (includeWeb && cacheResults.length < maxResults) {
            searchResults = await runWebSearchFallback(signal, engines, router, backendStatus, maxResults, signal.inputNormalizedUrl, input.include_domains, input.exclude_domains, searchRankMap);
            log.debug('web search fallback complete', { hits: searchResults.length });
        }
        // Stage 3: fuse whichever rankings are non-empty.
        const rankedLists = [fts5RankMap, searchRankMap].filter((ranks) => ranks.size > 0);
        const finalResults = rankedLists.length >= 1
            ? fuseResults(rankedLists, cacheResults, searchResults, maxResults)
            : [...cacheResults, ...searchResults]
                .sort((a, b) => b.relevance_score - a.relevance_score)
                .slice(0, maxResults);
        // `method` reflects which stages produced candidates before fusion.
        const method = determineMethod(cacheResults.length > 0, searchResults.length > 0);
        let cacheHits = 0;
        let searchHits = 0;
        for (const { source } of finalResults) {
            if (source === 'cache') {
                cacheHits += 1;
            }
            else if (source === 'search') {
                searchHits += 1;
            }
        }
        return {
            results: finalResults,
            method,
            cache_hits: cacheHits,
            search_hits: searchHits,
            embedding_available: false,
            total_time_ms: Date.now() - startedAt,
        };
    }
    catch (err) {
        log.error('findSimilar failed', { error: String(err) });
        const reason = err instanceof Error ? err.message : String(err);
        return emptyOutput(`find_similar failed: ${reason}`);
    }
}
|
|
101
|
+
/**
 * Builds the search signal (key terms plus a title) for a find-similar request.
 *
 * A URL takes precedence over a concept. With neither, an empty signal is
 * returned.
 *
 * @param url - Trimmed input URL, if any.
 * @param concept - Trimmed free-text concept, if any.
 * @param router - Fetch router, used only on the URL path.
 * @returns A signal object with at least `terms` and `title`.
 */
async function prepareSignal(url, concept, router) {
    if (!url) {
        return concept
            ? { terms: extractKeyTerms(concept, ''), title: concept }
            : { terms: [], title: '' };
    }
    const urlSignal = await prepareSignalFromUrl(url, router);
    return urlSignal;
}
|
|
111
|
+
/**
 * Derives a search signal from a URL.
 *
 * Sources are tried in order: the cached copy of the page, a live fetch plus
 * content extraction, and finally the URL string itself when the fetch or
 * extraction fails.
 *
 * @param url - The input URL.
 * @param router - Fetch router used when the page is not cached.
 * @returns `{ terms, title, inputUrl, inputNormalizedUrl }`, where
 *   `inputNormalizedUrl` falls back to the raw URL if normalization throws.
 */
async function prepareSignalFromUrl(url, router) {
    const inputNormalizedUrl = (() => {
        try {
            return normalizeUrl(url);
        }
        catch {
            return url;
        }
    })();
    // Every outcome shares the same envelope; only terms and title vary.
    const toSignal = (terms, title) => ({
        terms,
        title,
        inputUrl: url,
        inputNormalizedUrl,
    });
    const cacheEntry = getCachedContent(url);
    if (cacheEntry) {
        return toSignal(extractKeyTerms(cacheEntry.markdown, cacheEntry.title), cacheEntry.title);
    }
    try {
        log.info('fetching URL for signal extraction', { url });
        const raw = await router.fetch(url, { renderJs: 'auto' });
        const { html, finalUrl, contentType } = raw;
        const extraction = await extractContent(html, finalUrl, { contentType });
        return toSignal(extractKeyTerms(extraction.markdown, extraction.title), extraction.title);
    }
    catch (err) {
        log.warn('failed to fetch URL for signal extraction', { url, error: String(err) });
        // Last resort: mine terms from the URL text itself.
        return toSignal(extractKeyTerms('', url), url);
    }
}
|
|
154
|
+
/**
 * Runs an FTS5 query over the local cache and returns ranked candidates.
 *
 * Changes from the previous version:
 * - Entries that normalize to the same URL are collapsed to the first
 *   (best-ranked) one, so a later duplicate no longer overwrites the rank and
 *   duplicates no longer use up candidate slots.
 * - An entry without markdown yields an empty string instead of throwing and
 *   discarding every cache hit.
 * - `rankMap` is written only after the whole scan succeeded, so a failure
 *   can no longer leave ranks that point at results which were never returned.
 *
 * @param terms - Key terms used to build the FTS5 query.
 * @param excludeNormalizedUrl - Normalized URL to drop from the hits (the
 *   input page itself); falsy to keep everything.
 * @param includeDomains - Passed to filterByDomains.
 * @param excludeDomains - Passed to filterByDomains.
 * @param maxCandidates - Maximum number of candidates to return.
 * @param rankMap - Output map, filled with normalized URL -> 1-based rank.
 * @returns Cache results with `relevance_score` and `fused_score` of 0, or an
 *   empty array when no query can be built or the search fails.
 */
function runFTS5Search(terms, excludeNormalizedUrl, includeDomains, excludeDomains, maxCandidates, rankMap) {
    // A malformed cached URL must not abort the search; compare by raw value instead.
    const normalizeOrRaw = (rawUrl) => {
        try {
            return normalizeUrl(rawUrl);
        }
        catch {
            return rawUrl;
        }
    };
    try {
        const fts5Query = buildFTS5Query(terms);
        if (!fts5Query)
            return [];
        let cached = searchCache(fts5Query);
        if (excludeNormalizedUrl) {
            cached = cached.filter(c => normalizeOrRaw(c.url) !== excludeNormalizedUrl);
        }
        cached = filterByDomains(cached, includeDomains, excludeDomains);
        const results = [];
        // Collected locally and committed to rankMap only once the scan succeeds.
        const ranks = new Map();
        for (const entry of cached) {
            if (results.length >= maxCandidates)
                break;
            const nUrl = normalizeOrRaw(entry.url);
            // The first occurrence has the best rank; skip later duplicates.
            if (ranks.has(nUrl))
                continue;
            const rank = results.length + 1;
            ranks.set(nUrl, rank);
            results.push({
                url: entry.url,
                title: entry.title,
                // NOTE(review): assumes a cached row may lack markdown - confirm against the cache schema.
                markdown: (entry.markdown ?? '').slice(0, 5000),
                relevance_score: 0,
                source: 'cache',
                match_signals: {
                    fts5_rank: rank,
                    fused_score: 0,
                },
            });
        }
        for (const [nUrl, rank] of ranks) {
            rankMap.set(nUrl, rank);
        }
        return results;
    }
    catch (err) {
        log.error('FTS5 search failed', { error: String(err) });
        return [];
    }
}
|
|
202
|
+
/**
 * Runs up to WEB_SEARCH_QUERY_COUNT web searches derived from the signal and
 * returns the de-duplicated hits in discovery order.
 *
 * Queries run sequentially. A failing query is logged and skipped so the
 * remaining queries still contribute.
 *
 * Change from the previous version: a hit with neither `markdown_content` nor
 * `snippet` now yields empty markdown instead of throwing. Previously the
 * throw happened after `seenUrls` and `rankMap` had been updated, which left a
 * rank with no matching result and dropped the rest of that query's hits.
 *
 * @param signal - Search signal; `terms` and `title` drive query generation.
 * @param engines - Forwarded to handleSearch.
 * @param router - Forwarded to handleSearch.
 * @param backendStatus - Forwarded to handleSearch.
 * @param maxResults - Per-query `max_results` passed to handleSearch.
 * @param excludeNormalizedUrl - Normalized URL to suppress (the input page).
 * @param includeDomains - Forwarded to handleSearch as `include_domains`.
 * @param excludeDomains - Forwarded to handleSearch as `exclude_domains`.
 * @param rankMap - Output map, filled with normalized URL -> 1-based rank.
 * @returns Results tagged `source: 'search'`, or an empty array when no
 *   queries can be generated or an unexpected error occurs.
 */
async function runWebSearchFallback(signal, engines, router, backendStatus, maxResults, excludeNormalizedUrl, includeDomains, excludeDomains, rankMap) {
    try {
        const queries = generateSearchQueries(signal.terms, signal.title);
        if (queries.length === 0)
            return [];
        const allResults = [];
        const seenUrls = new Set();
        if (excludeNormalizedUrl) {
            // Pre-seeding the seen set keeps the input page out of its own results.
            seenUrls.add(excludeNormalizedUrl);
        }
        for (const query of queries) {
            try {
                const searchOutput = await handleSearch({
                    query,
                    max_results: maxResults,
                    include_content: true,
                    include_domains: includeDomains,
                    exclude_domains: excludeDomains,
                }, engines, router, backendStatus);
                for (const item of searchOutput.results) {
                    let nUrl;
                    try {
                        nUrl = normalizeUrl(item.url);
                    }
                    catch {
                        nUrl = item.url;
                    }
                    if (seenUrls.has(nUrl))
                        continue;
                    // Resolve the content before touching shared state so that
                    // seenUrls, rankMap and allResults always stay in sync.
                    const markdown = (item.markdown_content ?? item.snippet ?? '').slice(0, 5000);
                    seenUrls.add(nUrl);
                    const rank = allResults.length + 1;
                    rankMap.set(nUrl, rank);
                    allResults.push({
                        url: item.url,
                        title: item.title,
                        markdown,
                        relevance_score: item.relevance_score,
                        source: 'search',
                        match_signals: {
                            fused_score: 0,
                        },
                    });
                }
            }
            catch (err) {
                log.warn('web search query failed', { query, error: String(err) });
            }
        }
        // Best effort: hand fetched content to the embedding service. The call
        // is not awaited, and a failure here never affects the returned results.
        try {
            const embeddingService = getEmbeddingService();
            if (embeddingService.isAvailable()) {
                for (const result of allResults) {
                    if (result.markdown) {
                        embeddingService.embedAsync(result.url, result.markdown);
                    }
                }
            }
        }
        catch (err) {
            log.debug('embedding hook skipped for find_similar results', { error: String(err) });
        }
        return allResults;
    }
    catch (err) {
        log.error('web search fallback failed', { error: String(err) });
        return [];
    }
}
|
|
270
|
+
/**
 * Derives web search queries from the key terms and title.
 *
 * Candidates, in priority order:
 *   1. the title, truncated to 150 characters (only if longer than 3 chars);
 *   2. the first five terms joined by spaces (needs at least 3 terms);
 *   3. the first three terms plus "tutorial guide" (needs at least 2 terms).
 * Duplicates are removed and the list is capped at WEB_SEARCH_QUERY_COUNT.
 *
 * @param terms - Extracted key terms.
 * @param title - Page title or concept text.
 * @returns Unique query strings; empty when there are no terms and no title.
 */
function generateSearchQueries(terms, title) {
    const termCount = terms.length;
    if (!title && termCount === 0) {
        return [];
    }
    const queries = [];
    // Append only unseen queries, preserving first-seen order.
    const addQuery = (candidate) => {
        if (!queries.includes(candidate)) {
            queries.push(candidate);
        }
    };
    if (title && title.length > 3) {
        addQuery(title.slice(0, 150));
    }
    if (termCount >= 3) {
        addQuery(terms.slice(0, 5).join(' '));
    }
    if (termCount >= 2) {
        const leadingTerms = terms.slice(0, 3).join(' ');
        addQuery(`${leadingTerms} tutorial guide`);
    }
    return queries.slice(0, WEB_SEARCH_QUERY_COUNT);
}
|
|
286
|
+
/**
 * Merges cache and web results into one list ordered by RRF score.
 *
 * @param rankedLists - Rank maps (normalized URL -> rank) to fuse.
 * @param cacheResults - Results from the cache search.
 * @param searchResults - Results from the web search.
 * @param maxResults - Maximum number of fused results to return.
 * @returns Copies of the matching results with `relevance_score` and
 *   `match_signals.fused_score` set to the fused score. When a URL appears in
 *   both inputs, the cache result is the one kept.
 */
function fuseResults(rankedLists, cacheResults, searchResults, maxResults) {
    const ordered = sortByRRFScore(reciprocalRankFusion(rankedLists));
    const keyFor = (rawUrl) => {
        try {
            return normalizeUrl(rawUrl);
        }
        catch {
            return rawUrl;
        }
    };
    // Index results by normalized URL; cache entries come first and therefore win.
    const byNormalizedUrl = new Map();
    for (const candidate of [...cacheResults, ...searchResults]) {
        const key = keyFor(candidate.url);
        if (byNormalizedUrl.has(key)) {
            continue;
        }
        byNormalizedUrl.set(key, candidate);
    }
    const fused = [];
    for (const [normalizedUrl, fusedScore] of ordered) {
        if (fused.length >= maxResults) {
            break;
        }
        const match = byNormalizedUrl.get(normalizedUrl);
        if (match) {
            fused.push({
                ...match,
                relevance_score: fusedScore,
                match_signals: {
                    ...match.match_signals,
                    fused_score: fusedScore,
                },
            });
        }
    }
    return fused;
}
|
|
320
|
+
/**
 * Names the retrieval method from which sources produced candidates.
 *
 * @param hasCache - Whether the cache search returned anything.
 * @param hasSearch - Whether the web search returned anything.
 * @returns 'hybrid' when both did, 'search' when only web search did, and
 *   'fts5' otherwise (including when neither did).
 */
function determineMethod(hasCache, hasSearch) {
    if (!hasSearch) {
        return 'fts5';
    }
    return hasCache ? 'hybrid' : 'search';
}
|
|
329
|
+
//# sourceMappingURL=find-similar.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"find-similar.js","sourceRoot":"","sources":["../../src/search/find-similar.ts"],"names":[],"mappings":"AASA,OAAO,EAAE,eAAe,EAAE,cAAc,EAAE,MAAM,2BAA2B,CAAC;AAC5E,OAAO,EAAE,oBAAoB,EAAgB,cAAc,EAAE,MAAM,UAAU,CAAC;AAC9E,OAAO,EAAE,WAAW,EAAE,gBAAgB,EAAE,YAAY,EAAE,MAAM,mBAAmB,CAAC;AAChF,OAAO,EAAE,eAAe,EAAE,MAAM,cAAc,CAAC;AAC/C,OAAO,EAAE,YAAY,EAAE,MAAM,oBAAoB,CAAC;AAClD,OAAO,EAAE,cAAc,EAAE,MAAM,2BAA2B,CAAC;AAC3D,OAAO,EAAE,mBAAmB,EAAE,MAAM,uBAAuB,CAAC;AAC5D,OAAO,EAAE,YAAY,EAAE,MAAM,cAAc,CAAC;AAE5C,MAAM,GAAG,GAAG,YAAY,CAAC,QAAQ,CAAC,CAAC;AAEnC,MAAM,mBAAmB,GAAG,EAAE,CAAC;AAC/B,MAAM,mBAAmB,GAAG,EAAE,CAAC;AAC/B,MAAM,sBAAsB,GAAG,CAAC,CAAC;AASjC,MAAM,CAAC,KAAK,UAAU,WAAW,CAC/B,KAAuB,EACvB,OAAuB,EACvB,MAAmB,EACnB,aAA6B;IAE7B,MAAM,KAAK,GAAG,IAAI,CAAC,GAAG,EAAE,CAAC;IAEzB,IAAI,CAAC;QACH,MAAM,GAAG,GAAG,KAAK,CAAC,GAAG,EAAE,IAAI,EAAE,CAAC;QAC9B,MAAM,OAAO,GAAG,KAAK,CAAC,OAAO,EAAE,IAAI,EAAE,CAAC;QAEtC,IAAI,CAAC,GAAG,IAAI,CAAC,OAAO,EAAE,CAAC;YACrB,OAAO;gBACL,OAAO,EAAE,EAAE;gBACX,MAAM,EAAE,MAAM;gBACd,UAAU,EAAE,CAAC;gBACb,WAAW,EAAE,CAAC;gBACd,mBAAmB,EAAE,KAAK;gBAC1B,KAAK,EAAE,wCAAwC;gBAC/C,aAAa,EAAE,IAAI,CAAC,GAAG,EAAE,GAAG,KAAK;aAClC,CAAC;QACJ,CAAC;QAED,MAAM,UAAU,GAAG,KAAK,CAAC,WAAW,IAAI,mBAAmB,CAAC;QAC5D,MAAM,YAAY,GAAG,KAAK,CAAC,aAAa,IAAI,IAAI,CAAC;QACjD,MAAM,UAAU,GAAG,KAAK,CAAC,WAAW,IAAI,IAAI,CAAC;QAE7C,MAAM,MAAM,GAAG,MAAM,aAAa,CAAC,GAAG,EAAE,OAAO,EAAE,MAAM,CAAC,CAAC;QAEzD,IAAI,MAAM,CAAC,KAAK,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;YAC9B,GAAG,CAAC,IAAI,CAAC,oDAAoD,CAAC,CAAC;YAE/D,IAAI,CAAC,UAAU,EAAE,CAAC;gBAChB,OAAO;oBACL,OAAO,EAAE,EAAE;oBACX,MAAM,EAAE,MAAM;oBACd,UAAU,EAAE,CAAC;oBACb,WAAW,EAAE,CAAC;oBACd,mBAAmB,EAAE,KAAK;oBAC1B,KAAK,EAAE,mEAAmE;oBAC1E,aAAa,EAAE,IAAI,CAAC,GAAG,EAAE,GAAG,KAAK;iBAClC,CAAC;YACJ,CAAC;QACH,CAAC;QAED,uBAAuB;QACvB,IAAI,YAAY,GAAwB,EAAE,CAAC;QAC3C,MAAM,WAAW,GAAG,IAAI,GAAG,EAAkB,CAAC;QAE9C,IAAI,YAAY,IAAI,MAAM,CAAC,KAAK,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;YAC5C,YAAY,GAAG,aAAa,CAC1B,MAAM,CAAC,KAAK,EACZ,MAAM,CAAC,kBAAkB,EACzB,KAAK,CAAC,eAAe,EACrB,KAAK,CAAC,eAAe,EACr
B,mBAAmB,EACnB,WAAW,CACZ,CAAC;YACF,GAAG,CAAC,KAAK,CAAC,sBAAsB,EAAE,EAAE,IAAI,EAAE,YAAY,CAAC,MAAM,EAAE,CAAC,CAAC;QACnE,CAAC;QAED,sBAAsB;QACtB,IAAI,aAAa,GAAwB,EAAE,CAAC;QAC5C,MAAM,aAAa,GAAG,IAAI,GAAG,EAAkB,CAAC;QAEhD,IAAI,YAAY,CAAC,MAAM,GAAG,UAAU,IAAI,UAAU,EAAE,CAAC;YACnD,aAAa,GAAG,MAAM,oBAAoB,CACxC,MAAM,EACN,OAAO,EACP,MAAM,EACN,aAAa,EACb,UAAU,EACV,MAAM,CAAC,kBAAkB,EACzB,KAAK,CAAC,eAAe,EACrB,KAAK,CAAC,eAAe,EACrB,aAAa,CACd,CAAC;YACF,GAAG,CAAC,KAAK,CAAC,8BAA8B,EAAE,EAAE,IAAI,EAAE,aAAa,CAAC,MAAM,EAAE,CAAC,CAAC;QAC5E,CAAC;QAED,uBAAuB;QACvB,MAAM,WAAW,GAA0B,EAAE,CAAC;QAC9C,IAAI,WAAW,CAAC,IAAI,GAAG,CAAC;YAAE,WAAW,CAAC,IAAI,CAAC,WAAW,CAAC,CAAC;QACxD,IAAI,aAAa,CAAC,IAAI,GAAG,CAAC;YAAE,WAAW,CAAC,IAAI,CAAC,aAAa,CAAC,CAAC;QAE5D,IAAI,YAAiC,CAAC;QAEtC,IAAI,WAAW,CAAC,MAAM,IAAI,CAAC,EAAE,CAAC;YAC5B,YAAY,GAAG,WAAW,CAAC,WAAW,EAAE,YAAY,EAAE,aAAa,EAAE,UAAU,CAAC,CAAC;QACnF,CAAC;aAAM,CAAC;YACN,YAAY,GAAG,CAAC,GAAG,YAAY,EAAE,GAAG,aAAa,CAAC;iBAC/C,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,eAAe,GAAG,CAAC,CAAC,eAAe,CAAC;iBACrD,KAAK,CAAC,CAAC,EAAE,UAAU,CAAC,CAAC;QAC1B,CAAC;QAED,MAAM,MAAM,GAAG,eAAe,CAAC,YAAY,CAAC,MAAM,GAAG,CAAC,EAAE,aAAa,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC;QAElF,MAAM,SAAS,GAAG,YAAY,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,MAAM,KAAK,OAAO,CAAC,CAAC,MAAM,CAAC;QACxE,MAAM,UAAU,GAAG,YAAY,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,MAAM,KAAK,QAAQ,CAAC,CAAC,MAAM,CAAC;QAE1E,OAAO;YACL,OAAO,EAAE,YAAY;YACrB,MAAM;YACN,UAAU,EAAE,SAAS;YACrB,WAAW,EAAE,UAAU;YACvB,mBAAmB,EAAE,KAAK;YAC1B,aAAa,EAAE,IAAI,CAAC,GAAG,EAAE,GAAG,KAAK;SAClC,CAAC;IACJ,CAAC;IAAC,OAAO,GAAG,EAAE,CAAC;QACb,GAAG,CAAC,KAAK,CAAC,oBAAoB,EAAE,EAAE,KAAK,EAAE,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;QACxD,OAAO;YACL,OAAO,EAAE,EAAE;YACX,MAAM,EAAE,MAAM;YACd,UAAU,EAAE,CAAC;YACb,WAAW,EAAE,CAAC;YACd,mBAAmB,EAAE,KAAK;YAC1B,KAAK,EAAE,wBAAwB,GAAG,YAAY,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,GAAG,CAAC,EAAE;YACjF,aAAa,EAAE,IAAI,CAAC,GAAG,EAAE,GAAG,KAAK;SAClC,CAAC;IACJ,CAAC;AACH,CAAC;AAED,KAAK,UAAU,aAAa,CAC1B,GAAuB,EACvB
,OAA2B,EAC3B,MAAmB;IAEnB,IAAI,GAAG,EAAE,CAAC;QACR,OAAO,MAAM,oBAAoB,CAAC,GAAG,EAAE,MAAM,CAAC,CAAC;IACjD,CAAC;IAED,IAAI,OAAO,EAAE,CAAC;QACZ,MAAM,KAAK,GAAG,eAAe,CAAC,OAAO,EAAE,EAAE,CAAC,CAAC;QAC3C,OAAO,EAAE,KAAK,EAAE,KAAK,EAAE,OAAO,EAAE,CAAC;IACnC,CAAC;IAED,OAAO,EAAE,KAAK,EAAE,EAAE,EAAE,KAAK,EAAE,EAAE,EAAE,CAAC;AAClC,CAAC;AAED,KAAK,UAAU,oBAAoB,CACjC,GAAW,EACX,MAAmB;IAEnB,IAAI,kBAA0B,CAAC;IAC/B,IAAI,CAAC;QACH,kBAAkB,GAAG,YAAY,CAAC,GAAG,CAAC,CAAC;IACzC,CAAC;IAAC,MAAM,CAAC;QACP,kBAAkB,GAAG,GAAG,CAAC;IAC3B,CAAC;IAED,MAAM,MAAM,GAAG,gBAAgB,CAAC,GAAG,CAAC,CAAC;IACrC,IAAI,MAAM,EAAE,CAAC;QACX,MAAM,KAAK,GAAG,eAAe,CAAC,MAAM,CAAC,QAAQ,EAAE,MAAM,CAAC,KAAK,CAAC,CAAC;QAC7D,OAAO;YACL,KAAK;YACL,KAAK,EAAE,MAAM,CAAC,KAAK;YACnB,QAAQ,EAAE,GAAG;YACb,kBAAkB,EAAE,kBAAkB;SACvC,CAAC;IACJ,CAAC;IAED,IAAI,CAAC;QACH,GAAG,CAAC,IAAI,CAAC,oCAAoC,EAAE,EAAE,GAAG,EAAE,CAAC,CAAC;QACxD,MAAM,GAAG,GAAG,MAAM,MAAM,CAAC,KAAK,CAAC,GAAG,EAAE,EAAE,QAAQ,EAAE,MAAM,EAAE,CAAC,CAAC;QAC1D,MAAM,UAAU,GAAG,MAAM,cAAc,CAAC,GAAG,CAAC,IAAI,EAAE,GAAG,CAAC,QAAQ,EAAE;YAC9D,WAAW,EAAE,GAAG,CAAC,WAAW;SAC7B,CAAC,CAAC;QACH,MAAM,KAAK,GAAG,eAAe,CAAC,UAAU,CAAC,QAAQ,EAAE,UAAU,CAAC,KAAK,CAAC,CAAC;QACrE,OAAO;YACL,KAAK;YACL,KAAK,EAAE,UAAU,CAAC,KAAK;YACvB,QAAQ,EAAE,GAAG;YACb,kBAAkB,EAAE,kBAAkB;SACvC,CAAC;IACJ,CAAC;IAAC,OAAO,GAAG,EAAE,CAAC;QACb,GAAG,CAAC,IAAI,CAAC,2CAA2C,EAAE,EAAE,GAAG,EAAE,KAAK,EAAE,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;QACnF,MAAM,QAAQ,GAAG,eAAe,CAAC,EAAE,EAAE,GAAG,CAAC,CAAC;QAC1C,OAAO;YACL,KAAK,EAAE,QAAQ;YACf,KAAK,EAAE,GAAG;YACV,QAAQ,EAAE,GAAG;YACb,kBAAkB,EAAE,kBAAkB;SACvC,CAAC;IACJ,CAAC;AACH,CAAC;AAED,SAAS,aAAa,CACpB,KAAe,EACf,oBAAwC,EACxC,cAAoC,EACpC,cAAoC,EACpC,aAAqB,EACrB,OAA4B;IAE5B,IAAI,CAAC;QACH,MAAM,SAAS,GAAG,cAAc,CAAC,KAAK,CAAC,CAAC;QACxC,IAAI,CAAC,SAAS;YAAE,OAAO,EAAE,CAAC;QAE1B,IAAI,MAAM,GAAG,WAAW,CAAC,SAAS,CAAC,CAAC;QAEpC,IAAI,oBAAoB,EAAE,CAAC;YACzB,MAAM,GAAG,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE;gBACzB,IAAI,CAAC;oBACH,OAAO,YAAY,CAAC,CAAC,CAAC,GAAG,CAAC,KAAK,oBAAoB,CAAC;gBACtD,CAAC;gBAAC,MAAM,CAAC;oBACP,OAAO,CAAC,CAAC,G
AAG,KAAK,oBAAoB,CAAC;gBACxC,CAAC;YACH,CAAC,CAAC,CAAC;QACL,CAAC;QAED,MAAM,GAAG,eAAe,CAAC,MAAM,EAAE,cAAc,EAAE,cAAc,CAAoB,CAAC;QACpF,MAAM,GAAG,MAAM,CAAC,KAAK,CAAC,CAAC,EAAE,aAAa,CAAC,CAAC;QAExC,MAAM,OAAO,GAAwB,EAAE,CAAC;QACxC,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,MAAM,CAAC,MAAM,EAAE,CAAC,EAAE,EAAE,CAAC;YACvC,MAAM,KAAK,GAAG,MAAM,CAAC,CAAC,CAAC,CAAC;YACxB,IAAI,IAAY,CAAC;YACjB,IAAI,CAAC;gBACH,IAAI,GAAG,YAAY,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC;YACjC,CAAC;YAAC,MAAM,CAAC;gBACP,IAAI,GAAG,KAAK,CAAC,GAAG,CAAC;YACnB,CAAC;YAED,OAAO,CAAC,GAAG,CAAC,IAAI,EAAE,CAAC,GAAG,CAAC,CAAC,CAAC;YAEzB,OAAO,CAAC,IAAI,CAAC;gBACX,GAAG,EAAE,KAAK,CAAC,GAAG;gBACd,KAAK,EAAE,KAAK,CAAC,KAAK;gBAClB,QAAQ,EAAE,KAAK,CAAC,QAAQ,CAAC,KAAK,CAAC,CAAC,EAAE,IAAI,CAAC;gBACvC,eAAe,EAAE,CAAC;gBAClB,MAAM,EAAE,OAAO;gBACf,aAAa,EAAE;oBACb,SAAS,EAAE,CAAC,GAAG,CAAC;oBAChB,WAAW,EAAE,CAAC;iBACf;aACF,CAAC,CAAC;QACL,CAAC;QAED,OAAO,OAAO,CAAC;IACjB,CAAC;IAAC,OAAO,GAAG,EAAE,CAAC;QACb,GAAG,CAAC,KAAK,CAAC,oBAAoB,EAAE,EAAE,KAAK,EAAE,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;QACxD,OAAO,EAAE,CAAC;IACZ,CAAC;AACH,CAAC;AAED,KAAK,UAAU,oBAAoB,CACjC,MAAsB,EACtB,OAAuB,EACvB,MAAmB,EACnB,aAAwC,EACxC,UAAkB,EAClB,oBAAwC,EACxC,cAAoC,EACpC,cAAoC,EACpC,OAA4B;IAE5B,IAAI,CAAC;QACH,MAAM,OAAO,GAAG,qBAAqB,CAAC,MAAM,CAAC,KAAK,EAAE,MAAM,CAAC,KAAK,CAAC,CAAC;QAClE,IAAI,OAAO,CAAC,MAAM,KAAK,CAAC;YAAE,OAAO,EAAE,CAAC;QAEpC,MAAM,UAAU,GAAwB,EAAE,CAAC;QAC3C,MAAM,QAAQ,GAAG,IAAI,GAAG,EAAU,CAAC;QAEnC,IAAI,oBAAoB,EAAE,CAAC;YACzB,QAAQ,CAAC,GAAG,CAAC,oBAAoB,CAAC,CAAC;QACrC,CAAC;QAED,KAAK,MAAM,KAAK,IAAI,OAAO,EAAE,CAAC;YAC5B,IAAI,CAAC;gBACH,MAAM,YAAY,GAAG,MAAM,YAAY,CACrC;oBACE,KAAK;oBACL,WAAW,EAAE,UAAU;oBACvB,eAAe,EAAE,IAAI;oBACrB,eAAe,EAAE,cAAc;oBAC/B,eAAe,EAAE,cAAc;iBAChC,EACD,OAAO,EACP,MAAM,EACN,aAAa,CACd,CAAC;gBAEF,KAAK,MAAM,IAAI,IAAI,YAAY,CAAC,OAAO,EAAE,CAAC;oBACxC,IAAI,IAAY,CAAC;oBACjB,IAAI,CAAC;wBACH,IAAI,GAAG,YAAY,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;oBAChC,CAAC;oBAAC,MAAM,CAAC;wBACP,IAAI,GAAG,IAAI,CAAC,GAAG,CAAC;oBAClB,CAAC;oBAED,IAAI,QAAQ,CAAC,GAAG,CAAC,IAAI,CAAC;wBAAE,SAAS;oBACj
C,QAAQ,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC;oBAEnB,MAAM,IAAI,GAAG,UAAU,CAAC,MAAM,GAAG,CAAC,CAAC;oBACnC,OAAO,CAAC,GAAG,CAAC,IAAI,EAAE,IAAI,CAAC,CAAC;oBAExB,UAAU,CAAC,IAAI,CAAC;wBACd,GAAG,EAAE,IAAI,CAAC,GAAG;wBACb,KAAK,EAAE,IAAI,CAAC,KAAK;wBACjB,QAAQ,EAAE,CAAC,IAAI,CAAC,gBAAgB,IAAI,IAAI,CAAC,OAAO,CAAC,CAAC,KAAK,CAAC,CAAC,EAAE,IAAI,CAAC;wBAChE,eAAe,EAAE,IAAI,CAAC,eAAe;wBACrC,MAAM,EAAE,QAAQ;wBAChB,aAAa,EAAE;4BACb,WAAW,EAAE,CAAC;yBACf;qBACF,CAAC,CAAC;gBACL,CAAC;YACH,CAAC;YAAC,OAAO,GAAG,EAAE,CAAC;gBACb,GAAG,CAAC,IAAI,CAAC,yBAAyB,EAAE,EAAE,KAAK,EAAE,KAAK,EAAE,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;YACrE,CAAC;QACH,CAAC;QAED,IAAI,CAAC;YACH,MAAM,gBAAgB,GAAG,mBAAmB,EAAE,CAAC;YAC/C,IAAI,gBAAgB,CAAC,WAAW,EAAE,EAAE,CAAC;gBACnC,KAAK,MAAM,MAAM,IAAI,UAAU,EAAE,CAAC;oBAChC,IAAI,MAAM,CAAC,QAAQ,EAAE,CAAC;wBACpB,gBAAgB,CAAC,UAAU,CAAC,MAAM,CAAC,GAAG,EAAE,MAAM,CAAC,QAAQ,CAAC,CAAC;oBAC3D,CAAC;gBACH,CAAC;YACH,CAAC;QACH,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACb,GAAG,CAAC,KAAK,CAAC,iDAAiD,EAAE,EAAE,KAAK,EAAE,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;QACvF,CAAC;QAED,OAAO,UAAU,CAAC;IACpB,CAAC;IAAC,OAAO,GAAG,EAAE,CAAC;QACb,GAAG,CAAC,KAAK,CAAC,4BAA4B,EAAE,EAAE,KAAK,EAAE,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;QAChE,OAAO,EAAE,CAAC;IACZ,CAAC;AACH,CAAC;AAED,SAAS,qBAAqB,CAAC,KAAe,EAAE,KAAa;IAC3D,IAAI,KAAK,CAAC,MAAM,KAAK,CAAC,IAAI,CAAC,KAAK;QAAE,OAAO,EAAE,CAAC;IAE5C,MAAM,OAAO,GAAa,EAAE,CAAC;IAE7B,IAAI,KAAK,IAAI,KAAK,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QAC9B,OAAO,CAAC,IAAI,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC,EAAE,GAAG,CAAC,CAAC,CAAC;IACpC,CAAC;IAED,IAAI,KAAK,CAAC,MAAM,IAAI,CAAC,EAAE,CAAC;QACtB,OAAO,CAAC,IAAI,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC;IAC5C,CAAC;IAED,IAAI,KAAK,CAAC,MAAM,IAAI,CAAC,EAAE,CAAC;QACtB,OAAO,CAAC,IAAI,CAAC,GAAG,KAAK,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,iBAAiB,CAAC,CAAC;IAChE,CAAC;IAED,MAAM,MAAM,GAAG,CAAC,GAAG,IAAI,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC;IACrC,OAAO,MAAM,CAAC,KAAK,CAAC,CAAC,EAAE,sBAAsB,CAAC,CAAC;AACjD,CAAC;AAED,SAAS,WAAW,CAClB,WAAkC,EAClC,YAAiC,EACjC,aAAkC
,EAClC,UAAkB;IAElB,MAAM,MAAM,GAAG,oBAAoB,CAAC,WAAW,CAAC,CAAC;IACjD,MAAM,MAAM,GAAG,cAAc,CAAC,MAAM,CAAC,CAAC;IAEtC,MAAM,sBAAsB,GAAG,IAAI,GAAG,EAA6B,CAAC;IACpE,KAAK,MAAM,CAAC,IAAI,CAAC,GAAG,YAAY,EAAE,GAAG,aAAa,CAAC,EAAE,CAAC;QACpD,IAAI,GAAW,CAAC;QAChB,IAAI,CAAC;YACH,GAAG,GAAG,YAAY,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC;QAC5B,CAAC;QAAC,MAAM,CAAC;YACP,GAAG,GAAG,CAAC,CAAC,GAAG,CAAC;QACd,CAAC;QACD,IAAI,CAAC,sBAAsB,CAAC,GAAG,CAAC,GAAG,CAAC,EAAE,CAAC;YACrC,sBAAsB,CAAC,GAAG,CAAC,GAAG,EAAE,CAAC,CAAC,CAAC;QACrC,CAAC;IACH,CAAC;IAED,MAAM,KAAK,GAAwB,EAAE,CAAC;IACtC,KAAK,MAAM,CAAC,IAAI,EAAE,KAAK,CAAC,IAAI,MAAM,EAAE,CAAC;QACnC,IAAI,KAAK,CAAC,MAAM,IAAI,UAAU;YAAE,MAAM;QAEtC,MAAM,MAAM,GAAG,sBAAsB,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC;QAChD,IAAI,CAAC,MAAM;YAAE,SAAS;QAEtB,KAAK,CAAC,IAAI,CAAC;YACT,GAAG,MAAM;YACT,eAAe,EAAE,KAAK;YACtB,aAAa,EAAE;gBACb,GAAG,MAAM,CAAC,aAAa;gBACvB,WAAW,EAAE,KAAK;aACnB;SACF,CAAC,CAAC;IACL,CAAC;IAED,OAAO,KAAK,CAAC;AACf,CAAC;AAED,SAAS,eAAe,CACtB,QAAiB,EACjB,SAAkB;IAElB,IAAI,QAAQ,IAAI,SAAS;QAAE,OAAO,QAAQ,CAAC;IAC3C,IAAI,QAAQ;QAAE,OAAO,MAAM,CAAC;IAC5B,IAAI,SAAS;QAAE,OAAO,QAAQ,CAAC;IAC/B,OAAO,MAAM,CAAC;AAChB,CAAC"}
|
|
@@ -0,0 +1,22 @@
|
|
|
1
|
+
import type { RawSearchResult, SearchEngine } from '../types.js';
|
|
2
|
+
import type { MergedSearchResult } from './dedup.js';
|
|
3
|
+
/**
 * Canonicalises a batch of search queries: each one is lower-cased, trimmed
 * and has runs of whitespace collapsed to a single space. Empty queries and
 * repeats are dropped (the first occurrence is kept, in input order), and the
 * list is capped at the configured `multiQueryMax`.
 *
 * @returns The normalised queries, or `[]` if normalisation throws.
 */
export declare function normalizeQueries(queries: string[]): string[];
|
|
4
|
+
/**
 * Search parameters applied to every engine/query pair issued by
 * `fanOutSearch`. All fields except `maxResults` are forwarded to the
 * engines unchanged.
 */
export interface FanOutOptions {
|
|
5
|
+
/**
 * Result count wanted by the caller. `fanOutSearch` multiplies it by an
 * over-fetch factor (2, or 3 when a domain filter is set) before calling
 * each engine.
 */
maxResults: number;
|
|
6
|
+
timeRange?: string;
|
|
7
|
+
language?: string;
|
|
8
|
+
/** A non-empty list raises the over-fetch factor from 2 to 3. */
includeDomains?: string[];
|
|
9
|
+
/** A non-empty list raises the over-fetch factor from 2 to 3. */
excludeDomains?: string[];
|
|
10
|
+
fromDate?: string;
|
|
11
|
+
toDate?: string;
|
|
12
|
+
category?: 'general' | 'news' | 'code' | 'docs' | 'papers' | 'images';
|
|
13
|
+
}
|
|
14
|
+
/** Aggregate outcome of a `fanOutSearch` call. */
export interface FanOutResult {
|
|
15
|
+
/** Raw results of every engine/query call, concatenated as they arrive (no de-duplication or ranking). */
results: RawSearchResult[];
|
|
16
|
+
/** Names of the engines that returned at least one result. */
enginesUsed: string[];
|
|
17
|
+
/**
 * One `engine(query): message` entry per failed engine call, plus a
 * `fanOutSearch: ...` entry if the fan-out itself throws.
 */
errors: string[];
|
|
18
|
+
}
|
|
19
|
+
/**
 * Runs every query against every engine, in batches sized by the configured
 * `multiQueryConcurrency`, and collects the raw results.
 *
 * A failing engine call is logged and recorded in `errors` rather than
 * thrown, so results from the remaining calls are still returned. When
 * `queries` or `engines` is empty the result is empty and no engine is called.
 */
export declare function fanOutSearch(queries: string[], engines: SearchEngine[], options: FanOutOptions): Promise<FanOutResult>;
|
|
20
|
+
/**
 * Joins the trimmed, non-empty queries into one string separated by `'; '`.
 *
 * @returns The joined string, or `''` if joining throws.
 */
export declare function synthesizeIntent(queries: string[]): string;
|
|
21
|
+
/**
 * Fuses several ranked result lists into one using reciprocal rank fusion,
 * keyed on the normalised URL (the raw URL is used when normalisation throws).
 *
 * Each URL is represented by the item from its best-ranked appearance.
 * `relevance_score` is the fused score divided by the highest fused score,
 * so the top result scores 1. The output is sorted by that score, descending.
 *
 * @returns The fused list, or `[]` when there is nothing to merge or merging throws.
 */
export declare function mergeWithRRF(rankedLists: MergedSearchResult[][]): MergedSearchResult[];
|
|
22
|
+
//# sourceMappingURL=multi-query.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"multi-query.d.ts","sourceRoot":"","sources":["../../src/search/multi-query.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,eAAe,EAAE,YAAY,EAAuB,MAAM,aAAa,CAAC;AACtF,OAAO,KAAK,EAAE,kBAAkB,EAAE,MAAM,YAAY,CAAC;AASrD,wBAAgB,gBAAgB,CAAC,OAAO,EAAE,MAAM,EAAE,GAAG,MAAM,EAAE,CA2B5D;AAED,MAAM,WAAW,aAAa;IAC5B,UAAU,EAAE,MAAM,CAAC;IACnB,SAAS,CAAC,EAAE,MAAM,CAAC;IACnB,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,cAAc,CAAC,EAAE,MAAM,EAAE,CAAC;IAC1B,cAAc,CAAC,EAAE,MAAM,EAAE,CAAC;IAC1B,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,QAAQ,CAAC,EAAE,SAAS,GAAG,MAAM,GAAG,MAAM,GAAG,MAAM,GAAG,QAAQ,GAAG,QAAQ,CAAC;CACvE;AAED,MAAM,WAAW,YAAY;IAC3B,OAAO,EAAE,eAAe,EAAE,CAAC;IAC3B,WAAW,EAAE,MAAM,EAAE,CAAC;IACtB,MAAM,EAAE,MAAM,EAAE,CAAC;CAClB;AAED,wBAAsB,YAAY,CAChC,OAAO,EAAE,MAAM,EAAE,EACjB,OAAO,EAAE,YAAY,EAAE,EACvB,OAAO,EAAE,aAAa,GACrB,OAAO,CAAC,YAAY,CAAC,CAsEvB;AAED,wBAAgB,gBAAgB,CAAC,OAAO,EAAE,MAAM,EAAE,GAAG,MAAM,CAO1D;AAED,wBAAgB,YAAY,CAAC,WAAW,EAAE,kBAAkB,EAAE,EAAE,GAAG,kBAAkB,EAAE,CAmDtF"}
|
|
@@ -0,0 +1,157 @@
|
|
|
1
|
+
import { normalizeUrl } from '../cache/store.js';
|
|
2
|
+
import { getConfig } from '../config.js';
|
|
3
|
+
import { createLogger } from '../logger.js';
|
|
4
|
+
// Logger used by every function in this module, created under the 'search' name.
const log = createLogger('search');
|
|
5
|
+
// Constant k in the reciprocal-rank-fusion term 1 / (RRF_K + rank + 1) computed by mergeWithRRF.
const RRF_K = 60;
|
|
6
|
+
/**
 * Canonicalise a batch of search queries before they are fanned out.
 *
 * Every query is lower-cased, trimmed, and has each run of whitespace
 * collapsed to a single space. Queries that end up empty are dropped, and
 * repeats are removed with the first occurrence kept in its original
 * position. The list is then capped at `config.multiQueryMax`; an overflow
 * is logged as a warning.
 *
 * @param queries Raw query strings.
 * @returns The normalised, de-duplicated queries, or `[]` if normalisation
 *          throws (the error is logged).
 */
export function normalizeQueries(queries) {
    try {
        const config = getConfig();
        // A Set iterates in insertion order, so it both de-duplicates and
        // preserves the position of each query's first occurrence.
        const unique = new Set();
        for (const raw of queries) {
            // A non-string entry would throw on `.toLowerCase()` and, via the
            // catch below, discard every other query as well. Skip only the
            // offending entry.
            if (typeof raw !== 'string') {
                continue;
            }
            const q = raw.toLowerCase().trim().replace(/\s+/g, ' ');
            if (q.length > 0) {
                unique.add(q);
            }
        }
        const normalized = [...unique];
        if (normalized.length > config.multiQueryMax) {
            log.warn('multi-query array exceeds max, truncating', {
                provided: normalized.length,
                max: config.multiQueryMax,
            });
            return normalized.slice(0, config.multiQueryMax);
        }
        return normalized;
    }
    catch (err) {
        log.error('normalizeQueries failed', { error: String(err) });
        return [];
    }
}
|
|
34
|
+
/**
 * Run every query against every engine and collect the raw results.
 *
 * Engine/query pairs are executed in batches of at most
 * `config.multiQueryConcurrency` concurrent calls. A failing call is logged
 * and recorded in `errors`; it does not abort the other calls.
 *
 * @param queries Queries to issue (normally already normalised).
 * @param engines Engines to query; each must expose `name` and `search(query, options)`.
 * @param options Shared search options. `maxResults` is over-fetched by a
 *                factor of 2, or 3 when a domain filter is present, because
 *                filtering discards part of what the engines return.
 * @returns `results` (all raw results, concatenated), `enginesUsed` (engines
 *          that returned at least one result) and `errors`.
 */
export async function fanOutSearch(queries, engines, options) {
    const allResults = [];
    const enginesUsed = new Set();
    const errors = [];
    if (queries.length === 0 || engines.length === 0) {
        return { results: [], enginesUsed: [], errors: [] };
    }
    try {
        const config = getConfig();
        // The batch size is the loop stride below. A value of 0 or a negative
        // number would never terminate the loop, and undefined/NaN would
        // silently run no searches, so fall back to one call at a time.
        const configuredConcurrency = Number(config.multiQueryConcurrency);
        const concurrency = Number.isFinite(configuredConcurrency) && configuredConcurrency >= 1
            ? Math.floor(configuredConcurrency)
            : 1;
        const hasFilterAttrition = !!(options.includeDomains?.length || options.excludeDomains?.length);
        const overfetchFactor = hasFilterAttrition ? 3 : 2;
        const engineOptions = {
            maxResults: options.maxResults * overfetchFactor,
            timeRange: options.timeRange,
            language: options.language,
            includeDomains: options.includeDomains,
            excludeDomains: options.excludeDomains,
            fromDate: options.fromDate,
            toDate: options.toDate,
            category: options.category,
        };
        // Engine-major order: all queries for the first engine, then the next.
        const tasks = [];
        for (const engine of engines) {
            for (const query of queries) {
                tasks.push({ engine, query });
            }
        }
        for (let i = 0; i < tasks.length; i += concurrency) {
            const batch = tasks.slice(i, i + concurrency);
            const promises = batch.map(async ({ engine, query }) => {
                try {
                    const results = await engine.search(query, engineOptions);
                    for (const r of results) {
                        allResults.push(r);
                        // Added inside the loop on purpose: an engine only
                        // counts as used once it has produced a result.
                        enginesUsed.add(engine.name);
                    }
                }
                catch (err) {
                    const msg = err instanceof Error ? err.message : String(err);
                    log.warn('multi-query engine search failed', {
                        engine: engine.name,
                        query,
                        error: msg,
                    });
                    errors.push(`${engine.name}(${query}): ${msg}`);
                }
            });
            // Each task catches its own failure, so this only waits for the batch.
            await Promise.allSettled(promises);
        }
        return {
            results: allResults,
            enginesUsed: [...enginesUsed],
            errors,
        };
    }
    catch (err) {
        log.error('fanOutSearch failed', { error: String(err) });
        // Return whatever was gathered before the failure.
        return {
            results: allResults,
            enginesUsed: [...enginesUsed],
            errors: [...errors, `fanOutSearch: ${String(err)}`],
        };
    }
}
|
|
99
|
+
/**
 * Build a single intent string from several queries.
 *
 * Each query is trimmed; queries that are empty after trimming are left out;
 * the remainder are joined with `'; '`.
 *
 * @param queries Query strings.
 * @returns The joined string, or `''` if joining throws (the error is logged).
 */
export function synthesizeIntent(queries) {
    try {
        const parts = queries.reduce((kept, query) => {
            const trimmed = query.trim();
            if (trimmed) {
                kept.push(trimmed);
            }
            return kept;
        }, []);
        return parts.join('; ');
    }
    catch (err) {
        log.error('synthesizeIntent failed', { error: String(err) });
        return '';
    }
}
|
|
108
|
+
/**
 * Fuse several ranked result lists into one with reciprocal rank fusion.
 *
 * Results are keyed by normalised URL (the raw URL is used when
 * normalisation throws). A URL at zero-based position `rank` in a list
 * contributes `1 / (RRF_K + rank + 1)`; contributions from different lists
 * are summed. Each URL is represented by the item from its best-ranked
 * appearance, and `relevance_score` is the fused score divided by the
 * highest fused score, so the top result scores 1.
 *
 * @param rankedLists One ranked list of results per source.
 * @returns Fused results sorted by `relevance_score`, descending; `[]` when
 *          there is nothing to merge or merging throws (the error is logged).
 */
export function mergeWithRRF(rankedLists) {
    try {
        const nonEmpty = rankedLists.filter(l => l.length > 0);
        if (nonEmpty.length === 0) {
            return [];
        }
        const rrfScores = new Map();
        const bestAppearance = new Map();
        for (const list of nonEmpty) {
            // RRF scores a document once per list. Without this guard a URL
            // that repeats inside one list (for example two variants that
            // normalise to the same URL) would be credited for every
            // occurrence and outrank results that several lists agree on.
            const seenInList = new Set();
            for (let rank = 0; rank < list.length; rank++) {
                const item = list[rank];
                let normalizedUrlStr;
                try {
                    normalizedUrlStr = normalizeUrl(item.url);
                }
                catch {
                    normalizedUrlStr = item.url;
                }
                if (seenInList.has(normalizedUrlStr)) {
                    // The first occurrence already holds the better rank.
                    continue;
                }
                seenInList.add(normalizedUrlStr);
                const rrfContribution = 1 / (RRF_K + rank + 1);
                const current = rrfScores.get(normalizedUrlStr) ?? 0;
                rrfScores.set(normalizedUrlStr, current + rrfContribution);
                const existing = bestAppearance.get(normalizedUrlStr);
                if (!existing || rank < existing.bestRank) {
                    bestAppearance.set(normalizedUrlStr, { result: item, bestRank: rank });
                }
            }
        }
        let maxScore = 0;
        for (const score of rrfScores.values()) {
            if (score > maxScore) {
                maxScore = score;
            }
        }
        const merged = [];
        for (const [normalizedUrlStr, score] of rrfScores.entries()) {
            const appearance = bestAppearance.get(normalizedUrlStr);
            merged.push({
                ...appearance.result,
                // Scale into (0, 1] so callers can compare scores across merges.
                relevance_score: maxScore > 0 ? score / maxScore : 0,
            });
        }
        merged.sort((a, b) => b.relevance_score - a.relevance_score);
        return merged;
    }
    catch (err) {
        log.error('mergeWithRRF failed', { error: String(err) });
        return [];
    }
}
|
|
157
|
+
//# sourceMappingURL=multi-query.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"multi-query.js","sourceRoot":"","sources":["../../src/search/multi-query.ts"],"names":[],"mappings":"AAEA,OAAO,EAAE,YAAY,EAAE,MAAM,mBAAmB,CAAC;AACjD,OAAO,EAAE,SAAS,EAAE,MAAM,cAAc,CAAC;AACzC,OAAO,EAAE,YAAY,EAAE,MAAM,cAAc,CAAC;AAE5C,MAAM,GAAG,GAAG,YAAY,CAAC,QAAQ,CAAC,CAAC;AAEnC,MAAM,KAAK,GAAG,EAAE,CAAC;AAEjB,MAAM,UAAU,gBAAgB,CAAC,OAAiB;IAChD,IAAI,CAAC;QACH,MAAM,MAAM,GAAG,SAAS,EAAE,CAAC;QAC3B,MAAM,IAAI,GAAG,IAAI,GAAG,EAAU,CAAC;QAC/B,MAAM,UAAU,GAAa,EAAE,CAAC;QAEhC,KAAK,MAAM,GAAG,IAAI,OAAO,EAAE,CAAC;YAC1B,MAAM,CAAC,GAAG,GAAG,CAAC,WAAW,EAAE,CAAC,IAAI,EAAE,CAAC,OAAO,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;YACxD,IAAI,CAAC,CAAC,MAAM,KAAK,CAAC;gBAAE,SAAS;YAC7B,IAAI,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC;gBAAE,SAAS;YAC1B,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;YACZ,UAAU,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC;QACrB,CAAC;QAED,IAAI,UAAU,CAAC,MAAM,GAAG,MAAM,CAAC,aAAa,EAAE,CAAC;YAC7C,GAAG,CAAC,IAAI,CAAC,2CAA2C,EAAE;gBACpD,QAAQ,EAAE,UAAU,CAAC,MAAM;gBAC3B,GAAG,EAAE,MAAM,CAAC,aAAa;aAC1B,CAAC,CAAC;YACH,OAAO,UAAU,CAAC,KAAK,CAAC,CAAC,EAAE,MAAM,CAAC,aAAa,CAAC,CAAC;QACnD,CAAC;QAED,OAAO,UAAU,CAAC;IACpB,CAAC;IAAC,OAAO,GAAG,EAAE,CAAC;QACb,GAAG,CAAC,KAAK,CAAC,yBAAyB,EAAE,EAAE,KAAK,EAAE,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;QAC7D,OAAO,EAAE,CAAC;IACZ,CAAC;AACH,CAAC;AAmBD,MAAM,CAAC,KAAK,UAAU,YAAY,CAChC,OAAiB,EACjB,OAAuB,EACvB,OAAsB;IAEtB,MAAM,UAAU,GAAsB,EAAE,CAAC;IACzC,MAAM,WAAW,GAAG,IAAI,GAAG,EAAU,CAAC;IACtC,MAAM,MAAM,GAAa,EAAE,CAAC;IAE5B,IAAI,OAAO,CAAC,MAAM,KAAK,CAAC,IAAI,OAAO,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;QACjD,OAAO,EAAE,OAAO,EAAE,EAAE,EAAE,WAAW,EAAE,EAAE,EAAE,MAAM,EAAE,EAAE,EAAE,CAAC;IACtD,CAAC;IAED,IAAI,CAAC;QACH,MAAM,MAAM,GAAG,SAAS,EAAE,CAAC;QAC3B,MAAM,WAAW,GAAG,MAAM,CAAC,qBAAqB,CAAC;QAEjD,MAAM,kBAAkB,GAAG,CAAC,CAAC,CAAC,OAAO,CAAC,cAAc,EAAE,MAAM,IAAI,OAAO,CAAC,cAAc,EAAE,MAAM,CAAC,CAAC;QAChG,MAAM,eAAe,GAAG,kBAAkB,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;QAEnD,MAAM,aAAa,GAAwB;YACzC,UAAU,EAAE,OAAO,CAAC,UAAU,GAAG,eAAe;YAChD,SAAS,EAAE,OAAO,CAAC,SAAS;YAC5B,QAAQ,EAAE,OAAO,CAAC,QAAQ;YAC1B,cAAc,EAAE,OAAO,CAAC,
cAAc;YACtC,cAAc,EAAE,OAAO,CAAC,cAAc;YACtC,QAAQ,EAAE,OAAO,CAAC,QAAQ;YAC1B,MAAM,EAAE,OAAO,CAAC,MAAM;YACtB,QAAQ,EAAE,OAAO,CAAC,QAAQ;SAC3B,CAAC;QAEF,MAAM,KAAK,GAAmD,EAAE,CAAC;QACjE,KAAK,MAAM,MAAM,IAAI,OAAO,EAAE,CAAC;YAC7B,KAAK,MAAM,KAAK,IAAI,OAAO,EAAE,CAAC;gBAC5B,KAAK,CAAC,IAAI,CAAC,EAAE,MAAM,EAAE,KAAK,EAAE,CAAC,CAAC;YAChC,CAAC;QACH,CAAC;QAED,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,KAAK,CAAC,MAAM,EAAE,CAAC,IAAI,WAAW,EAAE,CAAC;YACnD,MAAM,KAAK,GAAG,KAAK,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,GAAG,WAAW,CAAC,CAAC;YAC9C,MAAM,QAAQ,GAAG,KAAK,CAAC,GAAG,CAAC,KAAK,EAAE,EAAE,MAAM,EAAE,KAAK,EAAE,EAAE,EAAE;gBACrD,IAAI,CAAC;oBACH,MAAM,OAAO,GAAG,MAAM,MAAM,CAAC,MAAM,CAAC,KAAK,EAAE,aAAa,CAAC,CAAC;oBAC1D,KAAK,MAAM,CAAC,IAAI,OAAO,EAAE,CAAC;wBACxB,UAAU,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC;wBACnB,WAAW,CAAC,GAAG,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC;oBAC/B,CAAC;gBACH,CAAC;gBAAC,OAAO,GAAG,EAAE,CAAC;oBACb,MAAM,GAAG,GAAG,GAAG,YAAY,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,GAAG,CAAC,CAAC;oBAC7D,GAAG,CAAC,IAAI,CAAC,kCAAkC,EAAE;wBAC3C,MAAM,EAAE,MAAM,CAAC,IAAI;wBACnB,KAAK;wBACL,KAAK,EAAE,GAAG;qBACX,CAAC,CAAC;oBACH,MAAM,CAAC,IAAI,CAAC,GAAG,MAAM,CAAC,IAAI,IAAI,KAAK,MAAM,GAAG,EAAE,CAAC,CAAC;gBAClD,CAAC;YACH,CAAC,CAAC,CAAC;YAEH,MAAM,OAAO,CAAC,UAAU,CAAC,QAAQ,CAAC,CAAC;QACrC,CAAC;QAED,OAAO;YACL,OAAO,EAAE,UAAU;YACnB,WAAW,EAAE,CAAC,GAAG,WAAW,CAAC;YAC7B,MAAM;SACP,CAAC;IACJ,CAAC;IAAC,OAAO,GAAG,EAAE,CAAC;QACb,GAAG,CAAC,KAAK,CAAC,qBAAqB,EAAE,EAAE,KAAK,EAAE,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;QACzD,OAAO;YACL,OAAO,EAAE,UAAU;YACnB,WAAW,EAAE,CAAC,GAAG,WAAW,CAAC;YAC7B,MAAM,EAAE,CAAC,GAAG,MAAM,EAAE,iBAAiB,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC;SACpD,CAAC;IACJ,CAAC;AACH,CAAC;AAED,MAAM,UAAU,gBAAgB,CAAC,OAAiB;IAChD,IAAI,CAAC;QACH,OAAO,OAAO,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC,CAAC,MAAM,CAAC,OAAO,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;IAC/D,CAAC;IAAC,OAAO,GAAG,EAAE,CAAC;QACb,GAAG,CAAC,KAAK,CAAC,yBAAyB,EAAE,EAAE,KAAK,EAAE,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;QAC7D,OAAO,EAAE,CAAC;IACZ,CAAC;AACH,CAAC;AAED,MAAM,UAAU,YAAY,C
AAC,WAAmC;IAC9D,IAAI,CAAC;QACH,IAAI,WAAW,CAAC,MAAM,KAAK,CAAC;YAAE,OAAO,EAAE,CAAC;QAExC,MAAM,QAAQ,GAAG,WAAW,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC;QACvD,IAAI,QAAQ,CAAC,MAAM,KAAK,CAAC;YAAE,OAAO,EAAE,CAAC;QAErC,MAAM,SAAS,GAAG,IAAI,GAAG,EAAkB,CAAC;QAC5C,MAAM,cAAc,GAAG,IAAI,GAAG,EAA4D,CAAC;QAE3F,KAAK,MAAM,IAAI,IAAI,QAAQ,EAAE,CAAC;YAC5B,KAAK,IAAI,IAAI,GAAG,CAAC,EAAE,IAAI,GAAG,IAAI,CAAC,MAAM,EAAE,IAAI,EAAE,EAAE,CAAC;gBAC9C,MAAM,IAAI,GAAG,IAAI,CAAC,IAAI,CAAC,CAAC;gBACxB,IAAI,gBAAwB,CAAC;gBAC7B,IAAI,CAAC;oBACH,gBAAgB,GAAG,YAAY,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;gBAC5C,CAAC;gBAAC,MAAM,CAAC;oBACP,gBAAgB,GAAG,IAAI,CAAC,GAAG,CAAC;gBAC9B,CAAC;gBAED,MAAM,eAAe,GAAG,CAAC,GAAG,CAAC,KAAK,GAAG,IAAI,GAAG,CAAC,CAAC,CAAC;gBAC/C,MAAM,OAAO,GAAG,SAAS,CAAC,GAAG,CAAC,gBAAgB,CAAC,IAAI,CAAC,CAAC;gBACrD,SAAS,CAAC,GAAG,CAAC,gBAAgB,EAAE,OAAO,GAAG,eAAe,CAAC,CAAC;gBAE3D,MAAM,QAAQ,GAAG,cAAc,CAAC,GAAG,CAAC,gBAAgB,CAAC,CAAC;gBACtD,IAAI,CAAC,QAAQ,IAAI,IAAI,GAAG,QAAQ,CAAC,QAAQ,EAAE,CAAC;oBAC1C,cAAc,CAAC,GAAG,CAAC,gBAAgB,EAAE,EAAE,MAAM,EAAE,IAAI,EAAE,QAAQ,EAAE,IAAI,EAAE,CAAC,CAAC;gBACzE,CAAC;YACH,CAAC;QACH,CAAC;QAED,IAAI,QAAQ,GAAG,CAAC,CAAC;QACjB,KAAK,MAAM,KAAK,IAAI,SAAS,CAAC,MAAM,EAAE,EAAE,CAAC;YACvC,IAAI,KAAK,GAAG,QAAQ;gBAAE,QAAQ,GAAG,KAAK,CAAC;QACzC,CAAC;QAED,MAAM,MAAM,GAAyB,EAAE,CAAC;QACxC,KAAK,MAAM,CAAC,gBAAgB,EAAE,KAAK,CAAC,IAAI,SAAS,CAAC,OAAO,EAAE,EAAE,CAAC;YAC5D,MAAM,UAAU,GAAG,cAAc,CAAC,GAAG,CAAC,gBAAgB,CAAE,CAAC;YACzD,MAAM,CAAC,IAAI,CAAC;gBACV,GAAG,UAAU,CAAC,MAAM;gBACpB,eAAe,EAAE,QAAQ,GAAG,CAAC,CAAC,CAAC,CAAC,KAAK,GAAG,QAAQ,CAAC,CAAC,CAAC,CAAC;aACrD,CAAC,CAAC;QACL,CAAC;QAED,MAAM,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,eAAe,GAAG,CAAC,CAAC,eAAe,CAAC,CAAC;QAC7D,OAAO,MAAM,CAAC;IAChB,CAAC;IAAC,OAAO,GAAG,EAAE,CAAC;QACb,GAAG,CAAC,KAAK,CAAC,qBAAqB,EAAE,EAAE,KAAK,EAAE,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;QACzD,OAAO,EAAE,CAAC;IACZ,CAAC;AACH,CAAC"}
|
|
@@ -0,0 +1,17 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Reciprocal Rank Fusion -- merges multiple ranked lists into a single
|
|
3
|
+
* score map. Each list maps URL -> rank (1-based). The fused score for
|
|
4
|
+
* a URL is the sum of 1/(k + rank) across all lists it appears in.
|
|
5
|
+
*
* @param lists One URL -> rank map per ranked list.
* @param k Constant added to every rank before taking the reciprocal; defaults to 60.
* @returns URL -> fused score. An empty map is returned if fusion throws.
*/
|
|
6
|
+
export declare function reciprocalRankFusion(lists: Map<string, number>[], k?: number): Map<string, number>;
|
|
7
|
+
/**
|
|
8
|
+
* Convert a fused score map into a sorted array of [url, score] pairs,
|
|
9
|
+
* descending by score.
|
|
10
|
+
*
* The input map is not modified; a new array is returned.
*/
|
|
11
|
+
export declare function sortByRRFScore(scores: Map<string, number>): Array<[string, number]>;
|
|
12
|
+
/**
|
|
13
|
+
* Build a rank map from an ordered array of URLs.
|
|
14
|
+
* First URL gets rank 1, second gets rank 2, etc.
|
|
15
|
+
*
* A URL that repeats keeps the rank of its first occurrence. Ranks are
* array positions, so later URLs are not renumbered to close the gap.
*/
|
|
16
|
+
export declare function buildRankMap(urls: string[]): Map<string, number>;
|
|
17
|
+
//# sourceMappingURL=rrf.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"rrf.d.ts","sourceRoot":"","sources":["../../src/search/rrf.ts"],"names":[],"mappings":"AAIA;;;;GAIG;AACH,wBAAgB,oBAAoB,CAClC,KAAK,EAAE,GAAG,CAAC,MAAM,EAAE,MAAM,CAAC,EAAE,EAC5B,CAAC,GAAE,MAAW,GACb,GAAG,CAAC,MAAM,EAAE,MAAM,CAAC,CAqBrB;AAED;;;GAGG;AACH,wBAAgB,cAAc,CAC5B,MAAM,EAAE,GAAG,CAAC,MAAM,EAAE,MAAM,CAAC,GAC1B,KAAK,CAAC,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC,CAEzB;AAED;;;GAGG;AACH,wBAAgB,YAAY,CAAC,IAAI,EAAE,MAAM,EAAE,GAAG,GAAG,CAAC,MAAM,EAAE,MAAM,CAAC,CAQhE"}
|
|
@@ -0,0 +1,48 @@
|
|
|
1
|
+
import { createLogger } from '../logger.js';
|
|
2
|
+
// Logger used by reciprocalRankFusion below, created under the 'search' name.
const log = createLogger('search');
|
|
3
|
+
/**
 * Reciprocal Rank Fusion over any number of ranked lists.
 *
 * Every input list is a map of URL -> rank (1-based). A URL's fused score is
 * the sum, over the lists that contain it, of `1 / (k + rank)`.
 *
 * @param lists One URL -> rank map per ranked list.
 * @param k Constant added to each rank before taking the reciprocal (default 60).
 * @returns URL -> fused score; an empty map if fusion throws (the error is logged).
 */
export function reciprocalRankFusion(lists, k = 60) {
    try {
        const fused = new Map();
        for (const ranking of lists) {
            for (const [url, rank] of ranking) {
                const soFar = fused.get(url) ?? 0;
                fused.set(url, soFar + 1 / (k + rank));
            }
        }
        const summary = {
            inputLists: lists.length,
            uniqueUrls: fused.size,
        };
        log.debug('RRF fusion complete', summary);
        return fused;
    }
    catch (err) {
        log.error('RRF fusion failed', { error: String(err) });
        return new Map();
    }
}
|
|
28
|
+
/**
 * Turn a URL -> score map into `[url, score]` pairs ordered from the highest
 * score to the lowest. The map itself is left untouched.
 */
export function sortByRRFScore(scores) {
    const pairs = Array.from(scores.entries());
    pairs.sort(([, left], [, right]) => right - left);
    return pairs;
}
|
|
35
|
+
/**
 * Map each URL in an ordered list to its 1-based position.
 * When a URL occurs more than once, the position of its first occurrence wins.
 */
export function buildRankMap(urls) {
    const ranks = new Map();
    let position = 0;
    for (const url of urls) {
        position += 1;
        if (ranks.has(url)) {
            continue;
        }
        ranks.set(url, position);
    }
    return ranks;
}
|
|
48
|
+
//# sourceMappingURL=rrf.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"rrf.js","sourceRoot":"","sources":["../../src/search/rrf.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,YAAY,EAAE,MAAM,cAAc,CAAC;AAE5C,MAAM,GAAG,GAAG,YAAY,CAAC,QAAQ,CAAC,CAAC;AAEnC;;;;GAIG;AACH,MAAM,UAAU,oBAAoB,CAClC,KAA4B,EAC5B,IAAY,EAAE;IAEd,IAAI,CAAC;QACH,MAAM,MAAM,GAAG,IAAI,GAAG,EAAkB,CAAC;QAEzC,KAAK,MAAM,IAAI,IAAI,KAAK,EAAE,CAAC;YACzB,KAAK,MAAM,CAAC,GAAG,EAAE,IAAI,CAAC,IAAI,IAAI,EAAE,CAAC;gBAC/B,MAAM,YAAY,GAAG,CAAC,GAAG,CAAC,CAAC,GAAG,IAAI,CAAC,CAAC;gBACpC,MAAM,CAAC,GAAG,CAAC,GAAG,EAAE,CAAC,MAAM,CAAC,GAAG,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC,GAAG,YAAY,CAAC,CAAC;YACzD,CAAC;QACH,CAAC;QAED,GAAG,CAAC,KAAK,CAAC,qBAAqB,EAAE;YAC/B,UAAU,EAAE,KAAK,CAAC,MAAM;YACxB,UAAU,EAAE,MAAM,CAAC,IAAI;SACxB,CAAC,CAAC;QAEH,OAAO,MAAM,CAAC;IAChB,CAAC;IAAC,OAAO,GAAG,EAAE,CAAC;QACb,GAAG,CAAC,KAAK,CAAC,mBAAmB,EAAE,EAAE,KAAK,EAAE,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;QACvD,OAAO,IAAI,GAAG,EAAE,CAAC;IACnB,CAAC;AACH,CAAC;AAED;;;GAGG;AACH,MAAM,UAAU,cAAc,CAC5B,MAA2B;IAE3B,OAAO,CAAC,GAAG,MAAM,CAAC,OAAO,EAAE,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;AAC3D,CAAC;AAED;;;GAGG;AACH,MAAM,UAAU,YAAY,CAAC,IAAc;IACzC,MAAM,OAAO,GAAG,IAAI,GAAG,EAAkB,CAAC;IAC1C,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,IAAI,CAAC,MAAM,EAAE,CAAC,EAAE,EAAE,CAAC;QACrC,IAAI,CAAC,OAAO,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC;YAC1B,OAAO,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,GAAG,CAAC,CAAC,CAAC;QAC9B,CAAC;IACH,CAAC;IACD,OAAO,OAAO,CAAC;AACjB,CAAC"}
|
|
@@ -0,0 +1,25 @@
|
|
|
1
|
+
/**
 * One conversation turn in the `messages` array passed to
 * `SamplingCapableServer.createMessage`.
 * NOTE(review): looks like the MCP sampling message shape restricted to text
 * content -- confirm against the SDK types.
 */
export interface SamplingMessage {
|
|
2
|
+
role: 'user' | 'assistant';
|
|
3
|
+
content: {
|
|
4
|
+
type: 'text';
|
|
5
|
+
text: string;
|
|
6
|
+
};
|
|
7
|
+
}
|
|
8
|
+
/**
 * Value that `SamplingCapableServer.createMessage` and `requestSampling`
 * resolve to.
 */
export interface SamplingResponse {
|
|
9
|
+
model: string;
|
|
10
|
+
content: {
|
|
11
|
+
// Plain `string` here, unlike the literal 'text' on SamplingMessage.
type: string;
|
|
12
|
+
text: string;
|
|
13
|
+
};
|
|
14
|
+
}
|
|
15
|
+
/**
 * The part of a server object that `checkSamplingSupport` and
 * `requestSampling` accept: a capability lookup and a message-creation call.
 */
export interface SamplingCapableServer {
|
|
16
|
+
/** May return `null` or `undefined` instead of a capabilities record. */
getClientCapabilities: () => Record<string, unknown> | null | undefined;
|
|
17
|
+
createMessage: (params: {
|
|
18
|
+
messages: SamplingMessage[];
|
|
19
|
+
maxTokens: number;
|
|
20
|
+
}) => Promise<SamplingResponse>;
|
|
21
|
+
}
|
|
22
|
+
/**
 * Reports whether `server` can be used for sampling.
 * NOTE(review): presumably inspects `server.getClientCapabilities()` for a
 * sampling capability -- the implementation is not visible here; confirm.
 */
export declare function checkSamplingSupport(server: SamplingCapableServer): boolean;
|
|
23
|
+
/**
 * Requests a completion for `messages` through `server`, limited to `maxTokens`.
 * NOTE(review): presumably forwards to `server.createMessage`; whether it
 * rejects when sampling is unsupported is not visible here -- confirm.
 */
export declare function requestSampling(server: SamplingCapableServer, messages: SamplingMessage[], maxTokens: number): Promise<SamplingResponse>;
|
|
24
|
+
/**
 * Extracts the text from a sampling response. The parameter is `unknown`,
 * so callers may pass a response without validating its shape first.
 * NOTE(review): the value returned for a response that carries no text is
 * not visible here -- confirm against the implementation.
 */
export declare function extractTextFromSamplingResponse(response: unknown): string;
|
|
25
|
+
//# sourceMappingURL=sampling.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"sampling.d.ts","sourceRoot":"","sources":["../../src/search/sampling.ts"],"names":[],"mappings":"AAIA,MAAM,WAAW,eAAe;IAC9B,IAAI,EAAE,MAAM,GAAG,WAAW,CAAC;IAC3B,OAAO,EAAE;QAAE,IAAI,EAAE,MAAM,CAAC;QAAC,IAAI,EAAE,MAAM,CAAA;KAAE,CAAC;CACzC;AAED,MAAM,WAAW,gBAAgB;IAC/B,KAAK,EAAE,MAAM,CAAC;IACd,OAAO,EAAE;QAAE,IAAI,EAAE,MAAM,CAAC;QAAC,IAAI,EAAE,MAAM,CAAA;KAAE,CAAC;CACzC;AAED,MAAM,WAAW,qBAAqB;IACpC,qBAAqB,EAAE,MAAM,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI,GAAG,SAAS,CAAC;IACxE,aAAa,EAAE,CAAC,MAAM,EAAE;QACtB,QAAQ,EAAE,eAAe,EAAE,CAAC;QAC5B,SAAS,EAAE,MAAM,CAAC;KACnB,KAAK,OAAO,CAAC,gBAAgB,CAAC,CAAC;CACjC;AAED,wBAAgB,oBAAoB,CAAC,MAAM,EAAE,qBAAqB,GAAG,OAAO,CAS3E;AAED,wBAAsB,eAAe,CACnC,MAAM,EAAE,qBAAqB,EAC7B,QAAQ,EAAE,eAAe,EAAE,EAC3B,SAAS,EAAE,MAAM,GAChB,OAAO,CAAC,gBAAgB,CAAC,CAsB3B;AAED,wBAAgB,+BAA+B,CAC7C,QAAQ,EAAE,OAAO,GAChB,MAAM,CAiBR"}
|