npm - @rkarim08/sia - Versions diffs - 1.0.0 - Mend

@rkarim08/sia 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (355) hide show

package/.claude-plugin/marketplace.json +35 -0
package/.claude-plugin/plugin.json +27 -0
package/.mcp.json +13 -0
package/CLAUDE.md +226 -0
package/LICENSE +202 -0
package/PLUGIN_README.md +253 -0
package/README.md +1013 -0
package/agents/sia-changelog-writer.md +89 -0
package/agents/sia-code-reviewer.md +86 -0
package/agents/sia-conflict-resolver.md +100 -0
package/agents/sia-convention-enforcer.md +69 -0
package/agents/sia-debug.md +106 -0
package/agents/sia-decision-reviewer.md +101 -0
package/agents/sia-dependency-tracker.md +80 -0
package/agents/sia-explain.md +126 -0
package/agents/sia-feature.md +116 -0
package/agents/sia-knowledge-capture.md +117 -0
package/agents/sia-lead-architecture-advisor.md +93 -0
package/agents/sia-lead-team-health.md +107 -0
package/agents/sia-migration.md +100 -0
package/agents/sia-onboarding.md +115 -0
package/agents/sia-orientation.md +99 -0
package/agents/sia-pm-briefing.md +106 -0
package/agents/sia-pm-risk-advisor.md +82 -0
package/agents/sia-qa-analyst.md +116 -0
package/agents/sia-qa-regression-map.md +94 -0
package/agents/sia-refactor.md +115 -0
package/agents/sia-regression.md +112 -0
package/agents/sia-security-audit.md +125 -0
package/agents/sia-test-advisor.md +91 -0
package/hooks/hooks.json +98 -0
package/migrations/bridge/001_initial.sql +34 -0
package/migrations/episodic/001_initial.sql +35 -0
package/migrations/meta/001_initial.sql +68 -0
package/migrations/semantic/001_initial.sql +292 -0
package/migrations/semantic/002_ontology.sql +89 -0
package/migrations/semantic/003_freshness.sql +63 -0
package/migrations/semantic/004_v5_unified_schema.sql +194 -0
package/migrations/semantic/005_backfill_event_kinds.sql +8 -0
package/migrations/semantic/006_tree_sitter.sql +6 -0
package/migrations/semantic/007_branch_snapshots.sql +22 -0
package/package.json +110 -0
package/scripts/branch-switch.sh +13 -0
package/scripts/build-wasm-grammars.sh +81 -0
package/scripts/post-compact.sh +8 -0
package/scripts/post-tool-use.sh +10 -0
package/scripts/pre-compact.sh +8 -0
package/scripts/session-end.sh +8 -0
package/scripts/session-start.sh +8 -0
package/scripts/start-mcp.ts +45 -0
package/scripts/stop-hook.sh +8 -0
package/scripts/user-prompt-submit.sh +8 -0
package/scripts/viz-server.ts +152 -0
package/skills/sia-brainstorm/SKILL.md +156 -0
package/skills/sia-brainstorm/scripts/frame-template.html +214 -0
package/skills/sia-brainstorm/scripts/helper.js +95 -0
package/skills/sia-brainstorm/scripts/server.cjs +338 -0
package/skills/sia-brainstorm/scripts/start-server.sh +153 -0
package/skills/sia-brainstorm/scripts/stop-server.sh +55 -0
package/skills/sia-brainstorm/spec-document-reviewer-prompt.md +49 -0
package/skills/sia-brainstorm/visual-companion.md +286 -0
package/skills/sia-capture/SKILL.md +64 -0
package/skills/sia-compare/SKILL.md +33 -0
package/skills/sia-conflicts/SKILL.md +38 -0
package/skills/sia-debug-workflow/SKILL.md +120 -0
package/skills/sia-debug-workflow/root-cause-tracing.md +70 -0
package/skills/sia-debug-workflow/scripts/find-polluter.sh +64 -0
package/skills/sia-debug-workflow/temporal-investigation.md +72 -0
package/skills/sia-digest/SKILL.md +23 -0
package/skills/sia-dispatch/SKILL.md +69 -0
package/skills/sia-dispatch/agent-task-template.md +99 -0
package/skills/sia-doctor/SKILL.md +39 -0
package/skills/sia-execute/SKILL.md +70 -0
package/skills/sia-execute-plan/SKILL.md +85 -0
package/skills/sia-export-import/SKILL.md +49 -0
package/skills/sia-export-knowledge/SKILL.md +46 -0
package/skills/sia-finish/SKILL.md +100 -0
package/skills/sia-finish/pr-summary-template.md +54 -0
package/skills/sia-freshness/SKILL.md +38 -0
package/skills/sia-history/SKILL.md +42 -0
package/skills/sia-impact/SKILL.md +70 -0
package/skills/sia-index/SKILL.md +54 -0
package/skills/sia-install/SKILL.md +39 -0
package/skills/sia-lead-compliance/SKILL.md +16 -0
package/skills/sia-lead-drift-report/SKILL.md +16 -0
package/skills/sia-lead-knowledge-map/SKILL.md +16 -0
package/skills/sia-learn/SKILL.md +58 -0
package/skills/sia-plan/SKILL.md +68 -0
package/skills/sia-plan/plan-reviewer-prompt.md +63 -0
package/skills/sia-playbooks/SKILL.md +29 -0
package/skills/sia-playbooks/reference-feature.md +100 -0
package/skills/sia-playbooks/reference-flagging.md +50 -0
package/skills/sia-playbooks/reference-orientation.md +92 -0
package/skills/sia-playbooks/reference-regression.md +115 -0
package/skills/sia-playbooks/reference-review.md +64 -0
package/skills/sia-playbooks/reference-tools.md +239 -0
package/skills/sia-pm-decision-log/SKILL.md +28 -0
package/skills/sia-pm-risk-dashboard/SKILL.md +24 -0
package/skills/sia-pm-sprint-summary/SKILL.md +27 -0
package/skills/sia-prune/SKILL.md +45 -0
package/skills/sia-qa-coverage/SKILL.md +28 -0
package/skills/sia-qa-flaky/SKILL.md +20 -0
package/skills/sia-qa-report/SKILL.md +26 -0
package/skills/sia-reindex/SKILL.md +30 -0
package/skills/sia-review-respond/SKILL.md +88 -0
package/skills/sia-review-respond/pushback-patterns.md +90 -0
package/skills/sia-search/SKILL.md +47 -0
package/skills/sia-setup/SKILL.md +82 -0
package/skills/sia-setup/setup-checklist.md +97 -0
package/skills/sia-stats/SKILL.md +36 -0
package/skills/sia-status/SKILL.md +44 -0
package/skills/sia-sync/SKILL.md +46 -0
package/skills/sia-team/SKILL.md +64 -0
package/skills/sia-test/SKILL.md +92 -0
package/skills/sia-test/testing-anti-patterns.md +104 -0
package/skills/sia-tour/SKILL.md +29 -0
package/skills/sia-upgrade/SKILL.md +43 -0
package/skills/sia-verify/SKILL.md +81 -0
package/skills/sia-visualize/SKILL.md +28 -0
package/skills/sia-visualize-live/SKILL.md +55 -0
package/skills/sia-visualize-live/scripts/graph-template.html +389 -0
package/skills/sia-visualize-live/scripts/start-visualizer.sh +161 -0
package/skills/sia-visualize-live/scripts/stop-visualizer.sh +55 -0
package/skills/sia-visualize-live/scripts/visualizer-server.cjs +264 -0
package/skills/sia-workspace/SKILL.md +57 -0
package/src/agent/claude-md-template-flagging.md +219 -0
package/src/agent/claude-md-template.md +213 -0
package/src/agent/modules/sia-feature.md +100 -0
package/src/agent/modules/sia-flagging.md +50 -0
package/src/agent/modules/sia-orientation.md +92 -0
package/src/agent/modules/sia-regression.md +115 -0
package/src/agent/modules/sia-review.md +64 -0
package/src/agent/modules/sia-tools.md +239 -0
package/src/ast/extractors/c-include.ts +189 -0
package/src/ast/extractors/csharp-project.ts +260 -0
package/src/ast/extractors/prisma-schema.ts +44 -0
package/src/ast/extractors/project-manifest.ts +111 -0
package/src/ast/extractors/sql-schema.ts +67 -0
package/src/ast/extractors/tier-a.ts +423 -0
package/src/ast/extractors/tier-b.ts +289 -0
package/src/ast/extractors/tier-dispatch.ts +247 -0
package/src/ast/index-worker.ts +108 -0
package/src/ast/indexer.ts +484 -0
package/src/ast/languages.ts +408 -0
package/src/ast/pagerank-builder.ts +125 -0
package/src/ast/path-utils.ts +137 -0
package/src/ast/tree-sitter/backends/native.ts +57 -0
package/src/ast/tree-sitter/backends/wasm.ts +39 -0
package/src/ast/tree-sitter/call-walker.ts +44 -0
package/src/ast/tree-sitter/edit-computer.ts +55 -0
package/src/ast/tree-sitter/query-runner.ts +46 -0
package/src/ast/tree-sitter/service.ts +174 -0
package/src/ast/tree-sitter/tree-cache.ts +39 -0
package/src/ast/tree-sitter/types.ts +79 -0
package/src/ast/watcher.ts +322 -0
package/src/capture/chunker.ts +169 -0
package/src/capture/consolidate.ts +127 -0
package/src/capture/edge-inferrer.ts +161 -0
package/src/capture/embedder.ts +166 -0
package/src/capture/embedding-cache.ts +73 -0
package/src/capture/flag-processor.ts +64 -0
package/src/capture/hook.ts +67 -0
package/src/capture/pipeline.ts +450 -0
package/src/capture/prompts/consolidate.ts +25 -0
package/src/capture/prompts/edge-infer.ts +29 -0
package/src/capture/prompts/extract-flagged.ts +36 -0
package/src/capture/prompts/extract.ts +42 -0
package/src/capture/tokenizer.ts +147 -0
package/src/capture/track-a-ast.ts +93 -0
package/src/capture/track-b-llm.ts +149 -0
package/src/capture/types.ts +64 -0
package/src/cli/commands/community.ts +137 -0
package/src/cli/commands/compare.ts +123 -0
package/src/cli/commands/conflicts.ts +41 -0
package/src/cli/commands/digest.ts +197 -0
package/src/cli/commands/disable-flagging.ts +34 -0
package/src/cli/commands/doctor.ts +240 -0
package/src/cli/commands/download-model.ts +161 -0
package/src/cli/commands/enable-flagging.ts +34 -0
package/src/cli/commands/export-knowledge.ts +208 -0
package/src/cli/commands/export.ts +85 -0
package/src/cli/commands/freshness.ts +164 -0
package/src/cli/commands/graph.ts +51 -0
package/src/cli/commands/history.ts +139 -0
package/src/cli/commands/import.ts +335 -0
package/src/cli/commands/install.ts +156 -0
package/src/cli/commands/lead-report.ts +241 -0
package/src/cli/commands/learn.ts +321 -0
package/src/cli/commands/pm-report.ts +413 -0
package/src/cli/commands/prune.ts +75 -0
package/src/cli/commands/qa-report.ts +278 -0
package/src/cli/commands/reindex.ts +104 -0
package/src/cli/commands/rollback.ts +70 -0
package/src/cli/commands/search.ts +103 -0
package/src/cli/commands/server.ts +91 -0
package/src/cli/commands/share.ts +33 -0
package/src/cli/commands/stats.ts +79 -0
package/src/cli/commands/status.ts +176 -0
package/src/cli/commands/sync.ts +96 -0
package/src/cli/commands/team.ts +118 -0
package/src/cli/commands/tour.ts +157 -0
package/src/cli/commands/visualize-live.ts +162 -0
package/src/cli/commands/workspace.ts +117 -0
package/src/cli/index.ts +424 -0
package/src/cli/learn-progress.ts +87 -0
package/src/community/detection-bridge.ts +344 -0
package/src/community/leiden.ts +462 -0
package/src/community/raptor.ts +210 -0
package/src/community/scheduler.ts +74 -0
package/src/community/summarize.ts +115 -0
package/src/decay/archiver.ts +73 -0
package/src/decay/bridge-orphan-cleanup.ts +212 -0
package/src/decay/consolidation-sweep.ts +112 -0
package/src/decay/decay.ts +116 -0
package/src/decay/deep-validator.ts +62 -0
package/src/decay/episodic-promoter.ts +132 -0
package/src/decay/maintenance-scheduler.ts +326 -0
package/src/decay/scheduler.ts +6 -0
package/src/decay/session-sweeper.ts +79 -0
package/src/decay/types.ts +17 -0
package/src/freshness/confidence-decay.ts +122 -0
package/src/freshness/cuckoo-filter.ts +176 -0
package/src/freshness/deep-validation.ts +345 -0
package/src/freshness/dirty-tracker.ts +237 -0
package/src/freshness/file-watcher-layer.ts +119 -0
package/src/freshness/firewall.ts +64 -0
package/src/freshness/git-reconcile-layer.ts +161 -0
package/src/freshness/inverted-index.ts +158 -0
package/src/freshness/stale-read-layer.ts +222 -0
package/src/graph/audit.ts +69 -0
package/src/graph/bridge-db.ts +141 -0
package/src/graph/communities.ts +195 -0
package/src/graph/db-interface.ts +259 -0
package/src/graph/edges.ts +163 -0
package/src/graph/entities.ts +327 -0
package/src/graph/episodic-db.ts +113 -0
package/src/graph/flags.ts +31 -0
package/src/graph/meta-db.ts +200 -0
package/src/graph/semantic-db.ts +101 -0
package/src/graph/session-resume.ts +56 -0
package/src/graph/snapshots.ts +342 -0
package/src/graph/staging.ts +151 -0
package/src/graph/types.ts +128 -0
package/src/hooks/adapters/claude-code.ts +21 -0
package/src/hooks/adapters/cline.ts +43 -0
package/src/hooks/adapters/cursor.ts +65 -0
package/src/hooks/adapters/generic.ts +12 -0
package/src/hooks/agent-detect.ts +34 -0
package/src/hooks/claude-md-directives.ts +32 -0
package/src/hooks/event-router.ts +182 -0
package/src/hooks/extractors/pattern-detector.ts +111 -0
package/src/hooks/handlers/post-compact.ts +30 -0
package/src/hooks/handlers/post-tool-use.ts +403 -0
package/src/hooks/handlers/pre-compact.ts +100 -0
package/src/hooks/handlers/session-end.ts +47 -0
package/src/hooks/handlers/session-start.ts +154 -0
package/src/hooks/handlers/stop.ts +128 -0
package/src/hooks/handlers/user-prompt-submit.ts +68 -0
package/src/hooks/plugin-branch-switch.ts +68 -0
package/src/hooks/plugin-common.ts +47 -0
package/src/hooks/plugin-post-compact.ts +28 -0
package/src/hooks/plugin-post-tool-use.ts +38 -0
package/src/hooks/plugin-pre-compact.ts +37 -0
package/src/hooks/plugin-session-end.ts +37 -0
package/src/hooks/plugin-session-start.ts +75 -0
package/src/hooks/plugin-stop.ts +61 -0
package/src/hooks/plugin-user-prompt-submit.ts +47 -0
package/src/hooks/types.ts +43 -0
package/src/knowledge/discovery.ts +238 -0
package/src/knowledge/external-refs.ts +98 -0
package/src/knowledge/freshness.ts +221 -0
package/src/knowledge/ingest.ts +330 -0
package/src/knowledge/markdown-export.ts +229 -0
package/src/knowledge/markdown-import.ts +359 -0
package/src/knowledge/patterns.ts +74 -0
package/src/knowledge/templates.ts +307 -0
package/src/llm/ai-sdk-adapter.ts +46 -0
package/src/llm/config.ts +88 -0
package/src/llm/cost-tracker.ts +110 -0
package/src/llm/prompts/extraction.ts +55 -0
package/src/llm/prompts/summarization.ts +36 -0
package/src/llm/prompts/validation.ts +37 -0
package/src/llm/provider-registry.ts +68 -0
package/src/llm/reliability.ts +179 -0
package/src/llm/schemas.ts +52 -0
package/src/mcp/freshness-annotator.ts +69 -0
package/src/mcp/server.ts +949 -0
package/src/mcp/tools/sia-ast-query.ts +225 -0
package/src/mcp/tools/sia-at-time.ts +151 -0
package/src/mcp/tools/sia-backlinks.ts +87 -0
package/src/mcp/tools/sia-batch-execute.ts +169 -0
package/src/mcp/tools/sia-by-file.ts +89 -0
package/src/mcp/tools/sia-community.ts +113 -0
package/src/mcp/tools/sia-doctor.ts +73 -0
package/src/mcp/tools/sia-execute-file.ts +122 -0
package/src/mcp/tools/sia-execute.ts +104 -0
package/src/mcp/tools/sia-expand.ts +158 -0
package/src/mcp/tools/sia-fetch-and-index.ts +241 -0
package/src/mcp/tools/sia-flag.ts +65 -0
package/src/mcp/tools/sia-index.ts +111 -0
package/src/mcp/tools/sia-note.ts +134 -0
package/src/mcp/tools/sia-search.ts +105 -0
package/src/mcp/tools/sia-stats.ts +63 -0
package/src/mcp/tools/sia-sync-status.ts +44 -0
package/src/mcp/tools/sia-upgrade.ts +247 -0
package/src/mcp/truncate.ts +231 -0
package/src/native/bridge.ts +167 -0
package/src/native/fallback-ast-diff.ts +144 -0
package/src/native/fallback-graph.ts +325 -0
package/src/ontology/constraints.ts +56 -0
package/src/ontology/errors.ts +8 -0
package/src/ontology/middleware.ts +266 -0
package/src/retrieval/bm25-search.ts +151 -0
package/src/retrieval/context-assembly.ts +76 -0
package/src/retrieval/graph-traversal.ts +168 -0
package/src/retrieval/pagerank.ts +40 -0
package/src/retrieval/query-classifier.ts +106 -0
package/src/retrieval/reranker.ts +156 -0
package/src/retrieval/search.ts +236 -0
package/src/retrieval/throttle.ts +102 -0
package/src/retrieval/vector-search.ts +203 -0
package/src/retrieval/workspace-search.ts +130 -0
package/src/sandbox/context-mode.ts +285 -0
package/src/sandbox/credential-pass.ts +55 -0
package/src/sandbox/executor.ts +235 -0
package/src/security/pattern-detector.ts +127 -0
package/src/security/rule-of-two.ts +50 -0
package/src/security/sanitize.ts +46 -0
package/src/security/semantic-consistency.ts +93 -0
package/src/security/staging-promoter.ts +154 -0
package/src/shared/config.ts +302 -0
package/src/shared/diagnostics.ts +210 -0
package/src/shared/errors.ts +48 -0
package/src/shared/git-utils.ts +143 -0
package/src/shared/llm-client.ts +120 -0
package/src/shared/logger.ts +99 -0
package/src/shared/types.ts +79 -0
package/src/sync/client.ts +43 -0
package/src/sync/conflict.ts +106 -0
package/src/sync/dedup.ts +183 -0
package/src/sync/hlc.ts +117 -0
package/src/sync/keychain.ts +144 -0
package/src/sync/pull.ts +232 -0
package/src/sync/push.ts +131 -0
package/src/types/chokidar.d.ts +23 -0
package/src/visualization/graph-renderer.ts +312 -0
package/src/visualization/subgraph-extract.ts +208 -0
package/src/visualization/views/community-clusters.ts +246 -0
package/src/visualization/views/dependency-map.ts +189 -0
package/src/visualization/views/graph-explorer.ts +364 -0
package/src/visualization/views/timeline.ts +247 -0
package/src/workspace/api-contracts.ts +226 -0
package/src/workspace/cross-repo.ts +61 -0
package/src/workspace/detector.ts +190 -0
package/src/workspace/manifest.ts +141 -0

package/src/retrieval/query-classifier.ts ADDED Viewed

@@ -0,0 +1,106 @@
+// Module: query-classifier — Local vs global query routing + task-type boosts
+import type { SiaDb } from "@/graph/db-interface";
+/** Retrieval route chosen for a query: "local" or "global". */
+export type QueryMode = "local" | "global";
+/** Outcome of `classifyQuery`. */
+export interface ClassificationResult {
+	/** Route selected for the query. */
+	mode: QueryMode;
+	/**
+	 * True when keyword scoring picked "global" but the active-entity count was
+	 * below the configured minimum, so the mode was forced to "local".
+	 */
+	globalUnavailable: boolean;
+}
+/**
+ * Keywords that count toward the "global" score in `classifyQuery`.
+ * Each entry is matched as a plain substring of the lower-cased query.
+ */
+const GLOBAL_KEYWORDS: string[] = [
+	"architecture",
+	"overview",
+	"explain",
+	"structure",
+	"high-level",
+	"design",
+	"modules",
+	"subsystems",
+];
+/**
+ * Keywords and phrases that count toward the "local" score in `classifyQuery`.
+ * Each entry is matched as a plain substring of the lower-cased query, so an
+ * entry such as "import" also matches inside a longer word like "important".
+ */
+const LOCAL_KEYWORDS: string[] = [
+	"function",
+	"class",
+	"method",
+	"variable",
+	"import",
+	"error",
+	"bug",
+	"fix",
+	"implement",
+	"where is",
+	"how does",
+	"what does",
+];
+/**
+ * Route a query to the local three-stage pipeline or to global community
+ * summaries.
+ *
+ * The lower-cased query is scored by counting how many global keywords and how
+ * many local keywords it contains (substring match). Global wins only on a
+ * strictly higher score; a tie resolves to local.
+ *
+ * When global wins, the number of active entities (rows in `graph_nodes` with
+ * both `t_valid_until` and `archived_at` NULL) is checked. If that count is
+ * below `config.communityMinGraphSize`, the result is forced to local with
+ * `globalUnavailable: true`. The database is not queried when local wins.
+ *
+ * @param db - Database handle used for the active-entity count.
+ * @param query - Raw user query text.
+ * @param config - Holds the minimum active-entity count required for global mode.
+ * @returns The chosen mode and whether global mode was wanted but unavailable.
+ */
+export async function classifyQuery(
+	db: SiaDb,
+	query: string,
+	config: { communityMinGraphSize: number },
+): Promise<ClassificationResult> {
+	const text = query.toLowerCase();
+	const countHits = (keywords: string[]): number =>
+		keywords.filter((keyword) => text.includes(keyword)).length;
+	const globalHits = countHits(GLOBAL_KEYWORDS);
+	const localHits = countHits(LOCAL_KEYWORDS);
+	// Ties go to local: global has to win outright.
+	if (globalHits <= localHits) {
+		return { mode: "local", globalUnavailable: false };
+	}
+	// Global was selected; make sure the graph is large enough for community summaries.
+	const { rows } = await db.execute(
+		"SELECT COUNT(*) AS cnt FROM graph_nodes WHERE t_valid_until IS NULL AND archived_at IS NULL",
+	);
+	const activeEntities = Number((rows[0] as { cnt: number }).cnt);
+	return activeEntities < config.communityMinGraphSize
+		? { mode: "local", globalUnavailable: true }
+		: { mode: "global", globalUnavailable: false };
+}
+/**
+ * Task-type boost table: maps a task type string to the set of entity types
+ * that should receive a scoring boost during reranking.
+ *
+ * The table is built on a null-prototype object so that indexing it with an
+ * arbitrary caller-supplied task type (for example "constructor" or
+ * "toString") yields `undefined` instead of a member inherited from
+ * `Object.prototype`.
+ */
+export const TASK_TYPE_BOOSTS: Record<string, Set<string>> = Object.assign(
+	Object.create(null) as Record<string, Set<string>>,
+	{
+		"bug-fix": new Set(["Bug", "Solution"]),
+		regression: new Set(["Bug", "Solution"]),
+		feature: new Set(["Concept", "Decision"]),
+		review: new Set(["Convention"]),
+	},
+);
+/**
+ * Same-package boost used during reranking.
+ *
+ * @param entityPkg - Package path recorded on the entity, or null.
+ * @param activePkg - Package path the caller is currently working in, or null.
+ * @returns 0.15 when both paths are present and strictly equal, otherwise 0.
+ */
+export function packagePathBoost(entityPkg: string | null, activePkg: string | null): number {
+	// A missing path on either side can never count as a match.
+	if (entityPkg == null || activePkg == null) {
+		return 0;
+	}
+	return entityPkg === activePkg ? 0.15 : 0;
+}

package/src/retrieval/reranker.ts ADDED Viewed

@@ -0,0 +1,156 @@
+// Module: reranker — RRF combination + trust-weighted scoring
+import type { SiaDb } from "@/graph/db-interface";
+import type { Entity } from "@/graph/entities";
+import type { SiaSearchResult } from "@/mcp/tools/sia-search";
+import { packagePathBoost, TASK_TYPE_BOOSTS } from "@/retrieval/query-classifier";
+/** A candidate with an entity ID and a score from a single retrieval signal. */
+export interface RankedCandidate {
+	/** ID of the candidate entity. */
+	entityId: string;
+	/** Score from the signal; `rrfCombine` uses it only to order candidates within one list. */
+	score: number;
+}
+/** Options for the rerank function. */
+export interface RerankOpts {
+	/** Task type for task-type boosting (e.g. "bug-fix", "feature"). */
+	taskType?: string;
+	/** Active package path for same-package boosting. */
+	packagePath?: string;
+	/** If true, exclude Tier 4 entities. */
+	paranoid?: boolean;
+	/** Maximum number of results to return; `rerank` uses 15 when omitted. */
+	limit?: number;
+	/** If true, include extraction_method in results. */
+	includeProvenance?: boolean;
+}
+/**
+ * Trust weights keyed by tier number (1-4). No index-0.
+ * `rerank` multiplies each score by the weight for the entity's tier and
+ * falls back to 0.5 for a tier that is not listed here.
+ */
+const TRUST_WEIGHTS: Record<number, number> = {
+	1: 1.0,
+	2: 0.9,
+	3: 0.7,
+	4: 0.5,
+};
+/**
+ * Fuse several ranked candidate lists with Reciprocal Rank Fusion (k = 60).
+ *
+ * Every list is ordered by score, highest first, on a copy (the caller's
+ * arrays are not reordered). A candidate at 0-based position `p` in a list
+ * contributes `1 / (60 + p + 1)`; contributions for the same entity ID are
+ * summed across all lists (and across repeated entries within a list).
+ *
+ * @param lists - Zero or more candidate lists, one per retrieval signal.
+ * @returns Map from entity ID to its fused score, in first-seen order.
+ */
+export function rrfCombine(...lists: RankedCandidate[][]): Map<string, number> {
+	const RRF_K = 60;
+	const fused = new Map<string, number>();
+	lists.forEach((list) => {
+		// Rank order is established per list, independent of the other lists.
+		const byScoreDesc = list.slice().sort((x, y) => y.score - x.score);
+		byScoreDesc.forEach(({ entityId }, position) => {
+			const contribution = 1 / (RRF_K + position + 1);
+			fused.set(entityId, (fused.get(entityId) ?? 0) + contribution);
+		});
+	});
+	return fused;
+}
+/** Batch size for fetching entities from the database. */
+const ENTITY_BATCH_SIZE = 500;
+/**
+ * Rerank entities by combining RRF scores with trust weights, importance,
+ * confidence, task-type boosts, and package-path boosts.
+ *
+ * Formula: rrf_score * importance * confidence * trust_weight[tier] * (1 + task_boost * 0.3) + package_boost
+ *
+ * Only active entities are scored: IDs whose `graph_nodes` row is missing, has
+ * `t_valid_until` set, or has `archived_at` set are dropped. With
+ * `opts.paranoid`, Tier 4 entities are dropped as well.
+ *
+ * @param db - Database handle used to load the candidate entities.
+ * @param rrfScores - Fused score per entity ID (see `rrfCombine`).
+ * @param opts - Optional boosts, filters, and result limit (default 15).
+ * @returns Up to `limit` results ordered by final score, highest first.
+ */
+export async function rerank(
+	db: SiaDb,
+	rrfScores: Map<string, number>,
+	opts?: RerankOpts,
+): Promise<SiaSearchResult[]> {
+	if (rrfScores.size === 0) {
+		return [];
+	}
+	const entityIds = Array.from(rrfScores.keys());
+	// Fetch entities in batches so a single statement never carries more than
+	// ENTITY_BATCH_SIZE bound parameters.
+	const entities = new Map<string, Entity>();
+	for (let i = 0; i < entityIds.length; i += ENTITY_BATCH_SIZE) {
+		const batch = entityIds.slice(i, i + ENTITY_BATCH_SIZE);
+		const placeholders = batch.map(() => "?").join(", ");
+		const sql = `SELECT * FROM graph_nodes WHERE id IN (${placeholders}) AND t_valid_until IS NULL AND archived_at IS NULL`;
+		const result = await db.execute(sql, batch);
+		for (const row of result.rows) {
+			entities.set(row.id as string, row as unknown as Entity);
+		}
+	}
+	// Determine task-type boosted entity types. The task type is caller-supplied,
+	// so only own keys of the boost table are honoured: a bare index lookup with
+	// a value such as "constructor" would return an inherited Object.prototype
+	// member and the later `.has()` call would throw.
+	const taskType = opts?.taskType;
+	const boostedTypes: Set<string> | undefined =
+		taskType !== undefined && Object.prototype.hasOwnProperty.call(TASK_TYPE_BOOSTS, taskType)
+			? TASK_TYPE_BOOSTS[taskType]
+			: undefined;
+	// Score and filter
+	const scored: Array<{ entity: Entity; finalScore: number }> = [];
+	for (const [entityId, rrfScore] of rrfScores) {
+		const entity = entities.get(entityId);
+		if (!entity) {
+			// Entity was invalidated, archived, or doesn't exist
+			continue;
+		}
+		// Paranoid filter: remove Tier 4
+		if (opts?.paranoid && entity.trust_tier === 4) {
+			continue;
+		}
+		// Tiers outside the weight table get the lowest weight.
+		const trustWeight = TRUST_WEIGHTS[entity.trust_tier] ?? 0.5;
+		const taskBoost = boostedTypes?.has(entity.type) ? 1 : 0;
+		const pkgBoost = packagePathBoost(entity.package_path, opts?.packagePath ?? null);
+		const finalScore =
+			rrfScore * entity.importance * entity.confidence * trustWeight * (1 + taskBoost * 0.3) +
+			pkgBoost;
+		scored.push({ entity, finalScore });
+	}
+	// Sort by finalScore DESC
+	scored.sort((a, b) => b.finalScore - a.finalScore);
+	// Apply limit
+	const limit = opts?.limit ?? 15;
+	const top = scored.slice(0, limit);
+	// Map to SiaSearchResult; the final score is used for ordering only and is
+	// not part of the returned shape.
+	return top.map(({ entity }) => {
+		const base: SiaSearchResult = {
+			id: entity.id,
+			type: entity.type,
+			name: entity.name,
+			summary: entity.summary,
+			content: entity.content,
+			trust_tier: entity.trust_tier,
+			confidence: entity.confidence,
+			importance: entity.importance,
+			tags: entity.tags,
+			file_paths: entity.file_paths,
+			conflict_group_id: entity.conflict_group_id ?? null,
+			t_valid_from: entity.t_valid_from ?? null,
+			source_repo_name: null,
+		};
+		if (opts?.includeProvenance) {
+			base.extraction_method = entity.extraction_method ?? null;
+		}
+		return base;
+	});
+}

package/src/retrieval/search.ts ADDED Viewed

@@ -0,0 +1,236 @@
+// Module: search — Three-stage pipeline orchestration
+//
+// Stage 1: Parallel BM25 + graph traversal + vector search
+// Stage 2: 1-hop neighbor expansion for candidates
+// Stage 3: RRF combination + trust-weighted reranking
+// Global queries bypass the pipeline and return community summaries.
+import type { Embedder } from "@/capture/embedder";
+import type { SiaDb } from "@/graph/db-interface";
+import type { SiaSearchResult } from "@/mcp/tools/sia-search";
+import { bm25Search } from "@/retrieval/bm25-search";
+import { graphTraversalSearch } from "@/retrieval/graph-traversal";
+import { classifyQuery } from "@/retrieval/query-classifier";
+import { type RankedCandidate, rerank, rrfCombine } from "@/retrieval/reranker";
+import { vectorSearch } from "@/retrieval/vector-search";
+/** Options accepted by hybridSearch. */
+export interface SearchOptions {
+	/** Query text; used for classification and for every retrieval signal. */
+	query: string;
+	/** Task type forwarded to the reranker for task-type boosting. */
+	taskType?: string;
+	/** When non-empty, only results whose type is in this list are returned. */
+	nodeTypes?: string[];
+	/** Active package path, forwarded to the retrieval signals and the reranker. */
+	packagePath?: string;
+	/** Paranoid flag, forwarded to the retrieval signals, neighbor expansion, and the reranker. */
+	paranoid?: boolean;
+	/** Maximum number of results; hybridSearch uses 15 when omitted. */
+	limit?: number;
+	/** If true, results carry extraction_method. */
+	includeProvenance?: boolean;
+	/** Minimum active-entity count for global mode; hybridSearch uses 100 when omitted. */
+	communityMinGraphSize?: number;
+}
+/** Result returned by hybridSearch. */
+export interface SearchResult {
+	/** Ranked entities (local mode) or community summaries (global mode). */
+	results: SiaSearchResult[];
+	/** Route that produced `results`. */
+	mode: "local" | "global";
+	/** True when global mode was selected by the classifier but the graph was too small. */
+	globalUnavailable: boolean;
+}
+/** Default minimum graph size before community summaries are available. */
+const DEFAULT_COMMUNITY_MIN_GRAPH_SIZE = 100;
+/**
+ * Three-stage hybrid retrieval pipeline.
+ *
+ * 1. Classify query as local or global.
+ * 2. If global, return community summaries from the `communities` table.
+ * 3. Stage 1: parallel BM25 + graph traversal + vector search.
+ * 4. Stage 2: expand 1-hop neighbors of the graph-traversal candidates.
+ * 5. Stage 3: RRF combine + trust-weighted rerank.
+ * 6. Filter by nodeTypes if specified, then truncate to `limit`.
+ * 7. Attach extraction_method if includeProvenance is set.
+ *
+ * The `embedder` parameter is nullable -- when null, vector search is skipped
+ * and the pipeline runs on BM25 + graph traversal only.
+ *
+ * @param db - Database handle shared by every stage.
+ * @param embedder - Embedder for vector search, or null to skip it.
+ * @param opts - Query text plus optional filters, boosts, and limits.
+ * @returns The results, the mode that produced them, and whether global mode
+ *          was wanted but unavailable.
+ */
+export async function hybridSearch(
+	db: SiaDb,
+	embedder: Embedder | null,
+	opts: SearchOptions,
+): Promise<SearchResult> {
+	const limit = opts.limit ?? 15;
+	const communityMinGraphSize = opts.communityMinGraphSize ?? DEFAULT_COMMUNITY_MIN_GRAPH_SIZE;
+	// --- Classify query ---------------------------------------------------
+	const classification = await classifyQuery(db, opts.query, {
+		communityMinGraphSize,
+	});
+	// --- Global mode: return community summaries --------------------------
+	if (classification.mode === "global") {
+		const communities = await fetchCommunitySummaries(db, limit);
+		return {
+			results: communities,
+			mode: "global",
+			globalUnavailable: false,
+		};
+	}
+	// --- Stage 1: parallel retrieval signals ------------------------------
+	const searchOpts = {
+		limit: limit * 3, // over-fetch to leave room for reranking
+		paranoid: opts.paranoid,
+		packagePath: opts.packagePath,
+	};
+	const [bm25Results, graphResults, vecResults] = await Promise.all([
+		bm25Search(db, opts.query, searchOpts),
+		graphTraversalSearch(db, opts.query, searchOpts),
+		embedder ? vectorSearch(db, opts.query, embedder, searchOpts) : Promise.resolve([]),
+	]);
+	// --- Stage 2: expand 1-hop neighbors ----------------------------------
+	const expandedGraphResults = await expandNeighbors(db, graphResults, opts.paranoid);
+	// --- Stage 3: RRF combine + rerank ------------------------------------
+	const bm25Candidates: RankedCandidate[] = bm25Results.map((r) => ({
+		entityId: r.entityId,
+		score: r.score,
+	}));
+	const graphCandidates: RankedCandidate[] = expandedGraphResults.map((r) => ({
+		entityId: r.entityId,
+		score: r.score,
+	}));
+	const vecCandidates: RankedCandidate[] = vecResults.map((r) => ({
+		entityId: r.entityId,
+		score: r.score,
+	}));
+	const rrfScores = rrfCombine(bm25Candidates, graphCandidates, vecCandidates);
+	const allowedTypes =
+		opts.nodeTypes && opts.nodeTypes.length > 0 ? new Set(opts.nodeTypes) : null;
+	// With a type filter active, rank every fused candidate and truncate only
+	// after filtering. Truncating first would let entities of other types use up
+	// the limit and leave fewer matching results than are actually available.
+	let results = await rerank(db, rrfScores, {
+		taskType: opts.taskType,
+		packagePath: opts.packagePath,
+		paranoid: opts.paranoid,
+		limit: allowedTypes ? Math.max(limit, rrfScores.size) : limit,
+		includeProvenance: opts.includeProvenance,
+	});
+	// --- Filter by nodeTypes, then apply the limit --------------------------
+	if (allowedTypes) {
+		results = results.filter((r) => allowedTypes.has(r.type)).slice(0, limit);
+	}
+	// --- Provenance --------------------------------------------------------
+	if (opts.includeProvenance) {
+		await attachProvenance(db, results);
+	}
+	return {
+		results,
+		mode: "local",
+		globalUnavailable: classification.globalUnavailable,
+	};
+}
+// ---------------------------------------------------------------------------
+// Internal helpers
+// ---------------------------------------------------------------------------
+/**
+ * Load community summaries for a global-mode query.
+ *
+ * Reads rows from `communities` whose summary is non-NULL, largest
+ * `member_count` first, capped at `limit`. Each row is reported as a
+ * "Community" result: the community ID serves as both id and name, the summary
+ * text fills both summary and content, and trust tier, confidence, and
+ * importance are fixed at 1.
+ *
+ * @param db - Database handle.
+ * @param limit - Maximum number of communities to return.
+ * @returns One search result per community row.
+ */
+async function fetchCommunitySummaries(db: SiaDb, limit: number): Promise<SiaSearchResult[]> {
+	const { rows } = await db.execute(
+		"SELECT * FROM communities WHERE summary IS NOT NULL ORDER BY member_count DESC LIMIT ?",
+		[limit],
+	);
+	const summaries: SiaSearchResult[] = [];
+	for (const row of rows as Record<string, unknown>[]) {
+		const communityId = row.id as string;
+		const text = (row.summary as string) ?? "";
+		summaries.push({
+			id: communityId,
+			type: "Community",
+			name: communityId,
+			summary: text,
+			content: text,
+			trust_tier: 1,
+			confidence: 1.0,
+			importance: 1.0,
+			tags: "[]",
+			file_paths: "[]",
+			conflict_group_id: null,
+			t_valid_from: null,
+			source_repo_name: null,
+		});
+	}
+	return summaries;
+}
+/**
+ * Stage 2: expand 1-hop neighbors for each candidate entity.
+ *
+ * For each distinct entity in the input list, query the `graph_edges` table
+ * for edges that are still valid (`t_valid_until IS NULL`) and touch the
+ * entity on either end. A neighbor that is not already in the result set is
+ * added at score 0.7, provided its `graph_nodes` row is active (and, when
+ * `paranoid` is set, has `trust_tier < 4`). Input entities keep their highest
+ * input score. Expansion is a single hop: added neighbors are not expanded.
+ *
+ * @param db - Database handle.
+ * @param results - Seed candidates with their scores.
+ * @param paranoid - When true, Tier 4 neighbors are not added.
+ * @returns Seeds followed by newly added neighbors, in discovery order.
+ */
+async function expandNeighbors(
+	db: SiaDb,
+	results: Array<{ entityId: string; score: number }>,
+	paranoid?: boolean,
+): Promise<Array<{ entityId: string; score: number }>> {
+	const scoreMap = new Map<string, number>();
+	// Seed with existing results, keeping the best score per entity
+	for (const r of results) {
+		const existing = scoreMap.get(r.entityId);
+		if (existing === undefined || r.score > existing) {
+			scoreMap.set(r.entityId, r.score);
+		}
+	}
+	// Snapshot the distinct seeds: a repeated input ID needs only one expansion,
+	// and neighbors added below must not be expanded themselves.
+	const seedIds = [...scoreMap.keys()];
+	// The validation statement does not depend on the neighbor, so build it once.
+	const paranoidClause = paranoid ? " AND trust_tier < 4" : "";
+	const neighborCheckSql = `SELECT id FROM graph_nodes WHERE id = ? AND t_valid_until IS NULL AND archived_at IS NULL${paranoidClause}`;
+	// Neighbors that already failed validation; avoids re-querying them when
+	// several seeds share the same inactive or filtered neighbor.
+	const rejected = new Set<string>();
+	for (const entityId of seedIds) {
+		const edgeResult = await db.execute(
+			"SELECT from_id, to_id FROM graph_edges WHERE (from_id = ? OR to_id = ?) AND t_valid_until IS NULL",
+			[entityId, entityId],
+		);
+		for (const row of edgeResult.rows) {
+			const fromId = row.from_id as string;
+			const toId = row.to_id as string;
+			const neighborId = fromId === entityId ? toId : fromId;
+			// Skip if already in the result set or already known to be ineligible
+			if (scoreMap.has(neighborId) || rejected.has(neighborId)) continue;
+			// Validate the neighbor is active (and paranoid-safe)
+			const check = await db.execute(neighborCheckSql, [neighborId]);
+			if (check.rows.length === 0) {
+				rejected.add(neighborId);
+				continue;
+			}
+			scoreMap.set(neighborId, 0.7);
+		}
+	}
+	return [...scoreMap.entries()].map(([entityId, score]) => ({
+		entityId,
+		score,
+	}));
+}
+/**
+ * Fill in `extraction_method` on results where it is still undefined.
+ *
+ * Results that already carry a value (including null) are left alone and
+ * cause no query. For the others, the value is read from `graph_nodes` by ID;
+ * a NULL column becomes null, and a result whose row is not found stays
+ * undefined. The array is mutated in place.
+ *
+ * @param db - Database handle.
+ * @param results - Search results to annotate.
+ */
+async function attachProvenance(db: SiaDb, results: SiaSearchResult[]): Promise<void> {
+	for (const entry of results) {
+		if (entry.extraction_method !== undefined) {
+			continue;
+		}
+		const { rows } = await db.execute("SELECT extraction_method FROM graph_nodes WHERE id = ?", [
+			entry.id,
+		]);
+		if (rows.length === 0) {
+			continue;
+		}
+		entry.extraction_method = (rows[0].extraction_method as string | null) ?? null;
+	}
+}

package/src/retrieval/throttle.ts ADDED Viewed

@@ -0,0 +1,102 @@
+// Module: throttle — Progressive rate limiting for MCP tool calls
+import type { SiaDb } from "@/graph/db-interface";
+/** Throttle state reported for a tool call: "normal", "reduced", or "blocked". */
+export type ThrottleMode = "normal" | "reduced" | "blocked";
+/** Result of `ProgressiveThrottle.check`. */
+export interface ThrottleResult {
+	/** Mode derived from the call count and the configured thresholds. */
+	mode: ThrottleMode;
+	/** Calls recorded so far for the session/tool pair, including the current one. */
+	callCount: number;
+	/** Advisory message; set for "reduced" and "blocked", absent for "normal". */
+	warning?: string;
+}
+/** Inclusive call-count thresholds used by `ProgressiveThrottle`. */
+export interface ThrottleConfig {
+	/** Highest call count still reported as "normal". */
+	normalMax: number;
+	/** Highest call count still reported as "reduced"; anything above is "blocked". */
+	reducedMax: number;
+}
+/** Thresholds applied when the `ProgressiveThrottle` constructor receives no overrides. */
+const DEFAULT_THROTTLE_CONFIG: ThrottleConfig = {
+	normalMax: 3,
+	reducedMax: 8,
+};
+/**
+ * Names of MCP tools listed for throttling.
+ * NOTE(review): presumably callers consult this set before invoking
+ * `ProgressiveThrottle.check`; the consumer is not visible in this module — confirm.
+ */
+export const THROTTLED_TOOLS = new Set([
+	"sia_search",
+	"sia_execute",
+	"sia_execute_file",
+	"sia_fetch_and_index",
+	"sia_by_file",
+	"sia_expand",
+	"sia_at_time",
+	"sia_backlinks",
+]);
+/**
+ * Progressive throttle backed by the search_throttle table in graph.db.
+ *
+ * Thresholds (inclusive):
+ *  - count <= normalMax  → "normal"
+ *  - count <= reducedMax → "reduced" (with warning)
+ *  - count >  reducedMax → "blocked" (with warning mentioning sia_batch_execute)
+ */
+export class ProgressiveThrottle {
+	private config: ThrottleConfig;
+	/**
+	 * @param db - Database handle holding the search_throttle table.
+	 * @param config - Optional threshold overrides; any field that is omitted
+	 *                 (or explicitly undefined) keeps its default value.
+	 */
+	constructor(
+		private db: SiaDb,
+		config?: Partial<ThrottleConfig>,
+	) {
+		// Resolve each field on its own. Spreading the partial would let an
+		// explicit `undefined` overwrite the default, after which every threshold
+		// comparison is false and every call is reported as "blocked".
+		this.config = {
+			normalMax: config?.normalMax ?? DEFAULT_THROTTLE_CONFIG.normalMax,
+			reducedMax: config?.reducedMax ?? DEFAULT_THROTTLE_CONFIG.reducedMax,
+		};
+	}
+	/**
+	 * Record a tool call for the given session/tool pair and return the throttle mode.
+	 *
+	 * Every invocation increments the stored counter, including calls that end
+	 * up reported as "blocked".
+	 *
+	 * @param sessionId - Session the call belongs to.
+	 * @param toolName - Name of the tool being called.
+	 * @returns The mode, the updated call count, and a warning for non-normal modes.
+	 */
+	async check(sessionId: string, toolName: string): Promise<ThrottleResult> {
+		const now = Date.now();
+		// Upsert: insert or increment call_count
+		await this.db.execute(
+			`INSERT INTO search_throttle (session_id, tool_name, call_count, last_called_at)
+       VALUES (?, ?, 1, ?)
+       ON CONFLICT(session_id, tool_name) DO UPDATE SET
+         call_count = call_count + 1,
+         last_called_at = ?`,
+			[sessionId, toolName, now, now],
+		);
+		// Read back the updated count
+		const { rows } = await this.db.execute(
+			"SELECT call_count FROM search_throttle WHERE session_id = ? AND tool_name = ?",
+			[sessionId, toolName],
+		);
+		// Coerce instead of casting so a driver that returns the integer column as
+		// a string or bigint still yields a plain number; a missing row counts as
+		// the first call.
+		const storedCount = rows[0]?.call_count;
+		const callCount = storedCount == null ? 1 : Number(storedCount);
+		const { normalMax, reducedMax } = this.config;
+		if (callCount <= normalMax) {
+			return { mode: "normal", callCount };
+		}
+		if (callCount <= reducedMax) {
+			return {
+				mode: "reduced",
+				callCount,
+				warning: `Reducing results (${callCount} calls). Consider sia_batch_execute for batch operations.`,
+			};
+		}
+		return {
+			mode: "blocked",
+			callCount,
+			warning: `Tool blocked for this session (${callCount} calls). Use sia_batch_execute instead.`,
+		};
+	}
+	/**
+	 * Clear all throttle entries for the given session.
+	 *
+	 * @param sessionId - Session whose counters are deleted.
+	 */
+	async reset(sessionId: string): Promise<void> {
+		await this.db.execute("DELETE FROM search_throttle WHERE session_id = ?", [sessionId]);
+	}
+}
+}