@mindrian_os/install 1.13.0-beta.11
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude-plugin/plugin.json +21 -0
- package/.mcp.json +9 -0
- package/CHANGELOG.md +3333 -0
- package/LICENSE +123 -0
- package/README.md +673 -0
- package/agents/brain-query.md +80 -0
- package/agents/framework-runner.md +237 -0
- package/agents/grading.md +188 -0
- package/agents/investor.md +128 -0
- package/agents/larry-extended.md +135 -0
- package/agents/opportunity-scanner.md +91 -0
- package/agents/persona-analyst.md +132 -0
- package/agents/research.md +89 -0
- package/agents/reverse-salient-agent.md +27 -0
- package/bin/cli.js +142 -0
- package/bin/mindrian-mcp-server.cjs +182 -0
- package/bin/mindrian-tools.cjs +765 -0
- package/commands/act.md +439 -0
- package/commands/admin.md +404 -0
- package/commands/analyze-needs.md +42 -0
- package/commands/analyze-systems.md +39 -0
- package/commands/analyze-timing.md +42 -0
- package/commands/auto-explore.md +64 -0
- package/commands/beautiful-question.md +40 -0
- package/commands/brain-derive.md +78 -0
- package/commands/build-knowledge.md +42 -0
- package/commands/build-thesis.md +46 -0
- package/commands/causal.md +234 -0
- package/commands/challenge-assumptions.md +33 -0
- package/commands/compare-ventures.md +83 -0
- package/commands/dashboard.md +110 -0
- package/commands/deep-grade.md +82 -0
- package/commands/diagnose.md +58 -0
- package/commands/diagnostics.md +151 -0
- package/commands/doctor.md +151 -0
- package/commands/dominant-designs.md +40 -0
- package/commands/explain-decision.md +87 -0
- package/commands/explore-domains.md +42 -0
- package/commands/explore-futures.md +40 -0
- package/commands/explore-trends.md +42 -0
- package/commands/export.md +103 -0
- package/commands/file-meeting.md +724 -0
- package/commands/find-analogies.md +188 -0
- package/commands/find-bottlenecks.md +62 -0
- package/commands/find-connections.md +76 -0
- package/commands/funding.md +81 -0
- package/commands/grade.md +203 -0
- package/commands/graph.md +128 -0
- package/commands/hat-briefing.md +125 -0
- package/commands/heal.md +196 -0
- package/commands/help.md +399 -0
- package/commands/hmi-status.md +172 -0
- package/commands/jtbd.md +241 -0
- package/commands/leadership.md +73 -0
- package/commands/lean-canvas.md +40 -0
- package/commands/macro-trends.md +40 -0
- package/commands/map-unknowns.md +40 -0
- package/commands/memory.md +173 -0
- package/commands/models.md +175 -0
- package/commands/mos-reason.md +285 -0
- package/commands/mullins.md +120 -0
- package/commands/new-project.md +481 -0
- package/commands/onboard.md +434 -0
- package/commands/operator.md +149 -0
- package/commands/opportunities.md +144 -0
- package/commands/organize.md +497 -0
- package/commands/persona.md +198 -0
- package/commands/pipeline.md +112 -0
- package/commands/present.md +91 -0
- package/commands/publish.md +201 -0
- package/commands/query.md +124 -0
- package/commands/radar.md +72 -0
- package/commands/reanalyze.md +91 -0
- package/commands/research.md +196 -0
- package/commands/room.md +352 -0
- package/commands/rooms.md +598 -0
- package/commands/root-cause.md +40 -0
- package/commands/rs-experts.md +85 -0
- package/commands/rs-explain.md +100 -0
- package/commands/rs-fetch.md +94 -0
- package/commands/rs-thesis.md +85 -0
- package/commands/scenario-plan.md +40 -0
- package/commands/scheduled-tasks.md +285 -0
- package/commands/score-innovation.md +43 -0
- package/commands/scout.md +239 -0
- package/commands/setup.md +618 -0
- package/commands/snapshot.md +147 -0
- package/commands/speakers.md +84 -0
- package/commands/splash.md +28 -0
- package/commands/status.md +75 -0
- package/commands/structure-argument.md +42 -0
- package/commands/suggest-next.md +80 -0
- package/commands/systems-thinking.md +40 -0
- package/commands/think-hats.md +42 -0
- package/commands/update.md +181 -0
- package/commands/user-needs.md +40 -0
- package/commands/validate.md +40 -0
- package/commands/value-proposition.md +61 -0
- package/commands/vault.md +180 -0
- package/commands/visualize.md +52 -0
- package/commands/whitespace.md +507 -0
- package/commands/wiki.md +69 -0
- package/hooks/hooks.json +381 -0
- package/hooks/run-hook.cmd +64 -0
- package/lib/__init__.py +0 -0
- package/lib/__pycache__/__init__.cpython-312.pyc +0 -0
- package/lib/agents/auto-explore-agent.cjs +1043 -0
- package/lib/agents/reverse-salient-agent.cjs +679 -0
- package/lib/agents/tension-hook-agent.cjs +544 -0
- package/lib/brain/ROOM.md +44 -0
- package/lib/brain/chain-recommender.cjs +301 -0
- package/lib/chat/chat-context.js +185 -0
- package/lib/chat/chat-panel.js +721 -0
- package/lib/chat/fabric-chat.cjs +288 -0
- package/lib/chat/generative-tools.js +219 -0
- package/lib/conversation/ROOM.md +39 -0
- package/lib/conversation/classifier-rules.json +38 -0
- package/lib/conversation/classifier.cjs +264 -0
- package/lib/conversation/operator.cjs +287 -0
- package/lib/copy/115-spec-strings.cjs +55 -0
- package/lib/core/__init__.py +0 -0
- package/lib/core/__nav-stub.cjs +14 -0
- package/lib/core/__pycache__/__init__.cpython-312.pyc +0 -0
- package/lib/core/__pycache__/rs-math.cpython-312.pyc +0 -0
- package/lib/core/__pycache__/rs_cache.cpython-312.pyc +0 -0
- package/lib/core/__pycache__/rs_corpus.cpython-312.pyc +0 -0
- package/lib/core/__pycache__/rs_hybrid.cpython-312.pyc +0 -0
- package/lib/core/__pycache__/rs_math.cpython-312.pyc +0 -0
- package/lib/core/__pycache__/rs_rooms.cpython-312.pyc +0 -0
- package/lib/core/artifact-id.cjs +148 -0
- package/lib/core/asset-ops.cjs +151 -0
- package/lib/core/auto-commit-throttle.cjs +129 -0
- package/lib/core/bearer-token.cjs +199 -0
- package/lib/core/brain-client.cjs +865 -0
- package/lib/core/brain-derivation-prompts.cjs +326 -0
- package/lib/core/brain-derivation-queue.cjs +431 -0
- package/lib/core/brain-derivation.cjs +580 -0
- package/lib/core/brain-md-schema.cjs +528 -0
- package/lib/core/brain-md-staleness.cjs +357 -0
- package/lib/core/brain-response-sanitize.cjs +188 -0
- package/lib/core/bridge-writer.cjs +477 -0
- package/lib/core/chat-context-builder.cjs +253 -0
- package/lib/core/cross-room-aggregator.cjs +762 -0
- package/lib/core/daily-briefing.cjs +438 -0
- package/lib/core/decision-capture.cjs +618 -0
- package/lib/core/deep-links.cjs +82 -0
- package/lib/core/dispatch-optimizer.cjs +354 -0
- package/lib/core/dual-path-detector.cjs +84 -0
- package/lib/core/dual-path-detector.test.cjs +334 -0
- package/lib/core/exports-log.cjs +79 -0
- package/lib/core/feynman-minto-invariants.cjs +605 -0
- package/lib/core/folder-memory-async.cjs +338 -0
- package/lib/core/folder-memory-shared.cjs +890 -0
- package/lib/core/folder-memory.cjs +416 -0
- package/lib/core/framework-chain-composer.cjs +411 -0
- package/lib/core/frontmatter-schemas.cjs +330 -0
- package/lib/core/git-ops.cjs +141 -0
- package/lib/core/graph-ops.cjs +258 -0
- package/lib/core/hat-persistence.cjs +362 -0
- package/lib/core/index.cjs +60 -0
- package/lib/core/integration-registry.cjs +232 -0
- package/lib/core/intelligence-cascade.cjs +661 -0
- package/lib/core/lazygraph-ops.cjs +1057 -0
- package/lib/core/lru-cache.cjs +139 -0
- package/lib/core/mcp-profiles.cjs +182 -0
- package/lib/core/meeting-ops.cjs +54 -0
- package/lib/core/memory-ops.cjs +600 -0
- package/lib/core/migrations/ROOM.md +33 -0
- package/lib/core/migrations/phase-109-nodes-provenance.cjs +339 -0
- package/lib/core/migrations/phase-109-session-focus.cjs +99 -0
- package/lib/core/model-profiles.cjs +246 -0
- package/lib/core/mullins-scaffold.cjs +160 -0
- package/lib/core/nav-dial.cjs +316 -0
- package/lib/core/navigation/ROOM.md +15 -0
- package/lib/core/navigation/explanation.cjs +43 -0
- package/lib/core/navigation/focus.cjs +135 -0
- package/lib/core/navigation/ingestion.cjs +82 -0
- package/lib/core/navigation/insights.cjs +350 -0
- package/lib/core/navigation/memory-events.cjs +118 -0
- package/lib/core/navigation/neighborhood.cjs +78 -0
- package/lib/core/navigation/packet.cjs +182 -0
- package/lib/core/navigation/room-home.cjs +127 -0
- package/lib/core/navigation/transitions.cjs +82 -0
- package/lib/core/navigation-engine-shared.cjs +242 -0
- package/lib/core/navigation-engine.cjs +664 -0
- package/lib/core/navigation.cjs +60 -0
- package/lib/core/nl-graph-queries.cjs +164 -0
- package/lib/core/offer-presenter.cjs +406 -0
- package/lib/core/opportunity-extractor.cjs +183 -0
- package/lib/core/opportunity-ops.cjs +1371 -0
- package/lib/core/persona-ops.cjs +537 -0
- package/lib/core/persona-taxonomy.cjs +190 -0
- package/lib/core/platform-gates.cjs +120 -0
- package/lib/core/platform.cjs +257 -0
- package/lib/core/proactive-intelligence.cjs +528 -0
- package/lib/core/problem-type-router.cjs +315 -0
- package/lib/core/reasoning-ops.cjs +639 -0
- package/lib/core/reverse-salient-persona-suffix.cjs +115 -0
- package/lib/core/room-classifier-strict-mode.cjs +229 -0
- package/lib/core/room-db.cjs +127 -0
- package/lib/core/room-ops-async.cjs +92 -0
- package/lib/core/room-ops-shared.cjs +64 -0
- package/lib/core/room-ops-sync.cjs +70 -0
- package/lib/core/room-ops.cjs +32 -0
- package/lib/core/room-type-detector.cjs +386 -0
- package/lib/core/rs-brain-substrate-prompts.cjs +129 -0
- package/lib/core/rs-brain-substrate.cjs +570 -0
- package/lib/core/rs-breakthrough-scorer.cjs +255 -0
- package/lib/core/rs-canon-violations.cjs +82 -0
- package/lib/core/rs-chain-feeder.cjs +343 -0
- package/lib/core/rs-commercial-assessor.cjs +280 -0
- package/lib/core/rs-differential-scorer.cjs +376 -0
- package/lib/core/rs-domain-analyzer.cjs +385 -0
- package/lib/core/rs-egress-prompts.cjs +113 -0
- package/lib/core/rs-egress-telemetry.cjs +225 -0
- package/lib/core/rs-egress-violations.cjs +53 -0
- package/lib/core/rs-expert-mapper.cjs +467 -0
- package/lib/core/rs-fetcher-academic.cjs +697 -0
- package/lib/core/rs-fetcher-experts.cjs +314 -0
- package/lib/core/rs-fetcher-industry.cjs +731 -0
- package/lib/core/rs-fetcher-patents.cjs +564 -0
- package/lib/core/rs-innovation-classifier.cjs +194 -0
- package/lib/core/rs-mind-map.cjs +656 -0
- package/lib/core/rs-neo4j-writer.cjs +388 -0
- package/lib/core/rs-nl-to-query.cjs +425 -0
- package/lib/core/rs-pinecone-bridge.cjs +303 -0
- package/lib/core/rs-preprocessor.cjs +350 -0
- package/lib/core/rs-query-matrix.cjs +316 -0
- package/lib/core/rs-query-to-text.cjs +438 -0
- package/lib/core/rs-sqlite-mirror.cjs +443 -0
- package/lib/core/rs-thesis-generator.cjs +188 -0
- package/lib/core/rs_cache.py +479 -0
- package/lib/core/rs_corpus.py +468 -0
- package/lib/core/rs_hybrid.py +586 -0
- package/lib/core/rs_math.py +287 -0
- package/lib/core/rs_rooms.py +193 -0
- package/lib/core/scheduled-scanner.cjs +463 -0
- package/lib/core/scratchpad-ops.cjs +201 -0
- package/lib/core/section-8-trace-schema.cjs +138 -0
- package/lib/core/section-registry.cjs +111 -0
- package/lib/core/session-state.cjs +144 -0
- package/lib/core/shallow-doc-parser.cjs +174 -0
- package/lib/core/shallow-doc-parser.test.cjs +226 -0
- package/lib/core/skill-activation-router.cjs +284 -0
- package/lib/core/state-ops.cjs +46 -0
- package/lib/core/statusline-cache.cjs +266 -0
- package/lib/core/token-estimator.cjs +348 -0
- package/lib/core/user-archetype.cjs +239 -0
- package/lib/core/user-md-ops.cjs +524 -0
- package/lib/core/visual-ops.cjs +624 -0
- package/lib/core/write-lock.cjs +149 -0
- package/lib/graph/canvas-graph.js +467 -0
- package/lib/graph/constellation-config.cjs +299 -0
- package/lib/graph/graph-detail-panel.js +165 -0
- package/lib/hmi/ROOM.md +47 -0
- package/lib/hmi/across-session-memory.cjs +604 -0
- package/lib/hmi/cross-room-memory.cjs +575 -0
- package/lib/hmi/decoy-tier.cjs +395 -0
- package/lib/hmi/jtbd-classifier.cjs +219 -0
- package/lib/hmi/jtbd-state.cjs +199 -0
- package/lib/hmi/jtbd-taxonomy.json +392 -0
- package/lib/hmi/selector-dispatcher.cjs +546 -0
- package/lib/hmi/selector-telemetry.cjs +263 -0
- package/lib/hmi/shape-f0-renderer.cjs +139 -0
- package/lib/hmi/shape-f1-fallback.cjs +80 -0
- package/lib/hmi/shape-f1-renderer.cjs +138 -0
- package/lib/hmi/shape-f2-renderer.cjs +132 -0
- package/lib/hmi/shape-f3-renderer.cjs +66 -0
- package/lib/hmi/shape-f4-renderer.cjs +72 -0
- package/lib/hmi/shape-f5-renderer.cjs +155 -0
- package/lib/hmi/shape-f6-plan-review-renderer.cjs +312 -0
- package/lib/hmi/shape-f6-renderer.cjs +144 -0
- package/lib/hmi/shape-g-renderer.cjs +219 -0
- package/lib/hmi/shape-h-renderer.cjs +222 -0
- package/lib/hmi/tier-check.cjs +63 -0
- package/lib/import/PRECONDITIONS.md +41 -0
- package/lib/import/branding.cjs +210 -0
- package/lib/import/branding.test.cjs +235 -0
- package/lib/import/classifications-sync.cjs +104 -0
- package/lib/import/classifications-sync.test.cjs +129 -0
- package/lib/import/enricher.cjs +296 -0
- package/lib/import/enricher.test.cjs +273 -0
- package/lib/import/integration.test.cjs +376 -0
- package/lib/import/manifest.cjs +129 -0
- package/lib/import/manifest.schema.json +185 -0
- package/lib/import/manifest.test.cjs +123 -0
- package/lib/import/meeting-detector.cjs +92 -0
- package/lib/import/meeting-detector.test.cjs +100 -0
- package/lib/import/person-detector.cjs +229 -0
- package/lib/import/person-detector.test.cjs +149 -0
- package/lib/import/report.cjs +186 -0
- package/lib/import/report.test.cjs +186 -0
- package/lib/import/room-md-scaffolder.cjs +49 -0
- package/lib/import/router.cjs +224 -0
- package/lib/import/router.test.cjs +356 -0
- package/lib/import/run-all-tests.cjs +36 -0
- package/lib/import/smoke-test.cjs +213 -0
- package/lib/import/smoke-test.test.cjs +148 -0
- package/lib/import/test-fixtures/collision-vault/preexisting-room/STATE.md +8 -0
- package/lib/import/test-fixtures/collision-vault/preexisting-room/problem-definition/onboarding/onboarding.md +7 -0
- package/lib/import/test-fixtures/collision-vault/source/onboarding.md +5 -0
- package/lib/import/test-fixtures/obsidian-vault/.obsidian/workspace.json +1 -0
- package/lib/import/test-fixtures/obsidian-vault/notes/with-wikilinks.md +4 -0
- package/lib/import/test-fixtures/tiny-vault/notes/2026-01-15-team-sync.md +9 -0
- package/lib/import/test-fixtures/tiny-vault/notes/empty.md +3 -0
- package/lib/import/test-fixtures/tiny-vault/notes/onboarding.md +5 -0
- package/lib/import/test-fixtures/tiny-vault/notes/pricing.md +5 -0
- package/lib/import/test-fixtures/tiny-vault/notes/random.md +4 -0
- package/lib/import/undo.test.cjs +199 -0
- package/lib/import/vault-scanner.cjs +105 -0
- package/lib/import/vault-scanner.test.cjs +67 -0
- package/lib/mcp/app-html/dashboard.html +316 -0
- package/lib/mcp/app-html/graph.html +428 -0
- package/lib/mcp/app-html/mindrian-platform.html +1841 -0
- package/lib/mcp/app-html/wiki.html +383 -0
- package/lib/mcp/app-views.cjs +322 -0
- package/lib/mcp/brain-router.cjs +418 -0
- package/lib/mcp/capability-registry.cjs +62 -0
- package/lib/mcp/larry-context.cjs +46 -0
- package/lib/mcp/larry-server-instructions.md +114 -0
- package/lib/mcp/pipeline-state.cjs +275 -0
- package/lib/mcp/prompts.cjs +302 -0
- package/lib/mcp/resources.cjs +227 -0
- package/lib/mcp/session-catchup.cjs +327 -0
- package/lib/mcp/surface-detect.cjs +75 -0
- package/lib/mcp/tool-router.cjs +1034 -0
- package/lib/memory/aaak-compress.cjs +403 -0
- package/lib/memory/aaak-compress.test.cjs +288 -0
- package/lib/memory/async-artifact-auto-commit.test.cjs +223 -0
- package/lib/memory/bearer-token.test.cjs +315 -0
- package/lib/memory/brain-cache-lru.test.cjs +259 -0
- package/lib/memory/brain-client-query-shape.test.cjs +160 -0
- package/lib/memory/brain-derivation-graceful-degradation.test.cjs +1019 -0
- package/lib/memory/brain-derivation-queue.test.cjs +539 -0
- package/lib/memory/brain-derivation.test.cjs +634 -0
- package/lib/memory/brain-derive-command.test.cjs +534 -0
- package/lib/memory/brain-md-invariants-validator.test.cjs +704 -0
- package/lib/memory/brain-md-schema.test.cjs +467 -0
- package/lib/memory/brain-md-staleness.test.cjs +525 -0
- package/lib/memory/brain-server-resolution.test.cjs +314 -0
- package/lib/memory/chain-recommender.test.cjs +233 -0
- package/lib/memory/chat-context.test.cjs +128 -0
- package/lib/memory/command-registry.test.cjs +220 -0
- package/lib/memory/cross-room-aggregator.test.cjs +909 -0
- package/lib/memory/dashboard-server.test.cjs +256 -0
- package/lib/memory/debouncer-drain-at-prompt.test.cjs +389 -0
- package/lib/memory/decision-capture.test.cjs +632 -0
- package/lib/memory/decision-capture.worker.cjs +70 -0
- package/lib/memory/explain-decision-command.test.cjs +521 -0
- package/lib/memory/explain-decision-footer.test.cjs +316 -0
- package/lib/memory/explored-materials-store.cjs +392 -0
- package/lib/memory/feynman-minto-guardian.test.cjs +736 -0
- package/lib/memory/feynman-minto-invariants.test.cjs +511 -0
- package/lib/memory/feynman-prompts-drift.test.cjs +144 -0
- package/lib/memory/feynman-prompts.cjs +151 -0
- package/lib/memory/feynman-prompts.test.cjs +96 -0
- package/lib/memory/folder-memory-quadruple.test.cjs +548 -0
- package/lib/memory/folder-memory.test.cjs +503 -0
- package/lib/memory/framework-chain-composer.test.cjs +515 -0
- package/lib/memory/frontmatter-schema-validator.test.cjs +290 -0
- package/lib/memory/heal-command.test.cjs +604 -0
- package/lib/memory/index-artifact-transaction.test.cjs +333 -0
- package/lib/memory/lazygraph-rs-discoveries-view.test.cjs +122 -0
- package/lib/memory/mcp-input-validation.test.cjs +240 -0
- package/lib/memory/mcp-server-brain-deps.test.cjs +270 -0
- package/lib/memory/mcp-stack-fallback.test.cjs +433 -0
- package/lib/memory/minto-debouncer.test.cjs +407 -0
- package/lib/memory/minto-debouncer.worker.cjs +46 -0
- package/lib/memory/minto-migration-v88.test.cjs +265 -0
- package/lib/memory/minto-schema-v88.test.cjs +390 -0
- package/lib/memory/mos-status-renderer.test.cjs +631 -0
- package/lib/memory/narrative-schema.cjs +376 -0
- package/lib/memory/narrative-schema.test.cjs +209 -0
- package/lib/memory/nav-dial.test.cjs +414 -0
- package/lib/memory/navigation-engine-core.test.cjs +722 -0
- package/lib/memory/navigation-invariants.test.cjs +483 -0
- package/lib/memory/offer-presenter.test.cjs +554 -0
- package/lib/memory/on-stop-snapshot.test.cjs +404 -0
- package/lib/memory/pending-tension-store.cjs +373 -0
- package/lib/memory/post-compact-reinjection.test.cjs +854 -0
- package/lib/memory/post-write-triple.test.cjs +317 -0
- package/lib/memory/pre-compact-snapshot.test.cjs +495 -0
- package/lib/memory/problem-type-router.test.cjs +656 -0
- package/lib/memory/query-efficiency-telemetry.test.cjs +370 -0
- package/lib/memory/recompile-room-references.test.cjs +392 -0
- package/lib/memory/recompile-room-references.worker.cjs +42 -0
- package/lib/memory/record-decision-dual-write.test.cjs +454 -0
- package/lib/memory/room-classifier-strict-mode.test.cjs +417 -0
- package/lib/memory/room-minto-hook.test.cjs +398 -0
- package/lib/memory/rs-discovery-engine.test.cjs +323 -0
- package/lib/memory/run-feynman-tests.cjs +1247 -0
- package/lib/memory/security-trifecta.test.cjs +312 -0
- package/lib/memory/session-start-brain-staleness.test.cjs +363 -0
- package/lib/memory/session-start-triple-injection.test.cjs +514 -0
- package/lib/memory/sessionstart-banner-formatter.cjs +318 -0
- package/lib/memory/sessionstart-minto-banner.test.cjs +373 -0
- package/lib/memory/skill-activation-router.test.cjs +419 -0
- package/lib/memory/stamp-artifact-write.test.cjs +304 -0
- package/lib/memory/statusline-active-room.test.cjs +315 -0
- package/lib/memory/statusline-minto-segment.test.cjs +292 -0
- package/lib/memory/sync-async-entry-points.test.cjs +204 -0
- package/lib/memory/test-bridge-writer-enhanced.cjs +452 -0
- package/lib/memory/test-rs-brain-substrate-shape.cjs +529 -0
- package/lib/memory/test-rs-brain-substrate.cjs +636 -0
- package/lib/memory/test-rs-breakthrough-scorer.cjs +375 -0
- package/lib/memory/test-rs-canon-violations.cjs +218 -0
- package/lib/memory/test-rs-chain-feeder-core.cjs +344 -0
- package/lib/memory/test-rs-chain-feeder-skill-spawn.cjs +297 -0
- package/lib/memory/test-rs-commercial-assessor.cjs +385 -0
- package/lib/memory/test-rs-differential-scorer.cjs +480 -0
- package/lib/memory/test-rs-discovery-engine.cjs +603 -0
- package/lib/memory/test-rs-domain-analyzer.cjs +492 -0
- package/lib/memory/test-rs-egress-primitives.cjs +420 -0
- package/lib/memory/test-rs-expert-mapper.cjs +547 -0
- package/lib/memory/test-rs-explain-command.cjs +443 -0
- package/lib/memory/test-rs-fetcher-academic.cjs +848 -0
- package/lib/memory/test-rs-fetcher-experts.cjs +496 -0
- package/lib/memory/test-rs-fetcher-industry.cjs +702 -0
- package/lib/memory/test-rs-fetcher-patents.cjs +674 -0
- package/lib/memory/test-rs-innovation-classifier.cjs +301 -0
- package/lib/memory/test-rs-mind-map.cjs +646 -0
- package/lib/memory/test-rs-neo4j-writer.cjs +518 -0
- package/lib/memory/test-rs-nl-to-query.cjs +449 -0
- package/lib/memory/test-rs-pinecone-bridge.cjs +277 -0
- package/lib/memory/test-rs-preprocessor.cjs +433 -0
- package/lib/memory/test-rs-query-matrix.cjs +391 -0
- package/lib/memory/test-rs-query-to-text.cjs +551 -0
- package/lib/memory/test-rs-sqlite-mirror.cjs +649 -0
- package/lib/memory/test-rs-thesis-generator.cjs +360 -0
- package/lib/memory/triple-context-formatter.cjs +473 -0
- package/lib/memory/triple-context-formatter.test.cjs +442 -0
- package/lib/memory/user-md-persona.test.cjs +565 -0
- package/lib/memory/userpromptsubmit-integration.test.cjs +690 -0
- package/lib/memory/validators/README.md +157 -0
- package/lib/memory/validators/brain-md-invariants.cjs +475 -0
- package/lib/memory/validators/brain-substrate-invariants.cjs +285 -0
- package/lib/memory/validators/external-academic-invariants.cjs +249 -0
- package/lib/memory/validators/external-industry-invariants.cjs +271 -0
- package/lib/memory/validators/external-patents-invariants.cjs +266 -0
- package/lib/memory/validators/minto-invariants.cjs +62 -0
- package/lib/memory/validators/navigation-invariants.cjs +340 -0
- package/lib/memory/validators/queue-health.cjs +95 -0
- package/lib/memory/validators/snapshot-integrity.cjs +129 -0
- package/lib/memory/validators/stale-lifecycle.cjs +116 -0
- package/lib/memory/vault-section-minto-generator-atomic.test.cjs +556 -0
- package/lib/memory/vault-section-minto-generator-atomic.worker.cjs +73 -0
- package/lib/memory/write-lock-atomic.test.cjs +137 -0
- package/lib/memory/write-lock-atomic.worker.cjs +55 -0
- package/lib/parity/check-parity.cjs +83 -0
- package/lib/presentation/presentation-server.cjs +101 -0
- package/lib/presentation/presentation-watcher.cjs +123 -0
- package/lib/quickview/hub-server.cjs +719 -0
- package/lib/quickview/server.cjs +533 -0
- package/lib/render/JTBD-PALETTES.md +145 -0
- package/lib/render/ROOM.md +59 -0
- package/lib/render/render-v2.cjs +486 -0
- package/lib/render/render-v2.test.cjs +267 -0
- package/lib/render/render.cjs +65 -0
- package/lib/state/ROOM.md +46 -0
- package/lib/state/state-md-parser.cjs +215 -0
- package/lib/statusline/ROOM.md +38 -0
- package/lib/statusline/banner-suppression.cjs +50 -0
- package/lib/statusline/surface-detect.cjs +85 -0
- package/lib/update-bootstrap.sh.template +145 -0
- package/lib/vault/frontmatter-schema.cjs +297 -0
- package/lib/vault/room-scanner.cjs +352 -0
- package/lib/vault/wikilink-builder.cjs +231 -0
- package/lib/vault/wikilink-builder.test.cjs +182 -0
- package/lib/wiki/graph-links.cjs +281 -0
- package/lib/wiki/page-renderer.cjs +229 -0
- package/lib/wiki/wiki-chat.cjs +81 -0
- package/lib/wiki/wiki-layout.cjs +1459 -0
- package/lib/wiki/wiki-search.cjs +142 -0
- package/lib/wiki/wiki-server.cjs +678 -0
- package/lib/wiki/wiki-watcher.cjs +105 -0
- package/lib/workflow/ROOM.md +47 -0
- package/lib/workflow/command-resolver.cjs +155 -0
- package/lib/workflow/command-resolver.test.cjs +235 -0
- package/package.json +44 -0
- package/pipelines/analogy/01-decompose.md +80 -0
- package/pipelines/analogy/02-abstract.md +87 -0
- package/pipelines/analogy/03-search.md +135 -0
- package/pipelines/analogy/04-transfer.md +101 -0
- package/pipelines/analogy/05-validate.md +106 -0
- package/pipelines/analogy/CHAIN.md +56 -0
- package/pipelines/discovery/01-explore-domains.md +44 -0
- package/pipelines/discovery/02-think-hats.md +50 -0
- package/pipelines/discovery/03-analyze-needs.md +54 -0
- package/pipelines/discovery/CHAIN.md +37 -0
- package/pipelines/thesis/01-structure-argument.md +45 -0
- package/pipelines/thesis/02-challenge-assumptions.md +48 -0
- package/pipelines/thesis/03-build-thesis.md +54 -0
- package/pipelines/thesis/CHAIN.md +37 -0
- package/references/brain/causal-directives.md +91 -0
- package/references/brain/causal-enrichment.cypher +165 -0
- package/references/brain/command-triggers-schema.md +226 -0
- package/references/brain/graph-architecture.md +317 -0
- package/references/brain/query-patterns.md +460 -0
- package/references/brain/room-hierarchy-schema.md +218 -0
- package/references/brain/schema.md +76 -0
- package/references/capability-radar/capabilities-index.md +241 -0
- package/references/capability-radar/changelog-cache.md +81 -0
- package/references/causal/causal-schema.md +103 -0
- package/references/design/email-template-standard.md +155 -0
- package/references/design/graph-visualization-standard.md +178 -0
- package/references/document-generation.md +179 -0
- package/references/hsi/HSI-TOOLS-REFERENCE.md +222 -0
- package/references/import-config.md +141 -0
- package/references/integrations/detection-patterns.md +101 -0
- package/references/meeting/artifact-template.md +377 -0
- package/references/meeting/cross-meeting-intelligence.md +216 -0
- package/references/meeting/cross-relationship-patterns.md +202 -0
- package/references/meeting/live-join-interface.md +244 -0
- package/references/meeting/section-mapping.md +192 -0
- package/references/meeting/segment-classification.md +258 -0
- package/references/meeting/speaker-profile-template.md +219 -0
- package/references/meeting/summary-template.md +348 -0
- package/references/meeting/transcript-patterns.md +226 -0
- package/references/methodology/analyze-needs.md +135 -0
- package/references/methodology/analyze-systems.md +121 -0
- package/references/methodology/analyze-timing.md +149 -0
- package/references/methodology/beautiful-question.md +109 -0
- package/references/methodology/build-knowledge.md +161 -0
- package/references/methodology/build-thesis.md +237 -0
- package/references/methodology/challenge-assumptions.md +127 -0
- package/references/methodology/diagnose.md +169 -0
- package/references/methodology/dominant-designs.md +212 -0
- package/references/methodology/explore-domains.md +147 -0
- package/references/methodology/explore-futures.md +163 -0
- package/references/methodology/explore-trends.md +129 -0
- package/references/methodology/find-bottlenecks.md +131 -0
- package/references/methodology/grade.md +211 -0
- package/references/methodology/index.md +97 -0
- package/references/methodology/leadership.md +200 -0
- package/references/methodology/lean-canvas.md +116 -0
- package/references/methodology/macro-trends.md +192 -0
- package/references/methodology/map-unknowns.md +137 -0
- package/references/methodology/mullins-7-domains.md +104 -0
- package/references/methodology/problem-types.md +65 -0
- package/references/methodology/root-cause.md +178 -0
- package/references/methodology/sapphire-encoding.md +355 -0
- package/references/methodology/scenario-plan.md +178 -0
- package/references/methodology/score-innovation.md +154 -0
- package/references/methodology/structure-argument.md +158 -0
- package/references/methodology/systems-thinking.md +159 -0
- package/references/methodology/think-hats.md +147 -0
- package/references/methodology/triz-matrix.json +751 -0
- package/references/methodology/triz-principles.md +501 -0
- package/references/methodology/user-needs.md +199 -0
- package/references/methodology/validate.md +163 -0
- package/references/methodology/value-proposition.md +244 -0
- package/references/opportunities/funding-lifecycle.md +103 -0
- package/references/opportunities/grant-api-patterns.md +99 -0
- package/references/opportunities/opportunity-template.md +84 -0
- package/references/personality/assessment-philosophy.md +72 -0
- package/references/personality/lexicon.md +100 -0
- package/references/personality/persona-chains.md +56 -0
- package/references/personality/pws-lexicon-full.md +499 -0
- package/references/personality/voice-dna.md +156 -0
- package/references/personas/hat-perspectives.md +76 -0
- package/references/personas/persona-template.md +63 -0
- package/references/pipeline/act-output-contract.md +88 -0
- package/references/pipeline/chains-index.md +39 -0
- package/references/pws-profile-generation.md +79 -0
- package/references/reasoning/reasoning-schema.md +143 -0
- package/references/reasoning/reasoning-template.md +68 -0
- package/references/reasoning/run-template.md +38 -0
- package/references/research/RESEARCH_14_CLAUDE_CODE_SOURCE_ARCHITECTURE.md +209 -0
- package/references/research/RESEARCH_15_V1.8_OPTIMIZATION_JTBD.md +375 -0
- package/references/research/RESEARCH_16_NATIVE_FIRST_PLUGIN_ARCHITECTURE.md +575 -0
- package/references/research/RESEARCH_17_MCP_UI_FRAMEWORKS.md +272 -0
- package/references/taxonomy/TAXONOMY.md +192 -0
- package/references/templates/MINTO.md +36 -0
- package/references/user-research/2026-04-05-leah-lawrence-session.md +202 -0
- package/references/vault-kit/README.md +35 -0
- package/references/vault-kit/app.json +12 -0
- package/references/vault-kit/appearance.json +12 -0
- package/references/vault-kit/graph.json +35 -0
- package/references/vault-kit/snippets/mindrian-destijl.css +297 -0
- package/references/vault-kit/templates/new-artifact.md +37 -0
- package/references/vault-kit/templates/new-meeting-note.md +35 -0
- package/references/vault-kit/templates/new-team-profile.md +29 -0
- package/references/vault-kit/templates/new-xref.md +35 -0
- package/references/visual/symbol-system.md +151 -0
- package/skills/MOSDeckEngine/SKILL.md +325 -0
- package/skills/brain-connector/SKILL.md +114 -0
- package/skills/context-engine/SKILL.md +147 -0
- package/skills/conversation-mode/SKILL.md +102 -0
- package/skills/larry-personality/SKILL.md +219 -0
- package/skills/larry-personality/framework-chains.md +92 -0
- package/skills/larry-personality/mode-engine.md +185 -0
- package/skills/mullins-scaffold/SKILL.md +61 -0
- package/skills/mullins-scaffold/scaffold.json +146 -0
- package/skills/pws-methodology/SKILL.md +49 -0
- package/skills/room-passive/SKILL.md +165 -0
- package/skills/room-proactive/SKILL.md +250 -0
- package/skills/ui-system/SKILL.md +277 -0
|
@@ -0,0 +1,303 @@
|
|
|
1
|
+
/*
|
|
2
|
+
* Copyright (c) 2026 Mindrian. BSL 1.1.
|
|
3
|
+
* Phase 89.2 Plan 06 Task 1 -- Pinecone-direct bridge for 1024-dim
|
|
4
|
+
* vector retrieval (CJS->Python shim).
|
|
5
|
+
*
|
|
6
|
+
* The bridge wraps the existing rs_cache.py::fetch_all_from_namespace
|
|
7
|
+
* primitive (Phase 89-03, v1.10.16) without modifying it. This is a
|
|
8
|
+
* Canon Part 7 (Reuse Before Build) consumer: zero new Python code,
|
|
9
|
+
* zero new index, zero new field schema. The strict-1024-dim deferred
|
|
10
|
+
* item from 89.1 (substrate carries _score not embedding on the live
|
|
11
|
+
* Brain wire path) is resolved here by going Pinecone-direct against
|
|
12
|
+
* the rs-external index used for external corpora.
|
|
13
|
+
*
|
|
14
|
+
* Architecture:
|
|
15
|
+
*
|
|
16
|
+
* queryPineconeWithVectors(namespace, queryText, topK)
|
|
17
|
+
* -> spawnSync python3 -c bridgeScript
|
|
18
|
+
* -> bridgeScript reads JSON from stdin
|
|
19
|
+
* -> bridgeScript invokes rs_cache.fetch_all_from_namespace
|
|
20
|
+
* -> bridgeScript writes JSON {success, hits[]} to stdout
|
|
21
|
+
* -> CJS parses + returns
|
|
22
|
+
*
|
|
23
|
+
* Graceful degradation contract (Phase 89.2-01 / 02 / 03 / 04 pattern):
|
|
24
|
+
*
|
|
25
|
+
* missing PINECONE_API_KEY -> {success: false, error: 'pinecone_api_key_missing'}
|
|
26
|
+
* python3 not on PATH -> {success: false, error: 'python_unavailable'}
|
|
27
|
+
* non-zero exit -> {success: false, error: 'python_exit_<N>'}
|
|
28
|
+
* stdout parse failure -> {success: false, error: 'parse_error'}
|
|
29
|
+
* timeout -> {success: false, error: 'timeout'}
|
|
30
|
+
*
|
|
31
|
+
* NEVER throws. Every external boundary returns a structured envelope.
|
|
32
|
+
*
|
|
33
|
+
* Canon Part 8 (Graph Boundary): two defense-in-depth layers.
|
|
34
|
+
*
|
|
35
|
+
* Layer 1 -- pre-egress: auditQueryString runs on the queryText
|
|
36
|
+
* parameter before spawnSync. Throws ExternalEgressViolation on
|
|
37
|
+
* FORBIDDEN_PATTERNS hit. Adversarial input never reaches Pinecone.
|
|
38
|
+
*
|
|
39
|
+
* Layer 2 -- post-receive: auditQueryObject runs on the parsed hits[]
|
|
40
|
+
* payload before return. Throws ExternalEgressViolation if a hit's
|
|
41
|
+
* metadata smuggles a forbidden pattern through. The rs-external
|
|
42
|
+
* namespace is supposed to hold only public OpenAlex/arXiv metadata
|
|
43
|
+
* (Phase 89-03 Canon attestation), but we re-audit on the receive
|
|
44
|
+
* side because trust is not a security property -- enforcement is.
|
|
45
|
+
*
|
|
46
|
+
* Additionally exposes:
|
|
47
|
+
*
|
|
48
|
+
* cosineSimilarity(a, b) -- pure JS dot(a,b)/(norm(a)*norm(b)).
|
|
49
|
+
* Both inputs MUST be Number arrays of identical length (typically
|
|
50
|
+
* 1024 for Pinecone multilingual-e5-large). Returns 0 on degenerate
|
|
51
|
+
* zero-vectors. Differential scorer uses this on the two query
|
|
52
|
+
* vectors returned by twin queryPineconeWithVectors calls.
|
|
53
|
+
*
|
|
54
|
+
* Pure CJS, zero npm deps, node built-ins only beyond the three
|
|
55
|
+
* rs-egress-* primitives shipped in Wave 1 (Plan 89.2-01).
|
|
56
|
+
*/
|
|
57
|
+
'use strict';
|
|
58
|
+
|
|
59
|
+
const path = require('node:path');
|
|
60
|
+
const childProcess = require('child_process');
|
|
61
|
+
const { auditQueryString, auditQueryObject } = require('./rs-egress-prompts.cjs');
|
|
62
|
+
// rs-egress-violations is required transitively by rs-egress-prompts; we do
|
|
63
|
+
// not throw ExternalEgressViolation directly from this module (the audit
|
|
64
|
+
// helpers do). The require below is a reachability witness for the Canon
|
|
65
|
+
// Part 8 audit chain at module-load time.
|
|
66
|
+
require('./rs-egress-violations.cjs');
|
|
67
|
+
|
|
68
|
+
// ---------- Constants ----------
|
|
69
|
+
|
|
70
|
+
const REPO_ROOT = path.resolve(__dirname, '..', '..');
|
|
71
|
+
const PYTHON_BIN = process.env.MINDRIAN_PYTHON || 'python3';
|
|
72
|
+
const BRIDGE_TIMEOUT_MS = 30000;
|
|
73
|
+
const DEFAULT_LIMIT = 1000;
|
|
74
|
+
|
|
75
|
+
// ---------- Embedded Python bridge script ----------
|
|
76
|
+
//
|
|
77
|
+
// This script is spawned as `python3 -c <script>`. It MUST be valid Python.
|
|
78
|
+
// The leading `# BSL 1.1` line is a deliberate Canon discipline marker so
|
|
79
|
+
// the embedded Python source is licensed identically to the surrounding
|
|
80
|
+
// CJS file (W4 fix per Plan 89.2-06).
|
|
81
|
+
//
|
|
82
|
+
// Protocol:
|
|
83
|
+
//
|
|
84
|
+
// stdin : JSON {namespace: string, limit?: integer}
|
|
85
|
+
// stdout : JSON {success: boolean, hits?: array, error?: string}
|
|
86
|
+
//
|
|
87
|
+
// The script imports rs_cache from lib.core (REPO_ROOT must be on
|
|
88
|
+
// sys.path). On any exception, returns success:false with the exception
|
|
89
|
+
// message. Never raises to the parent process.
|
|
90
|
+
|
|
91
|
+
const bridgeScript = [
|
|
92
|
+
'# BSL 1.1',
|
|
93
|
+
'# Copyright (c) 2026 Mindrian. Phase 89.2 Plan 06 Task 1 -- pinecone bridge embedded Python.',
|
|
94
|
+
'# This script wraps rs_cache.py::fetch_all_from_namespace to retrieve',
|
|
95
|
+
'# 1024-dim Pinecone-direct vectors. JSON over stdio: parent writes a',
|
|
96
|
+
'# request envelope to stdin; child writes a response envelope to stdout.',
|
|
97
|
+
'# Errors are reported via the response envelope (success:false), never',
|
|
98
|
+
'# raised to the parent process. The child exits 0 on graceful failure.',
|
|
99
|
+
'import sys, os, json',
|
|
100
|
+
'# Ensure REPO_ROOT is on sys.path so `from lib.core.rs_cache import ...` resolves.',
|
|
101
|
+
'sys.path.insert(0, os.environ.get("MINDRIAN_REPO_ROOT", os.getcwd()))',
|
|
102
|
+
'try:',
|
|
103
|
+
' from lib.core.rs_cache import fetch_all_from_namespace',
|
|
104
|
+
' payload = json.loads(sys.stdin.read())',
|
|
105
|
+
' ns = payload["namespace"]',
|
|
106
|
+
' limit = int(payload.get("limit", 1000))',
|
|
107
|
+
' records = fetch_all_from_namespace(ns, limit=limit)',
|
|
108
|
+
' # Map rs_cache.py output {id, values, metadata} to bridge hits[].',
|
|
109
|
+
' hits = []',
|
|
110
|
+
' for r in records:',
|
|
111
|
+
' hits.append({',
|
|
112
|
+
' "id": r.get("id", ""),',
|
|
113
|
+
' "score": float(r.get("score", 0.0)) if "score" in r else 0.0,',
|
|
114
|
+
' "values": list(r.get("values") or []),',
|
|
115
|
+
' "metadata": dict(r.get("metadata") or {}),',
|
|
116
|
+
' })',
|
|
117
|
+
' sys.stdout.write(json.dumps({"success": True, "hits": hits}))',
|
|
118
|
+
'except Exception as e:',
|
|
119
|
+
' sys.stdout.write(json.dumps({"success": False, "error": str(e)}))',
|
|
120
|
+
'',
|
|
121
|
+
].join('\n');
|
|
122
|
+
|
|
123
|
+
// ---------- queryPineconeWithVectors ----------
|
|
124
|
+
//
|
|
125
|
+
// Public entry point. Spawns python3 with the embedded bridgeScript,
|
|
126
|
+
// passes the namespace + limit via stdin, parses the JSON response,
|
|
127
|
+
// audits, and returns the structured envelope.
|
|
128
|
+
//
|
|
129
|
+
// Inputs:
|
|
130
|
+
// namespace string the Pinecone namespace, typically 'external:<topic-slug>'
|
|
131
|
+
// queryText string the original user query (audited pre-egress; not used by the
|
|
132
|
+
// bridge call itself since fetch_all_from_namespace pulls all
|
|
133
|
+
// cached vectors -- the BERT cosine is computed downstream).
|
|
134
|
+
// The query text is included in the audit triple so the
|
|
135
|
+
// caller's intent is checked at the gate.
|
|
136
|
+
// topK integer result cap (default 1000; bounded by rs_cache.MAX_NAMESPACE_VECTORS)
|
|
137
|
+
//
|
|
138
|
+
// Returns Promise resolving to:
|
|
139
|
+
// { success: true, hits: [{id, score, values: number[], metadata}] }
|
|
140
|
+
// { success: false, error: 'pinecone_api_key_missing'|'python_unavailable'
|
|
141
|
+
// |'python_exit_<N>'|'parse_error'|'timeout'
|
|
142
|
+
// |'invalid_namespace'|'invalid_top_k', stderr?: string }
|
|
143
|
+
//
|
|
144
|
+
// Throws (the only escape route -- Canon Part 8):
|
|
145
|
+
// ExternalEgressViolation if queryText matches FORBIDDEN_PATTERNS
|
|
146
|
+
// OR if returned hits[] metadata smuggles a forbidden
|
|
147
|
+
// pattern through.
|
|
148
|
+
|
|
149
|
+
async function queryPineconeWithVectors(namespace, queryText, topK) {
|
|
150
|
+
// Argument validation (graceful, never throws on shape errors).
|
|
151
|
+
if (typeof namespace !== 'string' || namespace.length === 0) {
|
|
152
|
+
return { success: false, error: 'invalid_namespace' };
|
|
153
|
+
}
|
|
154
|
+
if (typeof queryText !== 'string') {
|
|
155
|
+
return { success: false, error: 'invalid_query_text' };
|
|
156
|
+
}
|
|
157
|
+
const limit = (typeof topK === 'number' && topK > 0) ? Math.floor(topK) : DEFAULT_LIMIT;
|
|
158
|
+
|
|
159
|
+
// Canon Part 8 Layer 1: pre-egress audit on user-controlled queryText.
|
|
160
|
+
// auditQueryString throws ExternalEgressViolation on hit -- this is the
|
|
161
|
+
// single intentional escape route from this module.
|
|
162
|
+
auditQueryString(queryText, 'pinecone-bridge');
|
|
163
|
+
// Audit the namespace too (defense-in-depth; namespaces are typically
|
|
164
|
+
// 'external:<topic-slug>' so the topic-slug carries the user's domain).
|
|
165
|
+
auditQueryString(namespace, 'pinecone-bridge');
|
|
166
|
+
|
|
167
|
+
// Env-var gate. Pinecone SDK requires PINECONE_API_KEY; if absent the
|
|
168
|
+
// child process raises a RuntimeError. Short-circuit here so the user
|
|
169
|
+
// sees the canonical 'pinecone_api_key_missing' tag and not a stack trace.
|
|
170
|
+
if (!process.env.PINECONE_API_KEY) {
|
|
171
|
+
return { success: false, error: 'pinecone_api_key_missing' };
|
|
172
|
+
}
|
|
173
|
+
|
|
174
|
+
const requestEnvelope = JSON.stringify({ namespace: namespace, limit: limit });
|
|
175
|
+
const childEnv = Object.assign({}, process.env, {
|
|
176
|
+
MINDRIAN_REPO_ROOT: REPO_ROOT,
|
|
177
|
+
});
|
|
178
|
+
|
|
179
|
+
let res;
|
|
180
|
+
try {
|
|
181
|
+
res = childProcess.spawnSync(PYTHON_BIN, ['-c', bridgeScript], {
|
|
182
|
+
input: requestEnvelope,
|
|
183
|
+
encoding: 'utf8',
|
|
184
|
+
timeout: BRIDGE_TIMEOUT_MS,
|
|
185
|
+
env: childEnv,
|
|
186
|
+
cwd: REPO_ROOT,
|
|
187
|
+
});
|
|
188
|
+
} catch (err) {
|
|
189
|
+
// spawnSync itself does not normally throw; this is defense-in-depth.
|
|
190
|
+
return { success: false, error: 'spawn_threw', detail: String(err && err.message) };
|
|
191
|
+
}
|
|
192
|
+
|
|
193
|
+
// Honor per-error-code graceful degradation.
|
|
194
|
+
if (res && res.error) {
|
|
195
|
+
if (res.error.code === 'ENOENT') {
|
|
196
|
+
return { success: false, error: 'python_unavailable' };
|
|
197
|
+
}
|
|
198
|
+
if (res.error.code === 'ETIMEDOUT' || res.error.code === 'ERR_CHILD_PROCESS_TIMEOUT') {
|
|
199
|
+
return { success: false, error: 'timeout' };
|
|
200
|
+
}
|
|
201
|
+
return { success: false, error: 'spawn_error', detail: String(res.error.message) };
|
|
202
|
+
}
|
|
203
|
+
|
|
204
|
+
if (res && res.signal === 'SIGTERM') {
|
|
205
|
+
// Node delivers SIGTERM on timeout; covers the case when the child was
|
|
206
|
+
// killed without the error object being populated.
|
|
207
|
+
return { success: false, error: 'timeout' };
|
|
208
|
+
}
|
|
209
|
+
|
|
210
|
+
const stdout = (res && typeof res.stdout === 'string') ? res.stdout : '';
|
|
211
|
+
const stderr = (res && typeof res.stderr === 'string') ? res.stderr : '';
|
|
212
|
+
|
|
213
|
+
if (res && res.status !== 0) {
|
|
214
|
+
return {
|
|
215
|
+
success: false,
|
|
216
|
+
error: 'python_exit_' + res.status,
|
|
217
|
+
stderr: stderr.slice(0, 500),
|
|
218
|
+
};
|
|
219
|
+
}
|
|
220
|
+
|
|
221
|
+
let parsed;
|
|
222
|
+
try {
|
|
223
|
+
parsed = JSON.parse(stdout);
|
|
224
|
+
} catch (_e) {
|
|
225
|
+
return {
|
|
226
|
+
success: false,
|
|
227
|
+
error: 'parse_error',
|
|
228
|
+
stderr: stderr.slice(0, 500),
|
|
229
|
+
stdout_sample: stdout.slice(0, 200),
|
|
230
|
+
};
|
|
231
|
+
}
|
|
232
|
+
|
|
233
|
+
if (!parsed || typeof parsed !== 'object') {
|
|
234
|
+
return { success: false, error: 'parse_error', stdout_sample: stdout.slice(0, 200) };
|
|
235
|
+
}
|
|
236
|
+
|
|
237
|
+
// Bridge-internal failure: child returned {success:false, error:'...'} envelope.
|
|
238
|
+
if (parsed.success !== true) {
|
|
239
|
+
return {
|
|
240
|
+
success: false,
|
|
241
|
+
error: typeof parsed.error === 'string' ? parsed.error : 'bridge_error',
|
|
242
|
+
};
|
|
243
|
+
}
|
|
244
|
+
|
|
245
|
+
// Canon Part 8 Layer 2: post-receive audit. The rs-external namespace is
|
|
246
|
+
// supposed to hold only public metadata, but trust is not a security
|
|
247
|
+
// property. Re-audit the hits[] payload before returning to the caller.
|
|
248
|
+
// Throws ExternalEgressViolation on hit (intentional escape route).
|
|
249
|
+
auditQueryObject(parsed, 'pinecone-bridge');
|
|
250
|
+
|
|
251
|
+
return parsed;
|
|
252
|
+
}
|
|
253
|
+
|
|
254
|
+
// ---------- cosineSimilarity ----------
|
|
255
|
+
//
|
|
256
|
+
// Pure JS pair-wise cosine similarity on equal-length numeric arrays.
|
|
257
|
+
// Used by the differential scorer to compute BERT cosine between the two
|
|
258
|
+
// vectors returned by twin queryPineconeWithVectors calls (one per concept).
|
|
259
|
+
//
|
|
260
|
+
// Inputs:
|
|
261
|
+
// a, b number[] of equal length (typically 1024 for multilingual-e5-large)
|
|
262
|
+
//
|
|
263
|
+
// Returns:
|
|
264
|
+
// number in [-1, 1] -- Pinecone vectors are typically L2-normalized,
|
|
265
|
+
// so the result is usually in [0, 1].
|
|
266
|
+
// 0 -- if either vector is degenerate (norm == 0) OR
|
|
267
|
+
// lengths differ. Caller treats 0 as no signal.
|
|
268
|
+
//
|
|
269
|
+
// Throws:
|
|
270
|
+
// never. Returns 0 on shape errors so the caller's downstream logic
|
|
271
|
+
// stays in graceful-degradation territory.
|
|
272
|
+
|
|
273
|
+
function cosineSimilarity(a, b) {
|
|
274
|
+
if (!Array.isArray(a) || !Array.isArray(b)) return 0;
|
|
275
|
+
if (a.length !== b.length || a.length === 0) return 0;
|
|
276
|
+
let dot = 0;
|
|
277
|
+
let normA = 0;
|
|
278
|
+
let normB = 0;
|
|
279
|
+
for (let i = 0; i < a.length; i += 1) {
|
|
280
|
+
const x = a[i];
|
|
281
|
+
const y = b[i];
|
|
282
|
+
if (typeof x !== 'number' || typeof y !== 'number') return 0;
|
|
283
|
+
dot += x * y;
|
|
284
|
+
normA += x * x;
|
|
285
|
+
normB += y * y;
|
|
286
|
+
}
|
|
287
|
+
if (normA === 0 || normB === 0) return 0;
|
|
288
|
+
return dot / (Math.sqrt(normA) * Math.sqrt(normB));
|
|
289
|
+
}
|
|
290
|
+
|
|
291
|
+
// ---------- Exports ----------
|
|
292
|
+
|
|
293
|
+
module.exports = {
|
|
294
|
+
queryPineconeWithVectors: queryPineconeWithVectors,
|
|
295
|
+
cosineSimilarity: cosineSimilarity,
|
|
296
|
+
_test: {
|
|
297
|
+
PYTHON_BIN: PYTHON_BIN,
|
|
298
|
+
BRIDGE_TIMEOUT_MS: BRIDGE_TIMEOUT_MS,
|
|
299
|
+
DEFAULT_LIMIT: DEFAULT_LIMIT,
|
|
300
|
+
REPO_ROOT: REPO_ROOT,
|
|
301
|
+
bridgeScript: bridgeScript,
|
|
302
|
+
},
|
|
303
|
+
};
|
|
@@ -0,0 +1,350 @@
|
|
|
1
|
+
/*
|
|
2
|
+
* Copyright (c) 2026 Mindrian. BSL 1.1.
|
|
3
|
+
* Phase 89.2 Plan 06 Task 2 -- Phase 2 deterministic preprocessor.
|
|
4
|
+
*
|
|
5
|
+
* Per-document deterministic processor that produces the canonical 5-field
|
|
6
|
+
* preprocessed shape from raw fetcher output (papers + patents + signals
|
|
7
|
+
* all flow through the same preprocessor with source-aware extraction):
|
|
8
|
+
*
|
|
9
|
+
* {
|
|
10
|
+
* document_id : string (copy of input.id for traceability)
|
|
11
|
+
* technical_terms : string[] (top-N from deterministic n-gram + stopword filter)
|
|
12
|
+
* concepts : string[] (intersection with domain_analysis.concepts)
|
|
13
|
+
* methods : string[] (deterministic verb-phrase patterns)
|
|
14
|
+
* relevance_score : number in [0,1] (concept overlap ratio)
|
|
15
|
+
* boundary_flag : boolean (relevance < 0.5 OR zero concept overlap)
|
|
16
|
+
* }
|
|
17
|
+
*
|
|
18
|
+
* Determinism contract: same documents + same opts -> byte-identical output.
|
|
19
|
+
* No Math.random, no Date.now, no LLM call. The preprocessor is the
|
|
20
|
+
* deterministic bridge between Wave 2 fetchers (Plans 89.2-02 / 03 / 04)
|
|
21
|
+
* and Wave 3 differential scorer (Task 3 of this plan). It produces the
|
|
22
|
+
* concept[] field that the differential scorer consumes pair-wise.
|
|
23
|
+
*
|
|
24
|
+
* Canon Part 7 (Reuse Before Build): consumes domain_analysis from
|
|
25
|
+
* lib/core/rs-domain-analyzer.cjs (89.1) for concept extraction. May
|
|
26
|
+
* also consume substrate metadata via lib/core/rs-brain-substrate.cjs
|
|
27
|
+
* (89.1a) for boundary_flag heuristic refinement -- the relevance_score
|
|
28
|
+
* derived from domain_analysis IS the boundary signal in v1.11.0.
|
|
29
|
+
*
|
|
30
|
+
* Canon Part 8 (Graph Boundary): two defense-in-depth layers.
|
|
31
|
+
*
|
|
32
|
+
* Layer 1 -- pre-input scan: domain_analysis fields are scanned for
|
|
33
|
+
* FORBIDDEN_PATTERNS before any extraction logic runs. On hit, the
|
|
34
|
+
* preprocessor returns a structured envelope {error, reason} so the
|
|
35
|
+
* caller knows the upstream component leaked and can repair before
|
|
36
|
+
* downstream surfaces (the differential scorer + classifier + thesis
|
|
37
|
+
* generator all flow downstream from preprocessor output).
|
|
38
|
+
*
|
|
39
|
+
* Layer 2 -- pre-return audit: the composite preprocessed[] output is
|
|
40
|
+
* scanned via auditQueryObject before return. Throws
|
|
41
|
+
* ExternalEgressViolation on any FORBIDDEN_PATTERNS hit. Defense-in-
|
|
42
|
+
* depth so adversarial document.abstract / document.title content
|
|
43
|
+
* that leaks through extraction is caught at the gate before the
|
|
44
|
+
* differential scorer sees it.
|
|
45
|
+
*
|
|
46
|
+
* NEVER throws on operational failure (empty input, missing fields, etc.).
|
|
47
|
+
* ONLY throws ExternalEgressViolation on Canon Part 8 boundary breach.
|
|
48
|
+
*
|
|
49
|
+
* Pure CJS, zero npm deps, node built-ins only.
|
|
50
|
+
*/
|
|
51
|
+
'use strict';
|
|
52
|
+
|
|
53
|
+
const { auditQueryObject } = require('./rs-egress-prompts.cjs');
|
|
54
|
+
const crossRoomAggregator = require('./cross-room-aggregator.cjs');
|
|
55
|
+
// rs-egress-violations is required transitively by rs-egress-prompts; we do
|
|
56
|
+
// not throw ExternalEgressViolation directly from this module (auditQueryObject
|
|
57
|
+
// does). The require below is a reachability witness for the audit chain.
|
|
58
|
+
require('./rs-egress-violations.cjs');
|
|
59
|
+
|
|
60
|
+
const FORBIDDEN_PATTERNS = crossRoomAggregator.FORBIDDEN_PATTERNS;
|
|
61
|
+
if (!Array.isArray(FORBIDDEN_PATTERNS) || FORBIDDEN_PATTERNS.length < 6) {
|
|
62
|
+
throw new Error(
|
|
63
|
+
'rs-preprocessor: FORBIDDEN_PATTERNS re-export failed; ' +
|
|
64
|
+
'Canon Part 8 drift risk (expected >= 6 patterns from cross-room-aggregator)'
|
|
65
|
+
);
|
|
66
|
+
}
|
|
67
|
+
|
|
68
|
+
// ---------- Constants ----------
|
|
69
|
+
|
|
70
|
+
const TECHNICAL_TERMS_MAX = 20;
|
|
71
|
+
const CONCEPTS_MAX = 10;
|
|
72
|
+
const METHODS_MAX = 5;
|
|
73
|
+
const BOUNDARY_THRESHOLD = 0.5;
|
|
74
|
+
const TEXT_MAX_LEN = 100000; // 100KB cap on per-document text scan
|
|
75
|
+
|
|
76
|
+
// English stopwords (mirror rs-domain-analyzer.cjs STOPWORDS set; frozen).
|
|
77
|
+
const STOPWORDS = Object.freeze(new Set([
|
|
78
|
+
'a', 'an', 'and', 'are', 'as', 'at', 'be', 'by', 'for', 'from',
|
|
79
|
+
'has', 'have', 'in', 'is', 'it', 'its', 'of', 'on', 'or', 'that',
|
|
80
|
+
'the', 'this', 'to', 'was', 'were', 'will', 'with',
|
|
81
|
+
'i', 'you', 'we', 'they', 'he', 'she', 'our', 'their',
|
|
82
|
+
'about', 'above', 'after', 'again', 'all', 'also', 'any', 'been',
|
|
83
|
+
'before', 'between', 'both', 'but', 'can', 'did', 'do', 'does',
|
|
84
|
+
'into', 'just', 'more', 'most', 'no', 'not', 'now', 'only',
|
|
85
|
+
'over', 'own', 'same', 'so', 'some', 'such', 'than', 'then',
|
|
86
|
+
'there', 'these', 'those', 'through', 'under', 'up', 'very',
|
|
87
|
+
'what', 'when', 'where', 'which', 'who', 'why', 'how',
|
|
88
|
+
'while', 'because', 'against', 'last', 'week', 'held', 'results',
|
|
89
|
+
]));
|
|
90
|
+
|
|
91
|
+
// Technical-term regex: lowercase alphanumeric tokens 4-20 chars, optionally hyphenated.
|
|
92
|
+
const TECHNICAL_TERM_REGEX = /\b[a-z][a-z0-9]{3,19}(?:-[a-z0-9]{1,15})?\b/gi;
|
|
93
|
+
|
|
94
|
+
// Method-verb regex: deterministic verb-phrase capture.
|
|
95
|
+
const METHOD_REGEX = /\b(applied|used|tested|measured|computed|calculated|analyzed|developed|implemented|proposed|designed)\s+([a-z][a-z0-9 -]{2,30})\b/gi;
|
|
96
|
+
|
|
97
|
+
// ---------- preInputScan ----------
|
|
98
|
+
//
|
|
99
|
+
// Scans every string field of the domain_analysis input against
|
|
100
|
+
// FORBIDDEN_PATTERNS. Returns true if any field hits a forbidden pattern.
|
|
101
|
+
|
|
102
|
+
function preInputScan(da) {
|
|
103
|
+
if (!da || typeof da !== 'object') return false;
|
|
104
|
+
for (const key of Object.keys(da)) {
|
|
105
|
+
const v = da[key];
|
|
106
|
+
if (typeof v === 'string') {
|
|
107
|
+
for (const re of FORBIDDEN_PATTERNS) {
|
|
108
|
+
if (re.test(v)) return true;
|
|
109
|
+
}
|
|
110
|
+
} else if (Array.isArray(v)) {
|
|
111
|
+
for (const item of v) {
|
|
112
|
+
if (typeof item === 'string') {
|
|
113
|
+
for (const re of FORBIDDEN_PATTERNS) {
|
|
114
|
+
if (re.test(item)) return true;
|
|
115
|
+
}
|
|
116
|
+
}
|
|
117
|
+
}
|
|
118
|
+
}
|
|
119
|
+
}
|
|
120
|
+
return false;
|
|
121
|
+
}
|
|
122
|
+
|
|
123
|
+
// ---------- tokenize ----------
|
|
124
|
+
//
|
|
125
|
+
// Lowercase, alpha+digit only, length >= 3, stopwords stripped.
|
|
126
|
+
// Deterministic.
|
|
127
|
+
|
|
128
|
+
function tokenize(s) {
|
|
129
|
+
if (typeof s !== 'string') return [];
|
|
130
|
+
const truncated = s.length > TEXT_MAX_LEN ? s.slice(0, TEXT_MAX_LEN) : s;
|
|
131
|
+
return truncated.toLowerCase()
|
|
132
|
+
.replace(/[^a-z0-9\s_-]/g, ' ')
|
|
133
|
+
.split(/\s+/)
|
|
134
|
+
.filter(function (t) { return t.length >= 3 && !STOPWORDS.has(t); });
|
|
135
|
+
}
|
|
136
|
+
|
|
137
|
+
// ---------- extractTechnicalTerms ----------
|
|
138
|
+
//
|
|
139
|
+
// Extract technical terms from text via TECHNICAL_TERM_REGEX. Lowercase,
|
|
140
|
+
// dedupe, filter stopwords, count by frequency, sort by count desc + alpha,
|
|
141
|
+
// take top TECHNICAL_TERMS_MAX. Determinism anchor: when counts tie, alpha
|
|
142
|
+
// sort breaks ties so output is byte-stable.
|
|
143
|
+
|
|
144
|
+
function extractTechnicalTerms(text) {
|
|
145
|
+
if (typeof text !== 'string' || text.length === 0) return [];
|
|
146
|
+
const truncated = text.length > TEXT_MAX_LEN ? text.slice(0, TEXT_MAX_LEN) : text;
|
|
147
|
+
const matches = truncated.toLowerCase().match(TECHNICAL_TERM_REGEX) || [];
|
|
148
|
+
const counts = new Map();
|
|
149
|
+
for (const m of matches) {
|
|
150
|
+
const t = m.trim();
|
|
151
|
+
if (t.length < 4 || STOPWORDS.has(t)) continue;
|
|
152
|
+
counts.set(t, (counts.get(t) || 0) + 1);
|
|
153
|
+
}
|
|
154
|
+
const arr = [];
|
|
155
|
+
for (const [term, count] of counts.entries()) {
|
|
156
|
+
arr.push({ term: term, count: count });
|
|
157
|
+
}
|
|
158
|
+
arr.sort(function (a, b) {
|
|
159
|
+
if (b.count !== a.count) return b.count - a.count;
|
|
160
|
+
return a.term < b.term ? -1 : (a.term > b.term ? 1 : 0);
|
|
161
|
+
});
|
|
162
|
+
return arr.slice(0, TECHNICAL_TERMS_MAX).map(function (e) { return e.term; });
|
|
163
|
+
}
|
|
164
|
+
|
|
165
|
+
// ---------- extractConcepts ----------
|
|
166
|
+
//
|
|
167
|
+
// Intersection of text tokens with domain_analysis.concepts. Deterministic.
|
|
168
|
+
// Capped at CONCEPTS_MAX. Order: domain_analysis.concepts iteration order.
|
|
169
|
+
|
|
170
|
+
function extractConcepts(text, da) {
|
|
171
|
+
if (!da || !Array.isArray(da.concepts) || da.concepts.length === 0) return [];
|
|
172
|
+
if (typeof text !== 'string' || text.length === 0) return [];
|
|
173
|
+
const tokens = new Set(tokenize(text));
|
|
174
|
+
const out = [];
|
|
175
|
+
const seen = new Set();
|
|
176
|
+
for (const c of da.concepts) {
|
|
177
|
+
if (typeof c !== 'string') continue;
|
|
178
|
+
const cl = c.toLowerCase();
|
|
179
|
+
if (seen.has(cl)) continue;
|
|
180
|
+
if (tokens.has(cl)) {
|
|
181
|
+
seen.add(cl);
|
|
182
|
+
out.push(cl);
|
|
183
|
+
if (out.length >= CONCEPTS_MAX) break;
|
|
184
|
+
}
|
|
185
|
+
}
|
|
186
|
+
return out;
|
|
187
|
+
}
|
|
188
|
+
|
|
189
|
+
// ---------- extractMethods ----------
|
|
190
|
+
//
|
|
191
|
+
// Deterministic verb-phrase capture via METHOD_REGEX. Take match group 2,
|
|
192
|
+
// trim, lowercase, dedupe, cap at METHODS_MAX.
|
|
193
|
+
|
|
194
|
+
function extractMethods(text) {
|
|
195
|
+
if (typeof text !== 'string' || text.length === 0) return [];
|
|
196
|
+
const truncated = text.length > TEXT_MAX_LEN ? text.slice(0, TEXT_MAX_LEN) : text;
|
|
197
|
+
const out = [];
|
|
198
|
+
const seen = new Set();
|
|
199
|
+
let match;
|
|
200
|
+
// Reset regex stateful position for safety.
|
|
201
|
+
METHOD_REGEX.lastIndex = 0;
|
|
202
|
+
while ((match = METHOD_REGEX.exec(truncated)) !== null) {
|
|
203
|
+
const phrase = (match[2] || '').trim().toLowerCase();
|
|
204
|
+
if (phrase.length === 0) continue;
|
|
205
|
+
if (seen.has(phrase)) continue;
|
|
206
|
+
seen.add(phrase);
|
|
207
|
+
out.push(phrase);
|
|
208
|
+
if (out.length >= METHODS_MAX) break;
|
|
209
|
+
}
|
|
210
|
+
return out;
|
|
211
|
+
}
|
|
212
|
+
|
|
213
|
+
// ---------- computeRelevance ----------
|
|
214
|
+
//
|
|
215
|
+
// Concept-overlap ratio (concepts found in text / total domain_analysis.concepts).
|
|
216
|
+
// Bounded [0,1]. Deterministic.
|
|
217
|
+
|
|
218
|
+
function computeRelevance(text, da) {
|
|
219
|
+
if (!da || !Array.isArray(da.concepts) || da.concepts.length === 0) return 0;
|
|
220
|
+
if (typeof text !== 'string' || text.length === 0) return 0;
|
|
221
|
+
const overlap = extractConcepts(text, da).length;
|
|
222
|
+
const ratio = overlap / da.concepts.length;
|
|
223
|
+
return Math.max(0, Math.min(1, ratio));
|
|
224
|
+
}
|
|
225
|
+
|
|
226
|
+
// ---------- computeBoundaryFlag ----------
|
|
227
|
+
//
|
|
228
|
+
// True if relevance below threshold OR zero concept overlap. The boundary
|
|
229
|
+
// flag tells the differential scorer (and classifier downstream) that this
|
|
230
|
+
// document is on the edge of the user's substrate; cross-domain analogies
|
|
231
|
+
// surface most strongly when at least one side is boundary-flagged.
|
|
232
|
+
|
|
233
|
+
function computeBoundaryFlag(relevance, concepts) {
|
|
234
|
+
if (typeof relevance !== 'number' || isNaN(relevance)) return true;
|
|
235
|
+
if (!Array.isArray(concepts) || concepts.length === 0) return true;
|
|
236
|
+
return relevance < BOUNDARY_THRESHOLD;
|
|
237
|
+
}
|
|
238
|
+
|
|
239
|
+
// ---------- preprocess ----------
|
|
240
|
+
//
|
|
241
|
+
// Public entry point. Takes raw fetcher output (papers + patents + signals)
|
|
242
|
+
// and produces deterministic per-document preprocessed records.
|
|
243
|
+
//
|
|
244
|
+
// Inputs:
|
|
245
|
+
// documents Array<{id, abstract?, signal?, title?, source?, ...}>
|
|
246
|
+
// opts optional object:
|
|
247
|
+
// domain_analysis {primary_domain, concepts[], terminology[], methods[]}
|
|
248
|
+
// from lib/core/rs-domain-analyzer.cjs
|
|
249
|
+
//
|
|
250
|
+
// Output (happy path):
|
|
251
|
+
// Array<{document_id, technical_terms[], concepts[], methods[],
|
|
252
|
+
// relevance_score, boundary_flag, warning?}>
|
|
253
|
+
//
|
|
254
|
+
// Output (Canon Part 8 input rejection):
|
|
255
|
+
// {error: 'invalid_input', reason: 'forbidden_input'}
|
|
256
|
+
//
|
|
257
|
+
// Throws:
|
|
258
|
+
// ExternalEgressViolation if composite output contains FORBIDDEN_PATTERNS
|
|
259
|
+
// (intentional Canon Part 8 escape route).
|
|
260
|
+
|
|
261
|
+
function preprocess(documents, opts) {
|
|
262
|
+
if (!Array.isArray(documents)) return [];
|
|
263
|
+
if (documents.length === 0) return [];
|
|
264
|
+
|
|
265
|
+
opts = opts || {};
|
|
266
|
+
const domain_analysis = opts.domain_analysis || { concepts: [], terminology: [], methods: [] };
|
|
267
|
+
|
|
268
|
+
// Canon Part 8 Layer 1: pre-input scan on domain_analysis.
|
|
269
|
+
if (preInputScan(domain_analysis)) {
|
|
270
|
+
return { error: 'invalid_input', reason: 'forbidden_input' };
|
|
271
|
+
}
|
|
272
|
+
|
|
273
|
+
const out = [];
|
|
274
|
+
for (const doc of documents) {
|
|
275
|
+
if (!doc || typeof doc !== 'object') continue;
|
|
276
|
+
const document_id = (typeof doc.id === 'string') ? doc.id : '';
|
|
277
|
+
// Source-aware text extraction. Papers + patents have abstract; signals
|
|
278
|
+
// have signal. Title is fallback. All flow through the same preprocessing.
|
|
279
|
+
let text = '';
|
|
280
|
+
if (typeof doc.abstract === 'string' && doc.abstract.length > 0) {
|
|
281
|
+
text = doc.abstract;
|
|
282
|
+
} else if (typeof doc.signal === 'string' && doc.signal.length > 0) {
|
|
283
|
+
text = doc.signal;
|
|
284
|
+
} else if (typeof doc.title === 'string' && doc.title.length > 0) {
|
|
285
|
+
text = doc.title;
|
|
286
|
+
}
|
|
287
|
+
|
|
288
|
+
if (text.length === 0) {
|
|
289
|
+
out.push({
|
|
290
|
+
document_id: document_id,
|
|
291
|
+
technical_terms: [],
|
|
292
|
+
concepts: [],
|
|
293
|
+
methods: [],
|
|
294
|
+
relevance_score: 0,
|
|
295
|
+
boundary_flag: true,
|
|
296
|
+
warning: 'document_text_missing',
|
|
297
|
+
});
|
|
298
|
+
continue;
|
|
299
|
+
}
|
|
300
|
+
|
|
301
|
+
// Title is included in the technical-term + concept extraction surface
|
|
302
|
+
// when present, so adversarial title content (Test 9) flows through the
|
|
303
|
+
// pre-return audit and gets caught.
|
|
304
|
+
const composite = (typeof doc.title === 'string' ? doc.title + ' ' : '') + text;
|
|
305
|
+
|
|
306
|
+
const technical_terms = extractTechnicalTerms(composite);
|
|
307
|
+
const concepts = extractConcepts(composite, domain_analysis);
|
|
308
|
+
const methods = extractMethods(composite);
|
|
309
|
+
const relevance_score = computeRelevance(composite, domain_analysis);
|
|
310
|
+
const boundary_flag = computeBoundaryFlag(relevance_score, concepts);
|
|
311
|
+
|
|
312
|
+
out.push({
|
|
313
|
+
document_id: document_id,
|
|
314
|
+
technical_terms: technical_terms,
|
|
315
|
+
concepts: concepts,
|
|
316
|
+
methods: methods,
|
|
317
|
+
relevance_score: relevance_score,
|
|
318
|
+
boundary_flag: boundary_flag,
|
|
319
|
+
});
|
|
320
|
+
}
|
|
321
|
+
|
|
322
|
+
// Canon Part 8 Layer 2: pre-return audit. Throws ExternalEgressViolation
|
|
323
|
+
// on any FORBIDDEN_PATTERNS hit in the composite preprocessed[] output.
|
|
324
|
+
// This is the intentional escape route from preprocess().
|
|
325
|
+
auditQueryObject(out, 'preprocessor');
|
|
326
|
+
|
|
327
|
+
return out;
|
|
328
|
+
}
|
|
329
|
+
|
|
330
|
+
// ---------- Exports ----------
|
|
331
|
+
|
|
332
|
+
module.exports = {
|
|
333
|
+
preprocess: preprocess,
|
|
334
|
+
_test: {
|
|
335
|
+
extractTechnicalTerms: extractTechnicalTerms,
|
|
336
|
+
extractConcepts: extractConcepts,
|
|
337
|
+
extractMethods: extractMethods,
|
|
338
|
+
computeRelevance: computeRelevance,
|
|
339
|
+
computeBoundaryFlag: computeBoundaryFlag,
|
|
340
|
+
tokenize: tokenize,
|
|
341
|
+
preInputScan: preInputScan,
|
|
342
|
+
TECHNICAL_TERM_REGEX: TECHNICAL_TERM_REGEX,
|
|
343
|
+
METHOD_REGEX: METHOD_REGEX,
|
|
344
|
+
STOPWORDS: STOPWORDS,
|
|
345
|
+
TECHNICAL_TERMS_MAX: TECHNICAL_TERMS_MAX,
|
|
346
|
+
CONCEPTS_MAX: CONCEPTS_MAX,
|
|
347
|
+
METHODS_MAX: METHODS_MAX,
|
|
348
|
+
BOUNDARY_THRESHOLD: BOUNDARY_THRESHOLD,
|
|
349
|
+
},
|
|
350
|
+
};
|