npm - feed-the-machine - Versions diffs - 1.6.0 → 1.7.0 - Mend

feed-the-machine 1.6.0 → 1.7.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (269) hide show

package/LICENSE +21 -21
package/README.md +170 -170
package/bin/brain.py +1340 -0
package/bin/convert_claude_skills_to_codex.py +490 -0
package/bin/generate-manifest.mjs +463 -463
package/bin/harden_codex_skills.py +141 -0
package/bin/install.mjs +491 -491
package/bin/migrate-eng-buddy-data.py +875 -0
package/bin/playbook_engine/__init__.py +1 -0
package/bin/playbook_engine/conftest.py +8 -0
package/bin/playbook_engine/extractor.py +33 -0
package/bin/playbook_engine/manager.py +102 -0
package/bin/playbook_engine/models.py +84 -0
package/bin/playbook_engine/registry.py +35 -0
package/bin/playbook_engine/test_extractor.py +72 -0
package/bin/playbook_engine/test_integration.py +129 -0
package/bin/playbook_engine/test_manager.py +85 -0
package/bin/playbook_engine/test_models.py +166 -0
package/bin/playbook_engine/test_registry.py +67 -0
package/bin/playbook_engine/test_tracer.py +86 -0
package/bin/playbook_engine/tracer.py +93 -0
package/bin/tasks_db.py +456 -0
package/docs/HOOKS.md +243 -243
package/docs/INBOX.md +233 -233
package/ftm/SKILL.md +125 -122
package/ftm-audit/SKILL.md +623 -623
package/ftm-audit/references/protocols/PROJECT-PATTERNS.md +91 -91
package/ftm-audit/references/protocols/RUNTIME-WIRING.md +66 -66
package/ftm-audit/references/protocols/WIRING-CONTRACTS.md +135 -135
package/ftm-audit/references/strategies/AUTO-FIX-STRATEGIES.md +69 -69
package/ftm-audit/references/templates/REPORT-FORMAT.md +96 -96
package/ftm-audit/scripts/run-knip.sh +23 -23
package/ftm-audit.yml +2 -2
package/ftm-brainstorm/SKILL.md +1003 -498
package/ftm-brainstorm/evals/evals.json +180 -100
package/ftm-brainstorm/evals/promptfoo.yaml +109 -109
package/ftm-brainstorm/references/agent-prompts.md +552 -224
package/ftm-brainstorm/references/plan-template.md +209 -121
package/ftm-brainstorm.yml +2 -2
package/ftm-browse/SKILL.md +454 -454
package/ftm-browse/daemon/browser-manager.ts +206 -206
package/ftm-browse/daemon/bun.lock +30 -30
package/ftm-browse/daemon/cli.ts +347 -347
package/ftm-browse/daemon/commands.ts +410 -410
package/ftm-browse/daemon/main.ts +357 -357
package/ftm-browse/daemon/package.json +17 -17
package/ftm-browse/daemon/server.ts +189 -189
package/ftm-browse/daemon/snapshot.ts +519 -519
package/ftm-browse/daemon/tsconfig.json +22 -22
package/ftm-browse.yml +4 -4
package/ftm-capture/SKILL.md +370 -370
package/ftm-capture.yml +4 -4
package/ftm-codex-gate/SKILL.md +361 -361
package/ftm-codex-gate.yml +2 -2
package/ftm-config/SKILL.md +422 -345
package/ftm-config.default.yml +125 -82
package/ftm-config.yml +44 -2
package/ftm-council/SKILL.md +416 -416
package/ftm-council/references/prompts/CLAUDE-INVESTIGATION.md +60 -60
package/ftm-council/references/prompts/CODEX-INVESTIGATION.md +58 -58
package/ftm-council/references/prompts/GEMINI-INVESTIGATION.md +58 -58
package/ftm-council/references/prompts/REBUTTAL-TEMPLATE.md +57 -57
package/ftm-council/references/protocols/PREREQUISITES.md +47 -47
package/ftm-council/references/protocols/STEP-0-FRAMING.md +46 -46
package/ftm-council.yml +2 -2
package/ftm-dashboard/SKILL.md +163 -163
package/ftm-dashboard.yml +4 -4
package/ftm-debug/SKILL.md +1037 -1037
package/ftm-debug/references/phases/PHASE-0-INTAKE.md +58 -58
package/ftm-debug/references/phases/PHASE-1-TRIAGE.md +46 -46
package/ftm-debug/references/phases/PHASE-2-WAR-ROOM-AGENTS.md +279 -279
package/ftm-debug/references/phases/PHASE-3-TO-6-EXECUTION.md +436 -436
package/ftm-debug/references/protocols/BLACKBOARD.md +86 -86
package/ftm-debug/references/protocols/EDGE-CASES.md +103 -103
package/ftm-debug.yml +2 -2
package/ftm-diagram/SKILL.md +277 -277
package/ftm-diagram.yml +2 -2
package/ftm-executor/SKILL.md +777 -777
package/ftm-executor/references/STYLE-TEMPLATE.md +73 -73
package/ftm-executor/references/phases/PHASE-0-VERIFICATION.md +62 -62
package/ftm-executor/references/phases/PHASE-2-AGENT-ASSEMBLY.md +34 -34
package/ftm-executor/references/phases/PHASE-3-WORKTREES.md +38 -38
package/ftm-executor/references/phases/PHASE-4-5-AUDIT.md +72 -72
package/ftm-executor/references/phases/PHASE-4-DISPATCH.md +66 -66
package/ftm-executor/references/phases/PHASE-5-5-CODEX-GATE.md +73 -73
package/ftm-executor/references/protocols/DOCUMENTATION-BOOTSTRAP.md +36 -36
package/ftm-executor/references/protocols/MODEL-PROFILE.md +59 -59
package/ftm-executor/references/protocols/PROGRESS-TRACKING.md +66 -66
package/ftm-executor/runtime/ftm-runtime.mjs +252 -252
package/ftm-executor/runtime/package.json +8 -8
package/ftm-executor.yml +2 -2
package/ftm-git/SKILL.md +441 -441
package/ftm-git/evals/evals.json +26 -26
package/ftm-git/evals/promptfoo.yaml +75 -75
package/ftm-git/hooks/post-commit-experience.sh +92 -92
package/ftm-git/references/patterns/SECRET-PATTERNS.md +104 -104
package/ftm-git/references/protocols/REMEDIATION.md +139 -139
package/ftm-git/scripts/pre-commit-secrets.sh +110 -110
package/ftm-git.yml +2 -2
package/ftm-inbox/backend/__pycache__/main.cpython-314.pyc +0 -0
package/ftm-inbox/backend/adapters/_retry.py +64 -64
package/ftm-inbox/backend/adapters/base.py +230 -230
package/ftm-inbox/backend/adapters/freshservice.py +104 -104
package/ftm-inbox/backend/adapters/gmail.py +125 -125
package/ftm-inbox/backend/adapters/jira.py +136 -136
package/ftm-inbox/backend/adapters/registry.py +192 -192
package/ftm-inbox/backend/adapters/slack.py +110 -110
package/ftm-inbox/backend/db/connection.py +54 -54
package/ftm-inbox/backend/db/schema.py +78 -78
package/ftm-inbox/backend/executor/__init__.py +7 -7
package/ftm-inbox/backend/executor/engine.py +149 -149
package/ftm-inbox/backend/executor/step_runner.py +98 -98
package/ftm-inbox/backend/main.py +103 -103
package/ftm-inbox/backend/models/__init__.py +1 -1
package/ftm-inbox/backend/models/unified_task.py +36 -36
package/ftm-inbox/backend/planner/__init__.py +6 -6
package/ftm-inbox/backend/planner/__pycache__/__init__.cpython-314.pyc +0 -0
package/ftm-inbox/backend/planner/__pycache__/generator.cpython-314.pyc +0 -0
package/ftm-inbox/backend/planner/__pycache__/schema.cpython-314.pyc +0 -0
package/ftm-inbox/backend/planner/generator.py +127 -127
package/ftm-inbox/backend/planner/schema.py +34 -34
package/ftm-inbox/backend/requirements.txt +5 -5
package/ftm-inbox/backend/routes/__pycache__/plan.cpython-314.pyc +0 -0
package/ftm-inbox/backend/routes/execute.py +186 -186
package/ftm-inbox/backend/routes/health.py +52 -52
package/ftm-inbox/backend/routes/inbox.py +68 -68
package/ftm-inbox/backend/routes/plan.py +271 -271
package/ftm-inbox/bin/launchagent.mjs +91 -91
package/ftm-inbox/bin/setup.mjs +188 -188
package/ftm-inbox/bin/start.sh +10 -10
package/ftm-inbox/bin/status.sh +17 -17
package/ftm-inbox/bin/stop.sh +8 -8
package/ftm-inbox/config.example.yml +55 -55
package/ftm-inbox/package-lock.json +2898 -2898
package/ftm-inbox/package.json +26 -26
package/ftm-inbox/postcss.config.js +6 -6
package/ftm-inbox/src/app.css +199 -199
package/ftm-inbox/src/app.html +18 -18
package/ftm-inbox/src/lib/api.ts +166 -166
package/ftm-inbox/src/lib/components/ExecutionLog.svelte +81 -81
package/ftm-inbox/src/lib/components/InboxFeed.svelte +143 -143
package/ftm-inbox/src/lib/components/PlanStep.svelte +271 -271
package/ftm-inbox/src/lib/components/PlanView.svelte +206 -206
package/ftm-inbox/src/lib/components/StreamPanel.svelte +99 -99
package/ftm-inbox/src/lib/components/TaskCard.svelte +190 -190
package/ftm-inbox/src/lib/components/ui/EmptyState.svelte +63 -63
package/ftm-inbox/src/lib/components/ui/KawaiiCard.svelte +86 -86
package/ftm-inbox/src/lib/components/ui/PillButton.svelte +106 -106
package/ftm-inbox/src/lib/components/ui/StatusBadge.svelte +67 -67
package/ftm-inbox/src/lib/components/ui/StreamDrawer.svelte +149 -149
package/ftm-inbox/src/lib/components/ui/ThemeToggle.svelte +80 -80
package/ftm-inbox/src/lib/theme.ts +47 -47
package/ftm-inbox/src/routes/+layout.svelte +76 -76
package/ftm-inbox/src/routes/+page.svelte +401 -401
package/ftm-inbox/svelte.config.js +12 -12
package/ftm-inbox/tailwind.config.ts +63 -63
package/ftm-inbox/tsconfig.json +13 -13
package/ftm-inbox/vite.config.ts +6 -6
package/ftm-intent/SKILL.md +241 -241
package/ftm-intent.yml +2 -2
package/ftm-manifest.json +3794 -3794
package/ftm-map/SKILL.md +291 -291
package/ftm-map/scripts/db.py +712 -712
package/ftm-map/scripts/index.py +415 -415
package/ftm-map/scripts/parser.py +224 -224
package/ftm-map/scripts/queries/go-tags.scm +20 -20
package/ftm-map/scripts/queries/javascript-tags.scm +35 -35
package/ftm-map/scripts/queries/python-tags.scm +31 -31
package/ftm-map/scripts/queries/ruby-tags.scm +19 -19
package/ftm-map/scripts/queries/rust-tags.scm +37 -37
package/ftm-map/scripts/queries/typescript-tags.scm +41 -41
package/ftm-map/scripts/query.py +301 -301
package/ftm-map/scripts/ranker.py +377 -377
package/ftm-map/scripts/requirements.txt +5 -5
package/ftm-map/scripts/setup-hooks.sh +27 -27
package/ftm-map/scripts/setup.sh +56 -56
package/ftm-map/scripts/test_db.py +364 -364
package/ftm-map/scripts/test_parser.py +174 -174
package/ftm-map/scripts/test_query.py +183 -183
package/ftm-map/scripts/test_ranker.py +199 -199
package/ftm-map/scripts/views.py +591 -591
package/ftm-map.yml +2 -2
package/ftm-mind/SKILL.md +201 -1943
package/ftm-mind/evals/promptfoo.yaml +142 -142
package/ftm-mind/references/blackboard-protocol.md +110 -0
package/ftm-mind/references/blackboard-schema.md +328 -328
package/ftm-mind/references/complexity-guide.md +110 -110
package/ftm-mind/references/complexity-sizing.md +138 -0
package/ftm-mind/references/decide-act-protocol.md +172 -0
package/ftm-mind/references/direct-execution.md +51 -0
package/ftm-mind/references/environment-discovery.md +77 -0
package/ftm-mind/references/event-registry.md +319 -319
package/ftm-mind/references/mcp-inventory.md +300 -296
package/ftm-mind/references/ops-routing.md +47 -0
package/ftm-mind/references/orient-protocol.md +234 -0
package/ftm-mind/references/personality.md +40 -0
package/ftm-mind/references/protocols/COMPLEXITY-SIZING.md +72 -72
package/ftm-mind/references/protocols/MCP-HEURISTICS.md +32 -32
package/ftm-mind/references/protocols/PLAN-APPROVAL.md +80 -80
package/ftm-mind/references/reflexion-protocol.md +249 -249
package/ftm-mind/references/routing/SCENARIOS.md +22 -22
package/ftm-mind/references/routing-scenarios.md +35 -35
package/ftm-mind.yml +2 -2
package/ftm-ops.yml +4 -0
package/ftm-pause/SKILL.md +395 -395
package/ftm-pause/references/protocols/SKILL-RESTORE-PROTOCOLS.md +186 -186
package/ftm-pause/references/protocols/VALIDATION.md +80 -80
package/ftm-pause.yml +2 -2
package/ftm-researcher/SKILL.md +275 -275
package/ftm-researcher/evals/agent-diversity.yaml +17 -17
package/ftm-researcher/evals/synthesis-quality.yaml +12 -12
package/ftm-researcher/evals/trigger-accuracy.yaml +39 -39
package/ftm-researcher/references/adaptive-search.md +116 -116
package/ftm-researcher/references/agent-prompts.md +193 -193
package/ftm-researcher/references/council-integration.md +193 -193
package/ftm-researcher/references/output-format.md +203 -203
package/ftm-researcher/references/synthesis-pipeline.md +165 -165
package/ftm-researcher/scripts/score_credibility.py +234 -234
package/ftm-researcher/scripts/validate_research.py +92 -92
package/ftm-researcher.yml +2 -2
package/ftm-resume/SKILL.md +518 -518
package/ftm-resume/references/protocols/VALIDATION.md +172 -172
package/ftm-resume.yml +2 -2
package/ftm-retro/SKILL.md +380 -380
package/ftm-retro/references/protocols/SCORING-RUBRICS.md +89 -89
package/ftm-retro/references/templates/REPORT-FORMAT.md +109 -109
package/ftm-retro.yml +2 -2
package/ftm-routine/SKILL.md +170 -170
package/ftm-routine.yml +4 -4
package/ftm-state/blackboard/capabilities.json +5 -5
package/ftm-state/blackboard/capabilities.schema.json +27 -27
package/ftm-state/blackboard/context.json +37 -23
package/ftm-state/blackboard/experiences/doom-statusline-fix.json +26 -0
package/ftm-state/blackboard/experiences/hackathon-pages-site.json +26 -0
package/ftm-state/blackboard/experiences/hindsight-sso-kickoff.json +42 -0
package/ftm-state/blackboard/experiences/index.json +58 -9
package/ftm-state/blackboard/experiences/learning-ragnarok-api-access.json +23 -0
package/ftm-state/blackboard/experiences/nordlayer-members-auto-assign.json +26 -0
package/ftm-state/blackboard/experiences/saml2aws-stale-session-fix.json +41 -0
package/ftm-state/blackboard/patterns.json +6 -6
package/ftm-state/schemas/context.schema.json +130 -130
package/ftm-state/schemas/experience-index.schema.json +77 -77
package/ftm-state/schemas/experience.schema.json +78 -78
package/ftm-state/schemas/patterns.schema.json +44 -44
package/ftm-upgrade/SKILL.md +194 -194
package/ftm-upgrade/scripts/check-version.sh +76 -76
package/ftm-upgrade/scripts/upgrade.sh +143 -143
package/ftm-upgrade.yml +2 -2
package/ftm-verify.yml +2 -2
package/ftm.yml +2 -2
package/hooks/ftm-auto-log.sh +137 -0
package/hooks/ftm-blackboard-enforcer.sh +93 -93
package/hooks/ftm-discovery-reminder.sh +90 -90
package/hooks/ftm-drafts-gate.sh +61 -61
package/hooks/ftm-event-logger.mjs +107 -107
package/hooks/ftm-install-hooks.sh +240 -0
package/hooks/ftm-learning-capture.sh +117 -0
package/hooks/ftm-map-autodetect.sh +79 -79
package/hooks/ftm-pending-sync-check.sh +22 -22
package/hooks/ftm-plan-gate.sh +92 -92
package/hooks/ftm-post-commit-trigger.sh +57 -57
package/hooks/ftm-post-compaction.sh +138 -0
package/hooks/ftm-pre-compaction.sh +147 -0
package/hooks/ftm-session-end.sh +52 -0
package/hooks/ftm-session-snapshot.sh +213 -0
package/hooks/settings-template.json +81 -81
package/install.sh +363 -363
package/package.json +84 -84
package/uninstall.sh +25 -25

package/ftm-researcher/scripts/score_credibility.py CHANGED Viewed

@@ -1,234 +1,234 @@
-#!/usr/bin/env python3
-"""
-Source credibility scoring for ftm-researcher findings.
-Scoring dimensions:
-- Source type weight (35%): primary > peer_reviewed > official_docs > news > blog > forum
-- Recency (20%): decay based on age for fast-moving topics
-- Expertise signals (25%): domain authority, author credentials
-- Bias detection (20%): sensationalism penalties, balanced language bonuses
-Additional flags:
-- Corroboration bonus: +0.15 if independently found by 2+ agents from different source types
-- Circular sourcing: flag if multiple sources cite the same original
-"""
-import json
-import sys
-import re
-from datetime import datetime
-from urllib.parse import urlparse
-# Source type base weights
-SOURCE_WEIGHTS = {
-    "primary": 1.0,
-    "peer_reviewed": 0.9,
-    "official_docs": 0.85,
-    "code_repo": 0.8,
-    "qa_site": 0.65,
-    "news": 0.6,
-    "blog": 0.4,
-    "forum": 0.25,
-    "codebase": 0.95,  # local codebase findings are high-trust
-}
-# High-authority domains
-HIGH_AUTHORITY = {
-    "arxiv.org", "nature.com", "science.org", "acm.org", "ieee.org",
-    "github.com", "docs.python.org", "developer.mozilla.org",
-    "platform.openai.com", "docs.anthropic.com", "cloud.google.com",
-    "aws.amazon.com", "learn.microsoft.com",
-}
-MODERATE_AUTHORITY = {
-    "stackoverflow.com", "stackexchange.com", "reddit.com",
-    "news.ycombinator.com", "techcrunch.com", "arstechnica.com",
-    "thenewstack.io", "infoq.com", "dev.to",
-}
-# Sensationalism indicators
-SENSATIONAL_PATTERNS = [
-    r"you won't believe", r"shocking", r"mind-blowing", r"game.?changer",
-    r"revolutionary", r"incredible", r"amazing breakthrough",
-]
-# Balanced language indicators
-BALANCED_PATTERNS = [
-    r"however", r"on the other hand", r"trade-?off", r"limitation",
-    r"caveat", r"although", r"despite", r"conversely",
-]
-def score_source_type(finding: dict) -> float:
-    return SOURCE_WEIGHTS.get(finding.get("source_type", "blog"), 0.4)
-def score_recency(finding: dict, fast_moving: bool = True) -> float:
-    """Score based on source recency. Extracts year from URL or metadata."""
-    url = finding.get("source_url", "")
-    evidence = finding.get("evidence", "")
-    current_year = datetime.now().year
-    # Try to extract year from URL (common in blog/paper URLs)
-    year_match = re.search(r'/(20[12]\d)/', url)
-    if not year_match:
-        # Try evidence text for year mentions
-        year_match = re.search(r'\b(20[12]\d)\b', evidence)
-    if year_match:
-        source_year = int(year_match.group(1))
-        age = current_year - source_year
-        if fast_moving:
-            # Aggressive decay for fast-moving topics (tech, AI, etc.)
-            decay_map = {0: 1.0, 1: 0.85, 2: 0.65, 3: 0.45, 4: 0.30}
-            return decay_map.get(age, 0.2)
-        else:
-            # Gentle decay for stable topics
-            decay_map = {0: 1.0, 1: 0.95, 2: 0.85, 3: 0.75, 4: 0.65, 5: 0.55}
-            return decay_map.get(age, 0.4)
-    # No date info — return neutral
-    return 0.7
-def score_domain_authority(finding: dict) -> float:
-    url = finding.get("source_url", "")
-    if not url:
-        if finding.get("source_type") == "codebase":
-            return 0.95
-        return 0.5
-    try:
-        domain = urlparse(url).netloc.lower()
-        # Strip www.
-        domain = domain.removeprefix("www.")
-    except Exception:
-        return 0.5
-    if domain in HIGH_AUTHORITY:
-        return 0.9
-    if domain in MODERATE_AUTHORITY:
-        return 0.7
-    # Check for .edu, .gov
-    if domain.endswith(".edu") or domain.endswith(".gov"):
-        return 0.85
-    return 0.55
-def score_bias(finding: dict) -> float:
-    text = finding.get("evidence", "") + " " + finding.get("claim", "")
-    text_lower = text.lower()
-    score = 0.7  # baseline
-    # Penalize sensationalism
-    for pattern in SENSATIONAL_PATTERNS:
-        if re.search(pattern, text_lower):
-            score -= 0.1
-    # Bonus for balanced language
-    for pattern in BALANCED_PATTERNS:
-        if re.search(pattern, text_lower):
-            score += 0.05
-    return max(0.1, min(1.0, score))
-def detect_circular_sourcing(findings: list) -> list:
-    """Flag findings where multiple sources trace to the same original."""
-    url_groups = {}
-    for i, f in enumerate(findings):
-        url = f.get("source_url", "")
-        if url:
-            domain = urlparse(url).netloc.lower().removeprefix("www.")
-            claim_key = f.get("claim", "")[:50]
-            key = f"{domain}:{claim_key}"
-            url_groups.setdefault(key, []).append(i)
-    circular_indices = set()
-    for key, indices in url_groups.items():
-        if len(indices) > 1:
-            for idx in indices:
-                circular_indices.add(idx)
-    return list(circular_indices)
-def score_findings(findings: list) -> list:
-    circular = detect_circular_sourcing(findings)
-    # Count agent agreement per claim (simplified: exact claim match)
-    claim_agents = {}
-    for f in findings:
-        claim = f.get("claim", "")
-        agent = f.get("agent_role", "unknown")
-        source_type = f.get("source_type", "")
-        claim_agents.setdefault(claim, {"agents": set(), "source_types": set()})
-        claim_agents[claim]["agents"].add(agent)
-        claim_agents[claim]["source_types"].add(source_type)
-    scored = []
-    for i, f in enumerate(findings):
-        type_score = score_source_type(f)
-        recency_score = score_recency(f)
-        authority_score = score_domain_authority(f)
-        bias_score = score_bias(f)
-        # Weighted composite
-        composite = (
-            type_score * 0.35 +
-            recency_score * 0.20 +
-            authority_score * 0.25 +
-            bias_score * 0.20
-        )
-        # Corroboration bonus
-        claim = f.get("claim", "")
-        if claim in claim_agents:
-            info = claim_agents[claim]
-            if len(info["agents"]) >= 2 and len(info["source_types"]) >= 2:
-                composite += 0.15
-        # Circular sourcing penalty
-        is_circular = i in circular
-        if is_circular:
-            composite -= 0.2
-        composite = max(0.0, min(1.0, composite))
-        scored_finding = {
-            **f,
-            "credibility_score": round(composite, 3),
-            "score_breakdown": {
-                "source_type": round(type_score, 3),
-                "recency": round(recency_score, 3),
-                "domain_authority": round(authority_score, 3),
-                "bias": round(bias_score, 3),
-            },
-            "circular_sourcing": is_circular,
-            "corroborated": claim in claim_agents and len(claim_agents[claim]["agents"]) >= 2,
-            "trust_level": (
-                "high" if composite >= 0.75 else
-                "moderate" if composite >= 0.55 else
-                "low" if composite >= 0.35 else
-                "verify"
-            ),
-        }
-        scored.append(scored_finding)
-    return sorted(scored, key=lambda x: x["credibility_score"], reverse=True)
-def main():
-    if len(sys.argv) < 2:
-        print("Usage: score_credibility.py <findings.json>", file=sys.stderr)
-        sys.exit(1)
-    with open(sys.argv[1]) as f:
-        findings = json.load(f)
-    scored = score_findings(findings)
-    print(json.dumps(scored, indent=2))
-if __name__ == "__main__":
-    main()
+#!/usr/bin/env python3
+"""
+Source credibility scoring for ftm-researcher findings.
+Scoring dimensions:
+- Source type weight (35%): primary > peer_reviewed > official_docs > news > blog > forum
+- Recency (20%): decay based on age for fast-moving topics
+- Expertise signals (25%): domain authority, author credentials
+- Bias detection (20%): sensationalism penalties, balanced language bonuses
+Additional flags:
+- Corroboration bonus: +0.15 if independently found by 2+ agents from different source types
+- Circular sourcing: flag if multiple sources cite the same original
+"""
+import json
+import sys
+import re
+from datetime import datetime
+from urllib.parse import urlparse
+# Source type base weights
+SOURCE_WEIGHTS = {
+    "primary": 1.0,
+    "peer_reviewed": 0.9,
+    "official_docs": 0.85,
+    "code_repo": 0.8,
+    "qa_site": 0.65,
+    "news": 0.6,
+    "blog": 0.4,
+    "forum": 0.25,
+    "codebase": 0.95,  # local codebase findings are high-trust
+}
+# High-authority domains
+HIGH_AUTHORITY = {
+    "arxiv.org", "nature.com", "science.org", "acm.org", "ieee.org",
+    "github.com", "docs.python.org", "developer.mozilla.org",
+    "platform.openai.com", "docs.anthropic.com", "cloud.google.com",
+    "aws.amazon.com", "learn.microsoft.com",
+}
+MODERATE_AUTHORITY = {
+    "stackoverflow.com", "stackexchange.com", "reddit.com",
+    "news.ycombinator.com", "techcrunch.com", "arstechnica.com",
+    "thenewstack.io", "infoq.com", "dev.to",
+}
+# Sensationalism indicators
+SENSATIONAL_PATTERNS = [
+    r"you won't believe", r"shocking", r"mind-blowing", r"game.?changer",
+    r"revolutionary", r"incredible", r"amazing breakthrough",
+]
+# Balanced language indicators
+BALANCED_PATTERNS = [
+    r"however", r"on the other hand", r"trade-?off", r"limitation",
+    r"caveat", r"although", r"despite", r"conversely",
+]
+def score_source_type(finding: dict) -> float:
+    return SOURCE_WEIGHTS.get(finding.get("source_type", "blog"), 0.4)
+def score_recency(finding: dict, fast_moving: bool = True) -> float:
+    """Score based on source recency. Extracts year from URL or metadata."""
+    url = finding.get("source_url", "")
+    evidence = finding.get("evidence", "")
+    current_year = datetime.now().year
+    # Try to extract year from URL (common in blog/paper URLs)
+    year_match = re.search(r'/(20[12]\d)/', url)
+    if not year_match:
+        # Try evidence text for year mentions
+        year_match = re.search(r'\b(20[12]\d)\b', evidence)
+    if year_match:
+        source_year = int(year_match.group(1))
+        age = current_year - source_year
+        if fast_moving:
+            # Aggressive decay for fast-moving topics (tech, AI, etc.)
+            decay_map = {0: 1.0, 1: 0.85, 2: 0.65, 3: 0.45, 4: 0.30}
+            return decay_map.get(age, 0.2)
+        else:
+            # Gentle decay for stable topics
+            decay_map = {0: 1.0, 1: 0.95, 2: 0.85, 3: 0.75, 4: 0.65, 5: 0.55}
+            return decay_map.get(age, 0.4)
+    # No date info — return neutral
+    return 0.7
+def score_domain_authority(finding: dict) -> float:
+    url = finding.get("source_url", "")
+    if not url:
+        if finding.get("source_type") == "codebase":
+            return 0.95
+        return 0.5
+    try:
+        domain = urlparse(url).netloc.lower()
+        # Strip www.
+        domain = domain.removeprefix("www.")
+    except Exception:
+        return 0.5
+    if domain in HIGH_AUTHORITY:
+        return 0.9
+    if domain in MODERATE_AUTHORITY:
+        return 0.7
+    # Check for .edu, .gov
+    if domain.endswith(".edu") or domain.endswith(".gov"):
+        return 0.85
+    return 0.55
+def score_bias(finding: dict) -> float:
+    text = finding.get("evidence", "") + " " + finding.get("claim", "")
+    text_lower = text.lower()
+    score = 0.7  # baseline
+    # Penalize sensationalism
+    for pattern in SENSATIONAL_PATTERNS:
+        if re.search(pattern, text_lower):
+            score -= 0.1
+    # Bonus for balanced language
+    for pattern in BALANCED_PATTERNS:
+        if re.search(pattern, text_lower):
+            score += 0.05
+    return max(0.1, min(1.0, score))
+def detect_circular_sourcing(findings: list) -> list:
+    """Flag findings where multiple sources trace to the same original."""
+    url_groups = {}
+    for i, f in enumerate(findings):
+        url = f.get("source_url", "")
+        if url:
+            domain = urlparse(url).netloc.lower().removeprefix("www.")
+            claim_key = f.get("claim", "")[:50]
+            key = f"{domain}:{claim_key}"
+            url_groups.setdefault(key, []).append(i)
+    circular_indices = set()
+    for key, indices in url_groups.items():
+        if len(indices) > 1:
+            for idx in indices:
+                circular_indices.add(idx)
+    return list(circular_indices)
+def score_findings(findings: list) -> list:
+    circular = detect_circular_sourcing(findings)
+    # Count agent agreement per claim (simplified: exact claim match)
+    claim_agents = {}
+    for f in findings:
+        claim = f.get("claim", "")
+        agent = f.get("agent_role", "unknown")
+        source_type = f.get("source_type", "")
+        claim_agents.setdefault(claim, {"agents": set(), "source_types": set()})
+        claim_agents[claim]["agents"].add(agent)
+        claim_agents[claim]["source_types"].add(source_type)
+    scored = []
+    for i, f in enumerate(findings):
+        type_score = score_source_type(f)
+        recency_score = score_recency(f)
+        authority_score = score_domain_authority(f)
+        bias_score = score_bias(f)
+        # Weighted composite
+        composite = (
+            type_score * 0.35 +
+            recency_score * 0.20 +
+            authority_score * 0.25 +
+            bias_score * 0.20
+        )
+        # Corroboration bonus
+        claim = f.get("claim", "")
+        if claim in claim_agents:
+            info = claim_agents[claim]
+            if len(info["agents"]) >= 2 and len(info["source_types"]) >= 2:
+                composite += 0.15
+        # Circular sourcing penalty
+        is_circular = i in circular
+        if is_circular:
+            composite -= 0.2
+        composite = max(0.0, min(1.0, composite))
+        scored_finding = {
+            **f,
+            "credibility_score": round(composite, 3),
+            "score_breakdown": {
+                "source_type": round(type_score, 3),
+                "recency": round(recency_score, 3),
+                "domain_authority": round(authority_score, 3),
+                "bias": round(bias_score, 3),
+            },
+            "circular_sourcing": is_circular,
+            "corroborated": claim in claim_agents and len(claim_agents[claim]["agents"]) >= 2,
+            "trust_level": (
+                "high" if composite >= 0.75 else
+                "moderate" if composite >= 0.55 else
+                "low" if composite >= 0.35 else
+                "verify"
+            ),
+        }
+        scored.append(scored_finding)
+    return sorted(scored, key=lambda x: x["credibility_score"], reverse=True)
+def main():
+    if len(sys.argv) < 2:
+        print("Usage: score_credibility.py <findings.json>", file=sys.stderr)
+        sys.exit(1)
+    with open(sys.argv[1]) as f:
+        findings = json.load(f)
+    scored = score_findings(findings)
+    print(json.dumps(scored, indent=2))
+if __name__ == "__main__":
+    main()

package/ftm-researcher/scripts/validate_research.py CHANGED Viewed

@@ -1,92 +1,92 @@
-#!/usr/bin/env python3
-"""
-Validates ftm-researcher output for completeness and quality.
-Checks:
-1. All required fields present in each finding
-2. Source URLs are non-empty for non-codebase findings
-3. Confidence scores in valid range
-4. Disagreement map has all 4 tiers
-5. No placeholder text (TBD, TODO, FIXME)
-6. Minimum finding count per mode (quick: 3, standard: 10, deep: 15)
-7. Source diversity: at least 3 different source types represented
-8. No duplicate claims (exact match)
-"""
-import json
-import sys
-REQUIRED_FINDING_FIELDS = ["claim", "source_type", "confidence", "agent_role"]
-REQUIRED_MAP_TIERS = ["consensus", "contested", "unique_insights", "refuted"]
-PLACEHOLDER_PATTERNS = ["TBD", "TODO", "FIXME", "placeholder", "lorem ipsum"]
-MIN_FINDINGS = {"quick": 3, "standard": 10, "deep": 15}
-def validate(output: dict) -> dict:
-    errors = []
-    warnings = []
-    mode = output.get("mode", "standard")
-    findings = output.get("findings", [])
-    disagreement_map = output.get("disagreement_map", {})
-    # Check minimum findings
-    min_count = MIN_FINDINGS.get(mode, 10)
-    if len(findings) < min_count:
-        warnings.append(f"Only {len(findings)} findings for {mode} mode (expected >= {min_count})")
-    # Check required fields
-    for i, f in enumerate(findings):
-        for field in REQUIRED_FINDING_FIELDS:
-            if field not in f or not f[field]:
-                errors.append(f"Finding {i}: missing required field '{field}'")
-        # Source URL required for non-codebase
-        if f.get("source_type") != "codebase" and not f.get("source_url"):
-            warnings.append(f"Finding {i}: no source_url for {f.get('source_type')} source")
-        # Confidence range
-        conf = f.get("confidence", 0)
-        if not (0.0 <= conf <= 1.0):
-            errors.append(f"Finding {i}: confidence {conf} out of range [0, 1]")
-        # Placeholder detection
-        text = json.dumps(f).lower()
-        for p in PLACEHOLDER_PATTERNS:
-            if p.lower() in text:
-                errors.append(f"Finding {i}: contains placeholder text '{p}'")
-    # Source diversity
-    source_types = set(f.get("source_type", "") for f in findings)
-    if len(source_types) < 3:
-        warnings.append(f"Only {len(source_types)} source types (expected >= 3)")
-    # Duplicate detection
-    claims = [f.get("claim", "") for f in findings]
-    dupes = [c for c in claims if claims.count(c) > 1]
-    if dupes:
-        errors.append(f"Duplicate claims found: {set(dupes)}")
-    # Disagreement map tiers
-    if mode in ("standard", "deep"):
-        for tier in REQUIRED_MAP_TIERS:
-            if tier not in disagreement_map:
-                errors.append(f"Disagreement map missing tier: {tier}")
-    return {"errors": errors, "warnings": warnings, "valid": len(errors) == 0}
-def main():
-    if len(sys.argv) < 2:
-        print("Usage: validate_research.py <output.json>", file=sys.stderr)
-        sys.exit(1)
-    with open(sys.argv[1]) as f:
-        output = json.load(f)
-    result = validate(output)
-    print(json.dumps(result, indent=2))
-    sys.exit(0 if result["valid"] else 1)
-if __name__ == "__main__":
-    main()
+#!/usr/bin/env python3
+"""
+Validates ftm-researcher output for completeness and quality.
+Checks:
+1. All required fields present in each finding
+2. Source URLs are non-empty for non-codebase findings
+3. Confidence scores in valid range
+4. Disagreement map has all 4 tiers
+5. No placeholder text (TBD, TODO, FIXME)
+6. Minimum finding count per mode (quick: 3, standard: 10, deep: 15)
+7. Source diversity: at least 3 different source types represented
+8. No duplicate claims (exact match)
+"""
+import json
+import sys
+# Keys every finding must carry with a non-empty value.
+REQUIRED_FINDING_FIELDS = ["claim", "source_type", "confidence", "agent_role"]
+# Tiers the disagreement map must contain in "standard" and "deep" modes.
+REQUIRED_MAP_TIERS = ["consensus", "contested", "unique_insights", "refuted"]
+# Case-insensitive substrings that mark unfinished content.
+PLACEHOLDER_PATTERNS = ["TBD", "TODO", "FIXME", "placeholder", "lorem ipsum"]
+# Minimum number of findings expected per research mode.
+MIN_FINDINGS = {"quick": 3, "standard": 10, "deep": 15}
+def _is_number(value) -> bool:
+    """Return True for int/float values; bool is deliberately excluded."""
+    return isinstance(value, (int, float)) and not isinstance(value, bool)
+def validate(output: dict) -> dict:
+    """Check a researcher output document for completeness and quality.
+    Args:
+        output: Parsed JSON document. Reads the optional keys "mode"
+            (defaults to "standard"), "findings" and "disagreement_map".
+    Returns:
+        A dict with "errors" and "warnings" (lists of messages) and "valid",
+        which is True only when no errors were recorded.
+    """
+    errors = []
+    warnings = []
+    mode = output.get("mode", "standard")
+    # `or` also covers an explicit JSON null, which .get() returns as None.
+    findings = output.get("findings") or []
+    disagreement_map = output.get("disagreement_map") or {}
+    # Check minimum findings
+    min_count = MIN_FINDINGS.get(mode, 10)
+    if len(findings) < min_count:
+        warnings.append(f"Only {len(findings)} findings for {mode} mode (expected >= {min_count})")
+    source_types = set()
+    seen_claims = set()
+    duplicate_claims = set()
+    for i, f in enumerate(findings):
+        # A malformed entry is reported instead of crashing the validator.
+        if not isinstance(f, dict):
+            errors.append(f"Finding {i}: expected an object, got {type(f).__name__}")
+            continue
+        # Check required fields. A numeric 0 is a legitimate value (for example
+        # a confidence of 0.0), so only None and empty non-numeric values
+        # count as missing.
+        for field in REQUIRED_FINDING_FIELDS:
+            value = f.get(field)
+            if value is None or (not value and not _is_number(value)):
+                errors.append(f"Finding {i}: missing required field '{field}'")
+        # Source URL required for non-codebase
+        if f.get("source_type") != "codebase" and not f.get("source_url"):
+            warnings.append(f"Finding {i}: no source_url for {f.get('source_type')} source")
+        # Confidence range. Empty or absent values were already reported as
+        # missing above; any other non-numeric value gets its own error rather
+        # than raising TypeError in the comparison.
+        conf = f.get("confidence")
+        if _is_number(conf):
+            if not (0.0 <= conf <= 1.0):
+                errors.append(f"Finding {i}: confidence {conf} out of range [0, 1]")
+        elif conf:
+            errors.append(f"Finding {i}: confidence {conf!r} is not a number")
+        # Placeholder detection
+        text = json.dumps(f).lower()
+        for p in PLACEHOLDER_PATTERNS:
+            if p.lower() in text:
+                errors.append(f"Finding {i}: contains placeholder text '{p}'")
+        source_types.add(f.get("source_type", ""))
+        # Track exact-match duplicates in one pass instead of calling
+        # list.count() for every claim.
+        claim = f.get("claim", "")
+        if isinstance(claim, str):
+            if claim in seen_claims:
+                duplicate_claims.add(claim)
+            else:
+                seen_claims.add(claim)
+    # Source diversity
+    if len(source_types) < 3:
+        warnings.append(f"Only {len(source_types)} source types (expected >= 3)")
+    # Duplicate detection
+    if duplicate_claims:
+        errors.append(f"Duplicate claims found: {duplicate_claims}")
+    # Disagreement map tiers
+    if mode in ("standard", "deep"):
+        for tier in REQUIRED_MAP_TIERS:
+            if tier not in disagreement_map:
+                errors.append(f"Disagreement map missing tier: {tier}")
+    return {"errors": errors, "warnings": warnings, "valid": len(errors) == 0}
+def main():
+    """CLI entry point: validate the JSON document named by argv[1].
+    Prints the validation report as indented JSON on stdout. Exits with
+    status 0 when the report is valid, and with status 1 when it is not or
+    when no input path is given.
+    """
+    if len(sys.argv) < 2:
+        print("Usage: validate_research.py <output.json>", file=sys.stderr)
+        sys.exit(1)
+    # JSON text is UTF-8 by specification; without an explicit encoding open()
+    # falls back to the platform locale and can fail on non-ASCII content.
+    with open(sys.argv[1], encoding="utf-8") as f:
+        output = json.load(f)
+    result = validate(output)
+    print(json.dumps(result, indent=2))
+    sys.exit(0 if result["valid"] else 1)
+# Run the CLI only when executed as a script, not when imported.
+if __name__ == "__main__":
+    main()

package/ftm-researcher.yml CHANGED Viewed

@@ -1,2 +1,2 @@
-name: ftm-researcher
-description: Deep parallel research engine with 7 domain-specialized finder agents, adversarial review via ftm-council, adaptive wave-based search, and codebase awareness. Use when the user wants thorough research on any topic — "research X", "find out about Y", "what's the state of the art on Z", "compare approaches to W", "deep dive into X", "look into Y". Also invoked by ftm-brainstorm for its research sprints. Triggers on "research", "investigate", "deep dive", "state of the art", "compare", "find examples of", "what's out there for", "how do others handle", "find me evidence", "look into". For idea exploration and brainstorming, use ftm-brainstorm instead (which calls ftm-researcher internally for research).
+name: ftm-researcher
+description: Deep parallel research engine with 7 domain-specialized finder agents, adversarial review via ftm-council, adaptive wave-based search, and codebase awareness. Use when the user wants thorough research on any topic — "research X", "find out about Y", "what's the state of the art on Z", "compare approaches to W", "deep dive into X", "look into Y". Also invoked by ftm-brainstorm for its research sprints. Triggers on "research", "investigate", "deep dive", "state of the art", "compare", "find examples of", "what's out there for", "how do others handle", "find me evidence", "look into". For idea exploration and brainstorming, use ftm-brainstorm instead (which calls ftm-researcher internally for research).