npm - verifiable-thinking-mcp - Versions diffs - 0.4.0 - Mend

verifiable-thinking-mcp 0.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (68) hide show

package/LICENSE +21 -0
package/README.md +339 -0
package/package.json +75 -0
package/src/index.ts +38 -0
package/src/lib/cache.ts +246 -0
package/src/lib/compression.ts +804 -0
package/src/lib/compute/cache.ts +86 -0
package/src/lib/compute/classifier.ts +555 -0
package/src/lib/compute/confidence.ts +79 -0
package/src/lib/compute/context.ts +154 -0
package/src/lib/compute/extract.ts +200 -0
package/src/lib/compute/filter.ts +224 -0
package/src/lib/compute/index.ts +171 -0
package/src/lib/compute/math.ts +247 -0
package/src/lib/compute/patterns.ts +564 -0
package/src/lib/compute/registry.ts +145 -0
package/src/lib/compute/solvers/arithmetic.ts +65 -0
package/src/lib/compute/solvers/calculus.ts +249 -0
package/src/lib/compute/solvers/derivation-core.ts +371 -0
package/src/lib/compute/solvers/derivation-latex.ts +160 -0
package/src/lib/compute/solvers/derivation-mistakes.ts +1046 -0
package/src/lib/compute/solvers/derivation-simplify.ts +451 -0
package/src/lib/compute/solvers/derivation-transform.ts +620 -0
package/src/lib/compute/solvers/derivation.ts +67 -0
package/src/lib/compute/solvers/facts.ts +120 -0
package/src/lib/compute/solvers/formula.ts +728 -0
package/src/lib/compute/solvers/index.ts +36 -0
package/src/lib/compute/solvers/logic.ts +422 -0
package/src/lib/compute/solvers/probability.ts +307 -0
package/src/lib/compute/solvers/statistics.ts +262 -0
package/src/lib/compute/solvers/word-problems.ts +408 -0
package/src/lib/compute/types.ts +107 -0
package/src/lib/concepts.ts +111 -0
package/src/lib/domain.ts +731 -0
package/src/lib/extraction.ts +912 -0
package/src/lib/index.ts +122 -0
package/src/lib/judge.ts +260 -0
package/src/lib/math/ast.ts +842 -0
package/src/lib/math/index.ts +8 -0
package/src/lib/math/operators.ts +171 -0
package/src/lib/math/tokenizer.ts +477 -0
package/src/lib/patterns.ts +200 -0
package/src/lib/session.ts +825 -0
package/src/lib/think/challenge.ts +323 -0
package/src/lib/think/complexity.ts +504 -0
package/src/lib/think/confidence-drift.ts +507 -0
package/src/lib/think/consistency.ts +347 -0
package/src/lib/think/guidance.ts +188 -0
package/src/lib/think/helpers.ts +568 -0
package/src/lib/think/hypothesis.ts +216 -0
package/src/lib/think/index.ts +127 -0
package/src/lib/think/prompts.ts +262 -0
package/src/lib/think/route.ts +358 -0
package/src/lib/think/schema.ts +98 -0
package/src/lib/think/scratchpad-schema.ts +662 -0
package/src/lib/think/spot-check.ts +961 -0
package/src/lib/think/types.ts +93 -0
package/src/lib/think/verification.ts +260 -0
package/src/lib/tokens.ts +177 -0
package/src/lib/verification.ts +620 -0
package/src/prompts/index.ts +10 -0
package/src/prompts/templates.ts +336 -0
package/src/resources/index.ts +8 -0
package/src/resources/sessions.ts +196 -0
package/src/tools/compress.ts +138 -0
package/src/tools/index.ts +5 -0
package/src/tools/scratchpad.ts +2659 -0
package/src/tools/sessions.ts +144 -0

package/src/lib/domain.ts ADDED Viewed

@@ -0,0 +1,731 @@
+/**
+ * Unified Domain Detector
+ *
+ * Single source of truth for domain detection used by:
+ * - Complexity router (think/complexity.ts) → complexity weight
+ * - Compute engine (compute/) → solver relevance filtering
+ * - Verification (verification.ts) → domain-specific checks
+ *
+ * Architecture: O(n) keyword matching with precomputed lowercase
+ * Returns both granular domain and meta-category for different consumers.
+ */
+import { type SolverMask, SolverType } from "./compute/classifier.ts";
+// =============================================================================
+// TYPES
+// =============================================================================
+/**
+ * Granular domain for complexity scoring.
+ *
+ * Each member is a key of the DOMAINS table in this module. "general" is the
+ * fallback reported by detectDomainFull when no keyword is found in the text.
+ */
+export type GranularDomain =
+  | "quantum_computing"
+  | "cryptography"
+  | "complexity_theory"
+  | "distributed_systems"
+  | "networking"
+  | "competitive_analysis"
+  | "paradox"
+  | "probability_statistics"
+  | "machine_learning"
+  | "cognitive_reasoning"
+  | "algorithms"
+  | "calculus"
+  | "linear_algebra"
+  | "logic_puzzle"
+  | "game_theory"
+  | "number_theory"
+  | "combinatorics"
+  | "constraint_reasoning"
+  | "conditional_probability"
+  | "lateral_thinking"
+  | "rate_problems"
+  | "clock_problems"
+  | "common_knowledge"
+  | "financial"
+  | "teaching"
+  | "general";
+/**
+ * Meta-category for compute filtering.
+ * Coarser than GranularDomain: every domain definition in this module is
+ * tagged with exactly one of these values.
+ */
+export type MetaDomain = "financial" | "coding" | "scientific" | "educational" | "general";
+/**
+ * Verification domain (legacy compat).
+ * Every domain definition in this module is tagged with exactly one of these
+ * four values.
+ */
+export type VerificationDomain = "math" | "logic" | "code" | "general";
+/**
+ * Full detection result.
+ * Carries the matched domain name together with the weight, meta-category,
+ * verification domain and solver mask copied from that domain's definition.
+ */
+export interface DomainResult {
+  /** Granular domain name ("general" when no keyword matched) */
+  domain: GranularDomain;
+  /** Complexity weight (0-1) for router; the fallback "general" domain uses 0.5 */
+  weight: number;
+  /** Meta-category for compute filtering */
+  meta: MetaDomain;
+  /** Verification domain for legacy compat */
+  verification: VerificationDomain;
+  /** Solver types relevant for this domain, as a bitmask (test a flag with `&`) */
+  relevantSolvers: SolverMask;
+}
+// =============================================================================
+// DOMAIN DEFINITIONS
+// =============================================================================
+interface DomainDef { // Static description of one domain (one value of the DOMAINS table)
+  keywords: string[]; // Substrings that select this domain; lowercased when indexed
+  weight: number; // Complexity weight; also decides which domain's keywords are tried first
+  meta: MetaDomain; // Meta-category copied into the detection result
+  verification: VerificationDomain; // Verification domain copied into the detection result
+  /** Which solver types are relevant (bitmask) */
+  solvers: SolverMask;
+}
+/**
+ * Union of every solver flag listed in this module - used by domains that
+ * should not restrict the compute engine (e.g. the educational-style ones).
+ */
+const ALL_SOLVERS =
+  SolverType.ARITHMETIC |
+  SolverType.FACTS |
+  SolverType.LOGIC |
+  SolverType.PROBABILITY |
+  SolverType.CALCULUS |
+  SolverType.WORD_PROBLEM |
+  SolverType.MULTI_STEP |
+  SolverType.FORMULA_TIER1 |
+  SolverType.FORMULA_TIER2 |
+  SolverType.FORMULA_TIER3 |
+  SolverType.FORMULA_TIER4;
+/** Minimal mask: plain arithmetic, the two lowest formula tiers and facts */
+const BASIC_MATH =
+  SolverType.FACTS | SolverType.ARITHMETIC | SolverType.FORMULA_TIER1 | SolverType.FORMULA_TIER2;
+/** Mask for money-related questions */
+const FINANCIAL_SOLVERS =
+  SolverType.WORD_PROBLEM |
+  SolverType.ARITHMETIC |
+  SolverType.FORMULA_TIER1 | // percentage
+  SolverType.FORMULA_TIER4; // interest
+/** Mask for programming / computer-science questions */
+const CODING_SOLVERS =
+  SolverType.ARITHMETIC |
+  SolverType.FORMULA_TIER1 | // modulo, factorial
+  SolverType.FORMULA_TIER2 | // power, gcd, lcm
+  SolverType.FORMULA_TIER3; // log, combinations
+/** Scientific questions may need any solver, so this is an alias of ALL_SOLVERS */
+const SCIENTIFIC_SOLVERS = ALL_SOLVERS;
+/** Mask for logic and probability puzzles */
+const LOGIC_SOLVERS =
+  SolverType.ARITHMETIC | SolverType.FACTS | SolverType.LOGIC | SolverType.PROBABILITY;
+const DOMAINS: Record<GranularDomain, DomainDef> = {
+  // === HIGH COMPLEXITY (0.88+) ===
+  quantum_computing: {
+    keywords: ["quantum", "qubit", "superposition", "entanglement", "shor's algorithm"],
+    weight: 0.95,
+    meta: "scientific",
+    verification: "math",
+    solvers: SCIENTIFIC_SOLVERS,
+  },
+  cryptography: {
+    keywords: [
+      "cryptograph",
+      "rsa",
+      "lattice",
+      "zero-knowledge",
+      "discrete logarithm",
+      "public-key",
+      "security reduction",
+    ],
+    weight: 0.95,
+    meta: "coding",
+    verification: "math",
+    solvers: CODING_SOLVERS,
+  },
+  common_knowledge: {
+    keywords: [
+      "blue eyes",
+      "blue-eyed",
+      "islanders",
+      "leave at midnight",
+      "know your",
+      "common knowledge",
+      "induction",
+      "eye color",
+      "days until",
+    ],
+    weight: 0.95,
+    meta: "educational",
+    verification: "logic",
+    solvers: ALL_SOLVERS,
+  },
+  complexity_theory: {
+    keywords: [
+      "p ≠ np",
+      "p vs np",
+      "np-complete",
+      "np-hard",
+      "polynomial-time",
+      "exponential time",
+      "sat solver",
+      "sat instance",
+      "halting problem",
+      "undecidable",
+      "computability",
+      "turing machine",
+    ],
+    weight: 0.9,
+    meta: "coding",
+    verification: "logic",
+    solvers: CODING_SOLVERS,
+  },
+  distributed_systems: {
+    keywords: [
+      "lock-free",
+      "consensus",
+      "distributed",
+      "byzantine",
+      "memory ordering",
+      "cache coherence",
+      "two-phase commit",
+      "paxos",
+      "raft",
+    ],
+    weight: 0.9,
+    meta: "coding",
+    verification: "code",
+    solvers: CODING_SOLVERS,
+  },
+  paradox: {
+    keywords: [
+      "two envelopes",
+      "envelope paradox",
+      "sleeping beauty",
+      "halfers",
+      "thirders",
+      "monty hall",
+      "naive argument",
+      "symmetrically",
+      "prisoners",
+      "loop-following",
+      "survival probability",
+      "100 boxes",
+      "boy born on tuesday",
+      "born on",
+      "probability both are boys",
+      "both children",
+      "two children",
+      "this statement",
+      "self-referential",
+      "liar paradox",
+      "sorites",
+      "heap paradox",
+      "grain",
+      "simpson",
+      "aggregation paradox",
+    ],
+    weight: 0.92,
+    meta: "educational",
+    verification: "logic",
+    solvers: ALL_SOLVERS,
+  },
+  logic_puzzle: {
+    keywords: [
+      "knight",
+      "knave",
+      "liar",
+      "truth-teller",
+      "truthteller",
+      "syllogism",
+      "valid argument",
+      "sound argument",
+      "premise",
+      "conclusion follows",
+      "logically",
+      "VALID", // keywords are lowercased when indexed, so this matches any "valid" substring
+      "INVALID",
+      "UNSOUND",
+      "valid or invalid",
+      "sound or unsound",
+    ],
+    weight: 0.92,
+    meta: "educational",
+    verification: "logic",
+    solvers: LOGIC_SOLVERS,
+  },
+  game_theory: {
+    keywords: [
+      "prisoner's dilemma",
+      "nash equilibrium",
+      "payoff",
+      "dominant strategy",
+      "zero-sum",
+      "minimax",
+      "game theory",
+    ],
+    weight: 0.9,
+    meta: "scientific",
+    verification: "math",
+    solvers: SCIENTIFIC_SOLVERS,
+  },
+  conditional_probability: {
+    keywords: [
+      "given that",
+      "conditional",
+      "revolver",
+      "russian roulette",
+      "chamber",
+      "bullet",
+      "envelope",
+      "adjacent",
+      "spin",
+      "fire",
+    ],
+    weight: 0.9,
+    meta: "scientific",
+    verification: "math",
+    solvers: SolverType.PROBABILITY | SolverType.ARITHMETIC,
+  },
+  competitive_analysis: {
+    keywords: ["competitive ratio", "online algorithm", "ski-rental", "adversarial"],
+    weight: 0.88,
+    meta: "coding",
+    verification: "math",
+    solvers: CODING_SOLVERS,
+  },
+  // === MODERATE-HIGH COMPLEXITY (0.7-0.85) ===
+  number_theory: {
+    keywords: [
+      "prime",
+      "factorial",
+      "divisible",
+      "remainder",
+      "modulo",
+      "mod ", // NOTE(review): trailing space presumably avoids matching "model", "mode", etc. - confirm
+      "trailing zero",
+      "integer",
+      "divisor",
+      "gcd",
+      "lcm",
+      "last digit",
+      "^100",
+      "^10",
+    ],
+    weight: 0.85,
+    meta: "scientific",
+    verification: "math",
+    solvers:
+      SolverType.FORMULA_TIER1 |
+      SolverType.FORMULA_TIER2 |
+      SolverType.FORMULA_TIER3 |
+      SolverType.ARITHMETIC,
+  },
+  combinatorics: {
+    keywords: [
+      "arrange",
+      "permutation",
+      "combination",
+      "ways to",
+      "how many ways",
+      "choose",
+      "select",
+      "distribute",
+      "partition",
+      "letters in",
+      "anagram",
+      "mississippi",
+      "arrange the letters",
+    ],
+    weight: 0.85,
+    meta: "scientific",
+    verification: "math",
+    solvers: SolverType.FORMULA_TIER3 | SolverType.ARITHMETIC,
+  },
+  constraint_reasoning: {
+    keywords: [
+      "minimum number",
+      "guarantee",
+      "worst case",
+      "at least",
+      "at most",
+      "balance scale",
+      "weighing",
+      "pigeonhole",
+      "must draw",
+      "must flip",
+    ],
+    weight: 0.85,
+    meta: "educational",
+    verification: "logic",
+    solvers: ALL_SOLVERS,
+  },
+  clock_problems: {
+    keywords: ["clock hands", "hour hand", "minute hand", "overlap", "12 hours", "24 hours"],
+    weight: 0.85,
+    meta: "scientific",
+    verification: "math",
+    solvers: SolverType.ARITHMETIC | SolverType.FORMULA_TIER1,
+  },
+  probability_statistics: {
+    keywords: [
+      "probability",
+      "bayesian",
+      "conditional probability",
+      "bayes",
+      "distribution",
+      "regression",
+      "statistical",
+      "expected value",
+      "variance",
+      "sample size",
+      "more reliable",
+      "less reliable",
+      "survey of",
+      "expected number",
+      "expected flips",
+      "expected rolls",
+      // Econometrics / causal inference
+      "instrumental variable",
+      "instrument",
+      "causal effect",
+      "causal inference",
+      "endogenous",
+      "exogenous",
+      "confound",
+      "confounder",
+      "treatment effect",
+      "randomized",
+      "observational",
+      "selection bias",
+      "omitted variable",
+      "estimate effect",
+      "estimate the effect",
+    ],
+    weight: 0.85, // Higher than teaching (0.55), so these keywords are tried first when both domains match
+    meta: "scientific",
+    verification: "math",
+    solvers: SolverType.PROBABILITY | SolverType.ARITHMETIC | SolverType.FORMULA_TIER1,
+  },
+  lateral_thinking: {
+    keywords: ["trick", "lateral", "only enter once", "can only", "how do you", "determine which"],
+    weight: 0.8,
+    meta: "educational",
+    verification: "logic",
+    solvers: ALL_SOLVERS,
+  },
+  machine_learning: {
+    keywords: [
+      "backpropagation",
+      "gradient",
+      "neural network",
+      "deep learning",
+      "optimization",
+      "loss function",
+      "transformer",
+      "attention mechanism",
+    ],
+    weight: 0.75,
+    meta: "coding",
+    verification: "math",
+    solvers: SCIENTIFIC_SOLVERS,
+  },
+  cognitive_reasoning: {
+    keywords: [
+      "cognitive",
+      "psychology",
+      "logical fallacy",
+      "fallacy",
+      "inference",
+      "heuristic",
+      "bias",
+    ],
+    weight: 0.75,
+    meta: "educational",
+    verification: "logic",
+    solvers: LOGIC_SOLVERS,
+  },
+  rate_problems: {
+    keywords: [
+      "machines",
+      "widgets",
+      "workers",
+      "mph",
+      "speed",
+      "rate",
+      "per hour",
+      "per minute",
+      "round trip",
+      "average speed",
+    ],
+    weight: 0.75,
+    meta: "scientific",
+    verification: "math",
+    solvers: SolverType.WORD_PROBLEM | SolverType.ARITHMETIC | SolverType.FORMULA_TIER1,
+  },
+  calculus: {
+    keywords: [
+      "derivative",
+      "integral",
+      "limit",
+      "differentiation",
+      "integration",
+      "calculus",
+      "d/dx",
+      "integral of",
+      "∫",
+    ],
+    weight: 0.72,
+    meta: "scientific",
+    verification: "math",
+    solvers:
+      SolverType.CALCULUS |
+      SolverType.ARITHMETIC |
+      SolverType.FORMULA_TIER1 |
+      SolverType.FORMULA_TIER2,
+  },
+  algorithms: {
+    keywords: [
+      "algorithm",
+      "time complexity",
+      "space complexity",
+      "big-o",
+      "recursion",
+      "dynamic programming",
+      "graph traversal",
+    ],
+    weight: 0.7,
+    meta: "coding",
+    verification: "code",
+    solvers: CODING_SOLVERS,
+  },
+  linear_algebra: {
+    keywords: [
+      "matrix",
+      "determinant",
+      "eigenvalue",
+      "eigenvector",
+      "inverse matrix",
+      "transpose",
+      "linear transformation",
+    ],
+    weight: 0.7,
+    meta: "scientific",
+    verification: "math",
+    solvers: SolverType.FORMULA_TIER4 | SolverType.ARITHMETIC,
+  },
+  networking: {
+    keywords: ["tcp", "udp", "three-way handshake", "protocol", "packet", "routing", "dns", "http"],
+    weight: 0.7,
+    meta: "coding",
+    verification: "code",
+    solvers: BASIC_MATH,
+  },
+  // === FINANCIAL (special category) ===
+  financial: {
+    keywords: [
+      "interest",
+      "compound",
+      "investment",
+      "roi",
+      "return on",
+      "savings",
+      "loan",
+      "mortgage",
+      "amortization",
+      "apr",
+      "apy",
+      "stock",
+      "portfolio",
+      "dividend",
+      "inflation",
+      "present value",
+      "future value",
+      "npv",
+      "irr",
+      "financial advisor",
+      "finance",
+      "budget",
+      "expense",
+      "revenue",
+      "profit margin",
+      "break-even",
+    ],
+    weight: 0.65,
+    meta: "financial",
+    verification: "math",
+    solvers: FINANCIAL_SOLVERS,
+  },
+  // === TEACHING/EDUCATIONAL (show all work) ===
+  teaching: {
+    keywords: [
+      "tutor",
+      "teacher",
+      "student",
+      "homework",
+      "assignment",
+      "lesson",
+      "learn",
+      "explain",
+      "teach",
+      "class",
+      "course",
+      "education",
+      "school",
+      "university",
+      "college",
+      "exam",
+      "test prep",
+      "study",
+      "practice problem",
+      "exercise",
+      "worksheet",
+      "step by step",
+      "show your work",
+      "show work",
+      "solve step",
+      "walk through",
+      "walkthrough",
+    ],
+    weight: 0.55, // Lowest weight of any keyword-bearing domain - any other matching domain takes precedence
+    meta: "educational",
+    verification: "general",
+    solvers: ALL_SOLVERS,
+  },
+  // === DEFAULT ===
+  general: {
+    keywords: [],
+    weight: 0.5,
+    meta: "general",
+    verification: "general",
+    solvers: BASIC_MATH,
+  },
+};
+// Every domain paired with its definition, in declaration order. The "general"
+// fallback is left out: it is never matched by keyword, only returned by default.
+const DOMAIN_LIST = (Object.keys(DOMAINS) as GranularDomain[])
+  .filter((name) => name !== "general")
+  .map((name): [GranularDomain, DomainDef] => [name, DOMAINS[name]]);
+// =============================================================================
+// OPTIMIZED KEYWORD INDEX
+// Build a flat, pre-sorted list of (keyword, domain) entries for substring matching.
+// Entries are sorted by domain weight (highest first), then by keyword length
+// (longest first), so detection can stop at the first keyword found in the text.
+// =============================================================================
+interface KeywordEntry { // One searchable keyword together with the domain it selects
+  keyword: string; // Lowercased keyword, compared against the lowercased input text
+  domain: GranularDomain; // Domain reported when the keyword is found
+  def: DomainDef; // Definition of that domain (weight, meta, verification, solvers)
+}
+/**
+ * Flat keyword index, built once at module load time.
+ *
+ * Every keyword of every non-fallback domain is lowercased so it can be
+ * compared against lowercased input text. Entries are ordered by:
+ *   1. Domain weight, descending - keywords of heavier domains are tried first
+ *      (e.g. "financial" at 0.65 is tried before "teaching" at 0.55).
+ *   2. Keyword length, descending - within one weight tier the more specific
+ *      keyword is tried first (e.g. "liar paradox" before "liar").
+ * Array.prototype.sort is stable, so entries tied on both criteria keep their
+ * declaration order.
+ */
+const KEYWORD_INDEX: KeywordEntry[] = DOMAIN_LIST.flatMap(([domain, def]) =>
+  def.keywords.map((kw): KeywordEntry => ({ keyword: kw.toLowerCase(), domain, def })),
+).sort((a, b) => {
+  // Compare weights exactly. A tolerance-based "same tier" test is not
+  // transitive, so it would leave the sort order unspecified as soon as two
+  // weights closer than the tolerance were introduced.
+  if (a.def.weight !== b.def.weight) return b.def.weight - a.def.weight;
+  return b.keyword.length - a.keyword.length;
+});
+// =============================================================================
+// MAIN DETECTION FUNCTION
+// =============================================================================
+/**
+ * Classify a piece of text into a domain.
+ *
+ * The text is lowercased once and tested against the pre-sorted keyword index
+ * with a substring check; the first keyword found decides the domain. Because
+ * the index is ordered by domain weight and then by keyword length, the
+ * heaviest matching domain wins, with longer keywords preferred inside a
+ * weight tier. Text that contains no keyword is reported as "general".
+ *
+ * @param text - Text to analyze (question, system prompt, or thought)
+ * @returns Domain name plus its weight, meta-category, verification domain
+ *   and solver bitmask
+ */
+export function detectDomainFull(text: string): DomainResult {
+  const haystack = text.toLowerCase();
+  const hit = KEYWORD_INDEX.find((entry) => haystack.includes(entry.keyword));
+  // No keyword present: fall back to the catch-all "general" definition.
+  const domain: GranularDomain = hit ? hit.domain : "general";
+  const def = hit ? hit.def : DOMAINS.general;
+  return {
+    domain,
+    weight: def.weight,
+    meta: def.meta,
+    verification: def.verification,
+    relevantSolvers: def.solvers,
+  };
+}
+// =============================================================================
+// CONVENIENCE FUNCTIONS
+// =============================================================================
+/**
+ * Shortcut for the complexity router: run full detection and keep only the
+ * granular domain name.
+ */
+export function detectGranularDomain(text: string): GranularDomain {
+  const { domain } = detectDomainFull(text);
+  return domain;
+}
+/**
+ * Shortcut for complexity scoring: run full detection and keep only the
+ * domain name and its weight.
+ */
+export function getDomainWeight(text: string): { domain: string; weight: number } {
+  const { domain, weight } = detectDomainFull(text);
+  return { domain, weight };
+}
+/**
+ * Shortcut for compute filtering: run full detection and keep only the
+ * meta-category.
+ */
+export function detectMetaDomain(text: string): MetaDomain {
+  const { meta } = detectDomainFull(text);
+  return meta;
+}
+/**
+ * Shortcut kept for legacy compatibility with verification.ts: run full
+ * detection and keep only the verification domain.
+ */
+export function detectVerificationDomain(text: string): VerificationDomain {
+  const { verification } = detectDomainFull(text);
+  return verification;
+}
+/**
+ * Run full detection on the text and return the solver bitmask of the
+ * detected domain.
+ */
+export function getRelevantSolvers(text: string): SolverMask {
+  const { relevantSolvers } = detectDomainFull(text);
+  return relevantSolvers;
+}
+/**
+ * Tell whether a solver type is relevant for the domain detected in the text.
+ * True when the given mask shares at least one bit with the domain's mask.
+ */
+export function isSolverRelevant(text: string, solverType: SolverMask): boolean {
+  const { relevantSolvers } = detectDomainFull(text);
+  const sharedBits = relevantSolvers & solverType;
+  return sharedBits !== 0;
+}