npm - thumbgate - Versions diffs - 1.15.0 → 1.16.0 - Mend

thumbgate 1.15.0 → 1.16.0

This diff shows the changes between two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in the respective public registry.

Files changed (129)

package/.claude-plugin/marketplace.json +6 -6
package/.claude-plugin/plugin.json +3 -3
package/.well-known/llms.txt +5 -5
package/.well-known/mcp/server-card.json +1 -1
package/README.md +59 -35
package/adapters/chatgpt/openapi.yaml +118 -2
package/adapters/claude/.mcp.json +2 -2
package/adapters/mcp/server-stdio.js +210 -84
package/adapters/opencode/opencode.json +1 -1
package/bench/prompt-eval-suite.json +5 -1
package/bin/cli.js +157 -8
package/config/evals/agent-safety-eval.json +338 -22
package/config/gates/routine.json +43 -0
package/config/github-about.json +3 -3
package/config/model-candidates.json +131 -0
package/openapi/openapi.yaml +118 -2
package/package.json +55 -48
package/public/blog.html +7 -7
package/public/codex-plugin.html +6 -6
package/public/compare.html +29 -23
package/public/dashboard.html +82 -10
package/public/guide.html +28 -28
package/public/index.html +216 -98
package/public/learn.html +50 -22
package/public/lessons.html +1 -1
package/public/numbers.html +17 -17
package/public/pro.html +82 -18
package/scripts/agent-audit-trace.js +55 -0
package/scripts/agent-memory-lifecycle.js +96 -0
package/scripts/agent-readiness-plan.js +118 -0
package/scripts/agentic-data-pipeline.js +21 -1
package/scripts/agents-sdk-sandbox-plan.js +57 -0
package/scripts/ai-org-governance.js +98 -0
package/scripts/ai-search-distribution.js +43 -0
package/scripts/artifact-agent-plan.js +81 -0
package/scripts/billing.js +27 -8
package/scripts/cli-schema.js +18 -2
package/scripts/code-mode-mcp-plan.js +71 -0
package/scripts/context-engine.js +1 -2
package/scripts/context-manager.js +4 -1
package/scripts/dashboard-render-spec.js +1 -1
package/scripts/dashboard.js +275 -9
package/scripts/decision-journal.js +13 -3
package/scripts/document-workflow-governance.js +62 -0
package/scripts/enterprise-agent-rollout.js +34 -0
package/scripts/experience-replay-governance.js +69 -0
package/scripts/export-hf-dataset.js +1 -1
package/scripts/feedback-loop.js +92 -4
package/scripts/feedback-to-rules.js +17 -23
package/scripts/gates-engine.js +4 -6
package/scripts/growth-campaigns.js +49 -0
package/scripts/harness-selector.js +16 -4
package/scripts/hybrid-supervisor-agent.js +64 -0
package/scripts/inference-cache-policy.js +72 -0
package/scripts/inference-economics.js +53 -0
package/scripts/internal-agent-bootstrap.js +12 -2
package/scripts/knowledge-layer-plan.js +108 -0
package/scripts/lesson-inference.js +183 -44
package/scripts/lesson-search.js +4 -1
package/scripts/llm-client.js +157 -26
package/scripts/mailer/resend-mailer.js +112 -1
package/scripts/mcp-transport-strategy.js +66 -0
package/scripts/memory-store-governance.js +60 -0
package/scripts/meta-agent-loop.js +7 -13
package/scripts/model-access-eligibility.js +38 -0
package/scripts/model-migration-readiness.js +55 -0
package/scripts/operational-integrity.js +96 -3
package/scripts/otel-declarative-config.js +56 -0
package/scripts/perplexity-client.js +1 -1
package/scripts/post-training-governance.js +34 -0
package/scripts/private-core-boundary.js +72 -0
package/scripts/production-agent-readiness.js +40 -0
package/scripts/prompt-eval.js +564 -32
package/scripts/prompt-programs.js +93 -0
package/scripts/provider-action-normalizer.js +585 -0
package/scripts/scaling-law-claims.js +60 -0
package/scripts/security-scanner.js +1 -1
package/scripts/self-distill-agent.js +7 -32
package/scripts/seo-gsd.js +232 -55
package/scripts/skill-rag-router.js +53 -0
package/scripts/spec-gate.js +1 -1
package/scripts/student-consistent-training.js +73 -0
package/scripts/synthetic-data-provenance.js +98 -0
package/scripts/task-context-result.js +81 -0
package/scripts/telemetry-analytics.js +149 -0
package/scripts/thompson-sampling.js +2 -2
package/scripts/token-savings.js +7 -6
package/scripts/token-tco.js +46 -0
package/scripts/tool-registry.js +63 -3
package/scripts/verification-loop.js +10 -1
package/scripts/verifier-scoring.js +71 -0
package/scripts/workflow-sentinel.js +284 -28
package/scripts/workspace-agent-routines.js +118 -0
package/src/api/server.js +381 -120
package/scripts/analytics-report.js +0 -328
package/scripts/autonomous-workflow.js +0 -377
package/scripts/billing-setup.js +0 -109
package/scripts/creator-campaigns.js +0 -239
package/scripts/cross-encoder-reranker.js +0 -235
package/scripts/daemon-manager.js +0 -108
package/scripts/decision-trace.js +0 -354
package/scripts/delegation-runtime.js +0 -896
package/scripts/dispatch-brief.js +0 -159
package/scripts/distribution-surfaces.js +0 -110
package/scripts/feedback-history-distiller.js +0 -382
package/scripts/funnel-analytics.js +0 -35
package/scripts/history-distiller.js +0 -200
package/scripts/hosted-job-launcher.js +0 -256
package/scripts/intent-router.js +0 -392
package/scripts/lesson-reranker.js +0 -263
package/scripts/lesson-retrieval.js +0 -148
package/scripts/managed-lesson-agent.js +0 -183
package/scripts/operational-dashboard.js +0 -103
package/scripts/operational-summary.js +0 -129
package/scripts/operator-artifacts.js +0 -608
package/scripts/optimize-context.js +0 -17
package/scripts/org-dashboard.js +0 -206
package/scripts/partner-orchestration.js +0 -146
package/scripts/predictive-insights.js +0 -356
package/scripts/pulse.js +0 -80
package/scripts/reflector-agent.js +0 -221
package/scripts/sales-pipeline.js +0 -681
package/scripts/session-episode-store.js +0 -329
package/scripts/session-health-sensor.js +0 -242
package/scripts/session-report.js +0 -120
package/scripts/swarm-coordinator.js +0 -81
package/scripts/tool-kpi-tracker.js +0 -12
package/scripts/webhook-delivery.js +0 -62
package/scripts/workflow-sprint-intake.js +0 -475

package/adapters/mcp/server-stdio.js CHANGED Viewed

@@ -4,6 +4,10 @@
 const fs = require('fs');
 const path = require('path');
 const promptCache = new Map();
+const {
+  createUnavailableReport,
+  loadOptionalModule,
+} = require('../../scripts/private-core-boundary');
 function getCachedPrompt(key) {
   return promptCache.get(key);
@@ -46,14 +50,6 @@ const {
   readSessionHandoff,
 } = require('../../scripts/contextfs');
 const { buildRubricEvaluation } = require('../../scripts/rubric-engine');
-const {
-  listIntents,
-  planIntent,
-} = require('../../scripts/intent-router');
-const {
-  startHandoff,
-  completeHandoff,
-} = require('../../scripts/delegation-runtime');
 const {
   getActiveMcpProfile,
   getAllowedTools,
@@ -80,6 +76,9 @@ const {
 const {
   evaluateWorkflowSentinel,
 } = require('../../scripts/workflow-sentinel');
+const {
+  normalizeProviderAction,
+} = require('../../scripts/provider-action-normalizer');
 const { diagnoseFailure } = require('../../scripts/failure-diagnostics');
 const {
   analyzeCodeGraphImpact,
@@ -98,12 +97,11 @@ const {
   loadModel,
   getReliability,
 } = require('../../scripts/thompson-sampling');
-const {
-  searchLessons,
-} = require('../../scripts/lesson-search');
 const {
   retrieveRelevantLessons,
-} = require('../../scripts/lesson-retrieval');
+} = loadOptionalModule(path.join(__dirname, '../../scripts/lesson-retrieval'), () => ({
+  retrieveRelevantLessons: () => [],
+}));
 const {
   searchThumbgate,
 } = require('../../scripts/thumbgate-search');
@@ -116,7 +114,17 @@ const {
   readImportedDocument,
 } = require('../../scripts/document-intake');
 const { checkLimit, UPGRADE_MESSAGE } = require('../../scripts/rate-limiter');
-const { generateOrgDashboard } = require('../../scripts/org-dashboard');
+const { generateOrgDashboard } = loadOptionalModule(path.join(__dirname, '../../scripts/org-dashboard'), () => ({
+  generateOrgDashboard: () => ({
+    activeAgents: 0,
+    totalAgents: 0,
+    orgAdherenceRate: 0,
+    topBlockedGates: [],
+    riskAgents: [],
+    upgradeMessage: 'Org dashboard requires ThumbGate-Core.',
+    ...createUnavailableReport('Org dashboard'),
+  }),
+}));
 const {
   listHarnesses,
   runHarness,
@@ -124,21 +132,56 @@ const {
 const { runLoop: runAutoresearchLoop } = require('../../scripts/autoresearch-runner');
 const { TOOLS } = require('../../scripts/tool-registry');
 const { buildContextFootprintReport } = require('../../scripts/context-footprint');
-const { reflect: reflectOnFeedback } = require('../../scripts/reflector-agent');
+const { reflect: reflectOnFeedback } = loadOptionalModule(path.join(__dirname, '../../scripts/reflector-agent'), () => ({
+  reflect: () => createUnavailableReport('Feedback reflection'),
+}));
 const { submitProductIssue } = require('../../scripts/product-feedback');
 const {
   assembleUnifiedContext,
   formatUnifiedContext,
 } = require('../../scripts/context-manager');
 const { exportHfDataset } = require('../../scripts/export-hf-dataset');
-const { distributeContextToAgents } = require('../../scripts/swarm-coordinator');
-const { buildSessionReport } = require('../../scripts/session-report');
-const {
-  generateOperatorArtifact,
-  formatArtifactMarkdown,
-} = require('../../scripts/operator-artifacts');
 const PRO_CHECKOUT_URL = 'https://thumbgate-production.up.railway.app/checkout/pro';
+const PRIVATE_MCP_MODULES = Object.freeze({
+  intentRouter: path.resolve(__dirname, '../../scripts/intent-router.js'),
+  delegationRuntime: path.resolve(__dirname, '../../scripts/delegation-runtime.js'),
+  orgDashboard: path.resolve(__dirname, '../../scripts/org-dashboard.js'),
+  reflectorAgent: path.resolve(__dirname, '../../scripts/reflector-agent.js'),
+  swarmCoordinator: path.resolve(__dirname, '../../scripts/swarm-coordinator.js'),
+  sessionReport: path.resolve(__dirname, '../../scripts/session-report.js'),
+  operatorArtifacts: path.resolve(__dirname, '../../scripts/operator-artifacts.js'),
+  managedLessonAgent: path.resolve(__dirname, '../../scripts/managed-lesson-agent.js'),
+  semanticLayer: path.resolve(__dirname, '../../scripts/semantic-layer.js'),
+  lessonInference: path.resolve(__dirname, '../../scripts/lesson-inference.js'),
+  lessonSearch: path.resolve(__dirname, '../../scripts/lesson-search.js'),
+});
+function loadPrivateMcpModule(key) {
+  const modulePath = PRIVATE_MCP_MODULES[key];
+  if (!modulePath) {
+    throw new Error(`Unknown private MCP module: ${key}`);
+  }
+  try {
+    return require(modulePath);
+  } catch (error) {
+    const message = String(error && error.message || '');
+    if ((error && (error.code === 'MODULE_NOT_FOUND' || error.code === 'ERR_MODULE_NOT_FOUND'))
+      && (message.includes(modulePath) || message.includes(path.basename(modulePath)))) {
+      return null;
+    }
+    throw error;
+  }
+}
+function unavailablePrivateMcpFeature(toolName) {
+  return toTextResult({
+    ok: false,
+    availability: 'private_core',
+    tool: toolName,
+    message: `${toolName} is only available in the ThumbGate private core or hosted runtime.`,
+  });
+}
 function enforceLimit(action) {
   const limit = checkLimit(action);
@@ -158,7 +201,7 @@ const {
   finalizeSession: finalizeFeedbackSession,
 } = require('../../scripts/feedback-session');
-const SERVER_INFO = { name: 'thumbgate-mcp', version: '1.15.0' };
+const SERVER_INFO = { name: 'thumbgate-mcp', version: '1.16.0' };
 const COMMERCE_CATEGORIES = [
   'product_recommendation',
   'brand_compliance',
@@ -316,13 +359,14 @@ function buildDiagnoseFailureResponse(args = {}) {
   if (args.intentId) {
     try {
-      intentPlan = planIntent({
+      const module = loadPrivateMcpModule('intentRouter');
+      intentPlan = module ? module.planIntent({
         intentId: args.intentId,
         context: args.context || '',
         mcpProfile: requestedProfile,
         approved: args.approved === true,
         repoPath: args.repoPath,
-      });
+      }) : null;
     } catch (_) {
       intentPlan = null;
     }
@@ -511,15 +555,24 @@ async function callToolInner(name, args) {
       return toCaptureFeedbackTextResult(captureFeedback(args));
     case 'feedback_summary':
       return toTextResult(feedbackSummary(Number(args.recent || 20)));
-    case 'search_lessons':
-      return toTextResult(searchLessons(args.query || '', {
+    case 'search_lessons': {
+      const module = loadPrivateMcpModule('lessonSearch');
+      if (!module) return unavailablePrivateMcpFeature('search_lessons');
+      return toTextResult(module.searchLessons(args.query || '', {
         limit: Number(args.limit || 10),
         category: args.category,
         tags: Array.isArray(args.tags) ? args.tags : [],
       }));
+    }
     case 'retrieve_lessons': {
       // Cross-encoder reranking: retrieve more candidates, then rerank for precision
-      const { retrieveWithRerankingSync } = require('../../scripts/cross-encoder-reranker');
+      const { retrieveWithRerankingSync } = loadOptionalModule(path.join(__dirname, '../../scripts/cross-encoder-reranker'), () => ({
+        retrieveWithRerankingSync: (toolName, actionContext, options = {}) => retrieveRelevantLessons(
+          toolName,
+          actionContext,
+          { maxResults: options.maxResults || 5 },
+        ),
+      }));
       return toTextResult(retrieveWithRerankingSync(
         args.toolName,
         args.actionContext || '',
@@ -565,13 +618,17 @@ async function callToolInner(name, args) {
     case 'diagnose_failure':
       return buildDiagnoseFailureResponse(args);
     case 'reflect_on_feedback':
-      return toTextResult(reflectOnFeedback({
+      {
+        const module = loadPrivateMcpModule('reflectorAgent');
+        if (!module) return unavailablePrivateMcpFeature('reflect_on_feedback');
+        return toTextResult(module.reflect({
         conversationWindow: args.conversationWindow || [],
         context: args.context || '',
         whatWentWrong: args.whatWentWrong || '',
         structuredRule: null,
         feedbackEvent: args.feedbackEventId ? { id: args.feedbackEventId } : null,
-      }));
+        }));
+      }
     case 'report_product_issue':
       return toTextResult(await submitProductIssue({
         title: args.title,
@@ -580,52 +637,69 @@ async function callToolInner(name, args) {
         source: 'mcp tool',
       }));
     case 'list_intents':
-      return toTextResult(listIntents({
-        mcpProfile: args.mcpProfile,
-        bundleId: args.bundleId,
-        partnerProfile: args.partnerProfile,
-      }));
+      {
+        const module = loadPrivateMcpModule('intentRouter');
+        if (!module) return unavailablePrivateMcpFeature('list_intents');
+        return toTextResult(module.listIntents({
+          mcpProfile: args.mcpProfile,
+          bundleId: args.bundleId,
+          partnerProfile: args.partnerProfile,
+        }));
+      }
     case 'plan_intent':
-      return toTextResult(planIntent({
-        intentId: args.intentId,
-        context: args.context || '',
-        mcpProfile: args.mcpProfile,
-        bundleId: args.bundleId,
-        partnerProfile: args.partnerProfile,
-        delegationMode: args.delegationMode,
-        approved: args.approved === true,
-        repoPath: args.repoPath,
-      }));
-    case 'start_handoff':
-      return toTextResult(startHandoff({
-        plan: planIntent({
+      {
+        const module = loadPrivateMcpModule('intentRouter');
+        if (!module) return unavailablePrivateMcpFeature('plan_intent');
+        return toTextResult(module.planIntent({
           intentId: args.intentId,
           context: args.context || '',
           mcpProfile: args.mcpProfile,
           bundleId: args.bundleId,
           partnerProfile: args.partnerProfile,
-          delegationMode: 'sequential',
+          delegationMode: args.delegationMode,
           approved: args.approved === true,
           repoPath: args.repoPath,
-        }),
-        context: args.context || '',
-        mcpProfile: args.mcpProfile || getActiveMcpProfile(),
-        partnerProfile: args.partnerProfile || null,
-        repoPath: args.repoPath,
-        delegateProfile: args.delegateProfile || null,
-        plannedChecks: Array.isArray(args.plannedChecks) ? args.plannedChecks : [],
-      }));
+        }));
+      }
+    case 'start_handoff':
+      {
+        const intentRouter = loadPrivateMcpModule('intentRouter');
+        const delegationRuntime = loadPrivateMcpModule('delegationRuntime');
+        if (!intentRouter || !delegationRuntime) return unavailablePrivateMcpFeature('start_handoff');
+        return toTextResult(delegationRuntime.startHandoff({
+          plan: intentRouter.planIntent({
+            intentId: args.intentId,
+            context: args.context || '',
+            mcpProfile: args.mcpProfile,
+            bundleId: args.bundleId,
+            partnerProfile: args.partnerProfile,
+            delegationMode: 'sequential',
+            approved: args.approved === true,
+            repoPath: args.repoPath,
+          }),
+          context: args.context || '',
+          mcpProfile: args.mcpProfile || getActiveMcpProfile(),
+          partnerProfile: args.partnerProfile || null,
+          repoPath: args.repoPath,
+          delegateProfile: args.delegateProfile || null,
+          plannedChecks: Array.isArray(args.plannedChecks) ? args.plannedChecks : [],
+        }));
+      }
     case 'complete_handoff':
-      return toTextResult(completeHandoff({
-        handoffId: args.handoffId,
-        outcome: args.outcome,
-        resultContext: args.resultContext || '',
-        attempts: args.attempts,
-        violationCount: args.violationCount,
-        tokenEstimate: args.tokenEstimate,
-        latencyMs: args.latencyMs,
-        summary: args.summary || '',
-      }));
+      {
+        const module = loadPrivateMcpModule('delegationRuntime');
+        if (!module) return unavailablePrivateMcpFeature('complete_handoff');
+        return toTextResult(module.completeHandoff({
+          handoffId: args.handoffId,
+          outcome: args.outcome,
+          resultContext: args.resultContext || '',
+          attempts: args.attempts,
+          violationCount: args.violationCount,
+          tokenEstimate: args.tokenEstimate,
+          latencyMs: args.latencyMs,
+          summary: args.summary || '',
+        }));
+      }
     case 'enforcement_matrix':
       return toTextResult(listEnforcementMatrix());
     case 'security_scan': {
@@ -797,23 +871,33 @@ async function callToolInner(name, args) {
       });
     }
     case 'distribute_context_to_agents':
-      return toTextResult(distributeContextToAgents({
+      {
+        const module = loadPrivateMcpModule('swarmCoordinator');
+        if (!module) return unavailablePrivateMcpFeature('distribute_context_to_agents');
+        return toTextResult(module.distributeContextToAgents({
         query: args.query || '',
         agents: args.agents,
         maxItems: args.maxItems,
         maxChars: args.maxChars,
         namespaces: Array.isArray(args.namespaces) ? args.namespaces : [],
         ttlMs: args.ttlMs,
-      }));
+        }));
+      }
     case 'session_report':
-      return toTextResult(buildSessionReport({ windowHours: args.windowHours }));
+      {
+        const module = loadPrivateMcpModule('sessionReport');
+        if (!module) return unavailablePrivateMcpFeature('session_report');
+        return toTextResult(module.buildSessionReport({ windowHours: args.windowHours }));
+      }
     case 'generate_operator_artifact': {
-      const artifact = await generateOperatorArtifact({
+      const module = loadPrivateMcpModule('operatorArtifacts');
+      if (!module) return unavailablePrivateMcpFeature('generate_operator_artifact');
+      const artifact = await module.generateOperatorArtifact({
         type: args.type,
         windowHours: args.windowHours,
       });
       if (args.format === 'markdown') {
-        return toTextResult(formatArtifactMarkdown(artifact));
+        return toTextResult(module.formatArtifactMarkdown(artifact));
       }
       return toTextResult(artifact);
     }
@@ -827,20 +911,43 @@ async function callToolInner(name, args) {
         branchGovernance: getBranchGovernanceState(),
       }));
     case 'workflow_sentinel':
-      return toTextResult(evaluateWorkflowSentinel(args.toolName, {
+      {
+        const normalizedAction = normalizeProviderAction(args);
+        const changedFiles = Array.isArray(args.changedFiles) ? args.changedFiles : normalizedAction.affectedFiles;
+        return toTextResult(evaluateWorkflowSentinel(normalizedAction.toolName || args.toolName, {
         command: args.command,
         path: args.filePath,
-        changedFiles: Array.isArray(args.changedFiles) ? args.changedFiles : [],
+        changedFiles,
         repoPath: args.repoPath,
         baseBranch: args.baseBranch,
+        providerToolCall: args.providerToolCall,
+        toolCall: args.toolCall,
+        toolUse: args.toolUse,
+        content: args.content,
+        input: args.input,
+        arguments: args.arguments,
+        method: args.method,
+        params: args.params,
+        mcp: args.mcp,
+        mcpToolCall: args.mcpToolCall,
+        budget: args.budget,
+        usage: args.usage,
       }, {
+        provider: args.provider,
+        model: args.model,
+        normalizedAction,
+        usage: args.usage,
+        tokenEstimate: args.tokenEstimate,
+        costUsd: args.costUsd,
+        budget: args.budget,
         repoPath: args.repoPath,
         baseBranch: args.baseBranch,
-        affectedFiles: Array.isArray(args.changedFiles) ? args.changedFiles : undefined,
+        affectedFiles: changedFiles.length > 0 ? changedFiles : undefined,
         requirePrForReleaseSensitive: args.requirePrForReleaseSensitive === true,
         requireVersionNotBehindBase: args.requireVersionNotBehindBase === true,
         governanceState: getScopeState(),
       }));
+      }
     case 'register_claim_gate':
       return toTextResult(registerClaimGate(args.claimPattern, args.requiredActions, args.message));
     case 'gate_stats':
@@ -848,7 +955,11 @@ async function callToolInner(name, args) {
     case 'dashboard':
       return toTextResult(generateDashboard(getFeedbackPaths().FEEDBACK_DIR));
     case 'org_dashboard':
-      return toTextResult(generateOrgDashboard({ windowHours: Number(args.windowHours || 24) }));
+      {
+        const module = loadPrivateMcpModule('orgDashboard');
+        if (!module) return unavailablePrivateMcpFeature('org_dashboard');
+        return toTextResult(module.generateOrgDashboard({ windowHours: Number(args.windowHours || 24) }));
+      }
     case 'settings_status':
       return toTextResult(getSettingsStatus());
     case 'native_messaging_audit':
@@ -861,13 +972,15 @@ async function callToolInner(name, args) {
       enforceLimit('commerce_recall');
       return buildCommerceRecallResponse(args);
     case 'get_business_metrics': {
-      const { getBusinessMetrics } = require('../../scripts/semantic-layer');
-      const metrics = await getBusinessMetrics(args);
+      const module = loadPrivateMcpModule('semanticLayer');
+      if (!module) return unavailablePrivateMcpFeature('get_business_metrics');
+      const metrics = await module.getBusinessMetrics(args);
       return toTextResult(metrics);
     }
     case 'describe_semantic_entity': {
-      const { describeSemanticSchema } = require('../../scripts/semantic-layer');
-      const schema = describeSemanticSchema();
+      const module = loadPrivateMcpModule('semanticLayer');
+      if (!module) return unavailablePrivateMcpFeature('describe_semantic_entity');
+      const schema = module.describeSemanticSchema();
       const entity = schema.entities[args.type] || schema.metrics[args.type];
       if (!entity) {
         throw new Error(`Unknown semantic entity: ${args.type}`);
@@ -937,12 +1050,14 @@ async function callToolInner(name, args) {
     case 'finalize_feedback_session':
       return toTextResult(finalizeFeedbackSession(args.sessionId));
     case 'run_managed_lesson_agent': {
-      const { runManagedAgent } = require('../../scripts/managed-lesson-agent');
-      return toTextResult(await runManagedAgent({ dryRun: args.dryRun, limit: args.limit, model: args.model }));
+      const module = loadPrivateMcpModule('managedLessonAgent');
+      if (!module) return unavailablePrivateMcpFeature('run_managed_lesson_agent');
+      return toTextResult(await module.runManagedAgent({ dryRun: args.dryRun, limit: args.limit, model: args.model }));
     }
     case 'managed_agent_status': {
-      const { getManagedAgentStatus } = require('../../scripts/managed-lesson-agent');
-      return toTextResult(getManagedAgentStatus() || { message: 'No managed agent runs recorded yet.' });
+      const module = loadPrivateMcpModule('managedLessonAgent');
+      if (!module) return unavailablePrivateMcpFeature('managed_agent_status');
+      return toTextResult(module.getManagedAgentStatus() || { message: 'No managed agent runs recorded yet.' });
     }
     case 'run_self_distill': {
       const { runSelfDistill } = require('../../scripts/self-distill-agent');
@@ -953,8 +1068,13 @@ async function callToolInner(name, args) {
       return toTextResult(getSelfDistillStatus() || { message: 'No self-distill runs found.' });
     }
     case 'context_stuff_lessons': {
-      const { getAllLessonsForContext } = require('../../scripts/lesson-inference');
-      return toTextResult(getAllLessonsForContext({ maxTokenBudget: args.maxTokenBudget, signal: args.signal, format: args.format }));
+      const module = loadPrivateMcpModule('lessonInference');
+      if (!module) return unavailablePrivateMcpFeature('context_stuff_lessons');
+      return toTextResult(module.getAllLessonsForContext({
+        maxTokenBudget: args.maxTokenBudget,
+        signal: args.signal,
+        format: args.format,
+      }));
     }
     default:
       throw new Error(`Unsupported tool: ${name}`);
@@ -1175,4 +1295,10 @@ module.exports = {
   acquireLock,
   toCaptureFeedbackTextResult,
   formatCorrectiveActionsReminder,
+  __test__: {
+    PRIVATE_MCP_MODULES,
+    loadPrivateMcpModule,
+    unavailablePrivateMcpFeature,
+    callToolInner,
+  },
 };

package/adapters/opencode/opencode.json CHANGED Viewed

@@ -7,7 +7,7 @@
         "npx",
         "--yes",
         "--package",
-        "thumbgate@1.15.0",
+        "thumbgate@1.16.0",
         "thumbgate",
         "serve"
       ],

package/bench/prompt-eval-suite.json CHANGED Viewed

@@ -2,6 +2,10 @@
   "version": 1,
   "name": "ThumbGate Prompt Evaluation",
   "description": "Tests core ThumbGate prompts against expected outputs. Based on Anthropic prompt evaluation methodology: test against expected answers, compare versions, review outputs for errors.",
+  "successCriteria": {
+    "minAggregateScore": 80,
+    "requireNoRegressions": true
+  },
   "evaluations": [
     {
       "id": "lesson-distill-negative-clear",
@@ -81,7 +85,7 @@
         "hasDomain": true,
         "domain": "testing",
         "hasOutcome": true,
-        "outcomeContains": ["failure", "error"]
+        "outcomeContains": ["failure"]
       }
     },
     {