npm - thumbgate - Versions diffs - 1.15.0 → 1.16.1 - Mend

thumbgate 1.15.0 → 1.16.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (129)

package/.claude-plugin/marketplace.json +6 -6
package/.claude-plugin/plugin.json +3 -3
package/.well-known/llms.txt +5 -5
package/.well-known/mcp/server-card.json +1 -1
package/README.md +59 -35
package/adapters/chatgpt/openapi.yaml +118 -2
package/adapters/claude/.mcp.json +2 -2
package/adapters/mcp/server-stdio.js +210 -84
package/adapters/opencode/opencode.json +1 -1
package/bench/prompt-eval-suite.json +5 -1
package/bin/cli.js +157 -8
package/config/evals/agent-safety-eval.json +338 -22
package/config/gates/routine.json +43 -0
package/config/github-about.json +3 -3
package/config/model-candidates.json +131 -0
package/openapi/openapi.yaml +118 -2
package/package.json +57 -49
package/public/blog.html +7 -7
package/public/codex-plugin.html +6 -6
package/public/compare.html +29 -23
package/public/dashboard.html +82 -10
package/public/guide.html +28 -28
package/public/index.html +216 -98
package/public/learn.html +50 -22
package/public/lessons.html +1 -1
package/public/numbers.html +17 -17
package/public/pro.html +82 -18
package/scripts/agent-audit-trace.js +55 -0
package/scripts/agent-memory-lifecycle.js +96 -0
package/scripts/agent-readiness-plan.js +118 -0
package/scripts/agentic-data-pipeline.js +21 -1
package/scripts/agents-sdk-sandbox-plan.js +57 -0
package/scripts/ai-org-governance.js +98 -0
package/scripts/ai-search-distribution.js +43 -0
package/scripts/artifact-agent-plan.js +81 -0
package/scripts/billing.js +27 -8
package/scripts/cli-schema.js +18 -2
package/scripts/code-mode-mcp-plan.js +71 -0
package/scripts/context-engine.js +1 -2
package/scripts/context-manager.js +4 -1
package/scripts/dashboard-render-spec.js +1 -1
package/scripts/dashboard.js +275 -9
package/scripts/decision-journal.js +13 -3
package/scripts/document-workflow-governance.js +62 -0
package/scripts/enterprise-agent-rollout.js +34 -0
package/scripts/experience-replay-governance.js +69 -0
package/scripts/export-hf-dataset.js +1 -1
package/scripts/feedback-loop.js +92 -4
package/scripts/feedback-to-rules.js +17 -23
package/scripts/gates-engine.js +4 -6
package/scripts/growth-campaigns.js +49 -0
package/scripts/harness-selector.js +16 -4
package/scripts/hybrid-supervisor-agent.js +64 -0
package/scripts/inference-cache-policy.js +72 -0
package/scripts/inference-economics.js +53 -0
package/scripts/internal-agent-bootstrap.js +12 -2
package/scripts/knowledge-layer-plan.js +108 -0
package/scripts/lesson-inference.js +183 -44
package/scripts/lesson-search.js +4 -1
package/scripts/llm-client.js +157 -26
package/scripts/mailer/resend-mailer.js +112 -1
package/scripts/mcp-transport-strategy.js +66 -0
package/scripts/memory-store-governance.js +60 -0
package/scripts/meta-agent-loop.js +7 -13
package/scripts/model-access-eligibility.js +38 -0
package/scripts/model-migration-readiness.js +55 -0
package/scripts/operational-integrity.js +96 -3
package/scripts/otel-declarative-config.js +56 -0
package/scripts/perplexity-client.js +1 -1
package/scripts/post-training-governance.js +34 -0
package/scripts/private-core-boundary.js +72 -0
package/scripts/production-agent-readiness.js +40 -0
package/scripts/prompt-eval.js +564 -32
package/scripts/prompt-programs.js +93 -0
package/scripts/provider-action-normalizer.js +585 -0
package/scripts/scaling-law-claims.js +60 -0
package/scripts/security-scanner.js +1 -1
package/scripts/self-distill-agent.js +7 -32
package/scripts/seo-gsd.js +232 -55
package/scripts/skill-rag-router.js +53 -0
package/scripts/spec-gate.js +1 -1
package/scripts/student-consistent-training.js +73 -0
package/scripts/synthetic-data-provenance.js +98 -0
package/scripts/task-context-result.js +81 -0
package/scripts/telemetry-analytics.js +149 -0
package/scripts/thompson-sampling.js +2 -2
package/scripts/token-savings.js +7 -6
package/scripts/token-tco.js +46 -0
package/scripts/tool-registry.js +63 -3
package/scripts/verification-loop.js +10 -1
package/scripts/verifier-scoring.js +71 -0
package/scripts/workflow-sentinel.js +284 -28
package/scripts/workspace-agent-routines.js +118 -0
package/src/api/server.js +381 -120
package/scripts/analytics-report.js +0 -328
package/scripts/autonomous-workflow.js +0 -377
package/scripts/billing-setup.js +0 -109
package/scripts/creator-campaigns.js +0 -239
package/scripts/cross-encoder-reranker.js +0 -235
package/scripts/daemon-manager.js +0 -108
package/scripts/decision-trace.js +0 -354
package/scripts/delegation-runtime.js +0 -896
package/scripts/dispatch-brief.js +0 -159
package/scripts/distribution-surfaces.js +0 -110
package/scripts/feedback-history-distiller.js +0 -382
package/scripts/funnel-analytics.js +0 -35
package/scripts/history-distiller.js +0 -200
package/scripts/hosted-job-launcher.js +0 -256
package/scripts/intent-router.js +0 -392
package/scripts/lesson-reranker.js +0 -263
package/scripts/lesson-retrieval.js +0 -148
package/scripts/managed-lesson-agent.js +0 -183
package/scripts/operational-dashboard.js +0 -103
package/scripts/operational-summary.js +0 -129
package/scripts/operator-artifacts.js +0 -608
package/scripts/optimize-context.js +0 -17
package/scripts/org-dashboard.js +0 -206
package/scripts/partner-orchestration.js +0 -146
package/scripts/predictive-insights.js +0 -356
package/scripts/pulse.js +0 -80
package/scripts/reflector-agent.js +0 -221
package/scripts/sales-pipeline.js +0 -681
package/scripts/session-episode-store.js +0 -329
package/scripts/session-health-sensor.js +0 -242
package/scripts/session-report.js +0 -120
package/scripts/swarm-coordinator.js +0 -81
package/scripts/tool-kpi-tracker.js +0 -12
package/scripts/webhook-delivery.js +0 -62
package/scripts/workflow-sprint-intake.js +0 -475

package/scripts/tool-registry.js CHANGED Viewed

@@ -387,7 +387,7 @@ const TOOLS = [
   }),
   readOnlyTool({
     name: 'enforcement_matrix',
-    description: 'Show the full Enforcement Matrix: feedback pipeline stats, active pre-action gates, and rejection ledger with revival conditions.',
+    description: 'Show the full Enforcement Matrix: feedback pipeline stats, active pre-action checks, and rejection ledger with revival conditions.',
     inputSchema: {
       type: 'object',
       properties: {},
@@ -773,9 +773,69 @@ const TOOLS = [
     description: 'Predict pre-action workflow risk, blast radius, and remediations before a tool call executes.',
     inputSchema: {
       type: 'object',
-      required: ['toolName'],
       properties: {
-        toolName: { type: 'string', description: 'Tool being assessed, such as Bash, Edit, or Write' },
+        toolName: { type: 'string', description: 'Tool being assessed, such as Bash, Edit, or Write. Optional when provider-native tool call payload is supplied.' },
+        provider: { type: 'string', description: 'Optional provider name, such as anthropic, openai, codex, cursor, gemini, or mcp' },
+        model: { type: 'string', description: 'Optional model name used for audit evidence and budget review' },
+        providerToolCall: {
+          type: 'object',
+          additionalProperties: true,
+          description: 'Provider-native tool call object, including Anthropic tool_use or OpenAI function/tool call shapes',
+        },
+        content: {
+          type: 'array',
+          items: { type: 'object', additionalProperties: true },
+          description: 'Provider-native message content blocks; Anthropic tool_use blocks are normalized automatically',
+        },
+        method: { type: 'string', description: 'Optional JSON-RPC/MCP method, such as tools/call' },
+        params: {
+          type: 'object',
+          additionalProperties: true,
+          description: 'Optional JSON-RPC/MCP params, including tools/call name and arguments, resources/read URI, or prompts/get template arguments',
+        },
+        usage: {
+          type: 'object',
+          additionalProperties: true,
+          description: 'Provider token/cost usage, such as input_tokens, output_tokens, or total_tokens',
+        },
+        tokenEstimate: { type: 'number', description: 'Estimated total tokens for this action when provider usage is unavailable' },
+        costUsd: { type: 'number', description: 'Estimated USD cost for this action when provider usage is unavailable' },
+        budget: {
+          type: 'object',
+          additionalProperties: true,
+          description: 'Optional per-action budget controls: maxTokensPerAction, remainingTokens, maxCostUsdPerAction, remainingCostUsd, maxParallelBranches',
+        },
+        workflowPattern: {
+          type: 'string',
+          enum: ['single_action', 'chaining', 'routing', 'parallelization', 'evaluator-optimizer', 'agent'],
+          description: 'Optional workflow architecture hint. Agents require inspection evidence; predefined workflows are easier to evaluate.',
+        },
+        workflow: {
+          type: 'object',
+          additionalProperties: true,
+          description: 'Optional workflow metadata: pattern, steps, routes, branches, tools, inspection, and verification evidence.',
+        },
+        goal: { type: 'string', description: 'Optional agent goal for open-ended tool planning.' },
+        tools: {
+          type: 'array',
+          items: { type: 'string' },
+          description: 'Optional abstract/combinable tool names available to an open-ended agent.',
+        },
+        branches: {
+          type: 'array',
+          items: { type: 'string' },
+          description: 'Optional parallel workflow branches for fan-out budget and review checks.',
+        },
+        steps: {
+          type: 'array',
+          items: { type: 'string' },
+          description: 'Optional predefined workflow steps for chaining/evaluator workflow audit evidence.',
+        },
+        routes: {
+          type: 'array',
+          items: { type: 'string' },
+          description: 'Optional routing workflow destinations or classes.',
+        },
         command: { type: 'string', description: 'Optional shell command when toolName is Bash' },
         filePath: { type: 'string', description: 'Optional primary file path for edit-like tools' },
         changedFiles: {

package/scripts/verification-loop.js CHANGED Viewed

@@ -6,11 +6,20 @@ const {
   getFeedbackPaths,
   appendDiagnosticRecord,
 } = require('./feedback-loop');
+const { loadOptionalModule } = require('./private-core-boundary');
 const {
   buildPartnerStrategy,
   computePartnerReward,
   resolveVerificationRetries,
-} = require('./partner-orchestration');
+} = loadOptionalModule('./partner-orchestration', () => ({
+  buildPartnerStrategy: ({ partnerProfile } = {}) => ({
+    profile: partnerProfile || 'public-shell',
+    verificationMode: 'local-only',
+    recommendedChecks: [],
+  }),
+  computePartnerReward: () => 0,
+  resolveVerificationRetries: (requestedMaxRetries) => requestedMaxRetries,
+}));
 const {
   diagnoseFailure,
 } = require('./failure-diagnostics');

package/scripts/verifier-scoring.js ADDED Viewed

@@ -0,0 +1,71 @@
+'use strict';
/**
 * Build the rubric used to score verifier output with repeated, granular
 * LLM judgements.
 *
 * Invalid option values fall back to the defaults instead of being copied
 * into the rubric, because downstream scoring divides by `granularity` and
 * multiplies by `repeats`.
 *
 * @param {object} [options]
 * @param {string[]} [options.criteria] Non-empty list of criterion names.
 *   Anything else (missing, non-array, empty) selects the default criteria.
 * @param {number} [options.granularity=100] Upper bound of the raw score
 *   scale; must be a finite number greater than 0.
 * @param {number} [options.repeats=3] Verifications per criterion; must be a
 *   positive integer.
 * @param {number} [options.passThreshold=0.82] Minimum normalized score.
 * @returns {{rubricId: string, criteria: string[], granularity: number,
 *   repeats: number, scoring: string, passThreshold: number,
 *   caveats: string[]}} A freshly allocated rubric object.
 */
function buildVerifierScoringRubric(options = {}) {
  // The default parameter only covers `undefined`; an explicit `null` (or a
  // primitive) must not throw on property access.
  const opts = options !== null && typeof options === 'object' ? options : {};

  const hasCustomCriteria = Array.isArray(opts.criteria) && opts.criteria.length > 0;
  // Copy caller-supplied criteria so later mutation of the caller's array
  // cannot silently change the rubric.
  const criteria = hasCustomCriteria
    ? [...opts.criteria]
    : [
      'evidence_cited',
      'scope_respected',
      'tests_or_proof_run',
      'claim_matches_artifacts',
    ];

  // A zero or negative scale would turn raw scores into Infinity or negative
  // fractions once they are divided by it.
  const granularity = Number.isFinite(opts.granularity) && opts.granularity > 0
    ? opts.granularity
    : 100;

  // A repeat count is a number of verification runs, so it has to be a
  // positive whole number.
  const repeats = Number.isInteger(opts.repeats) && opts.repeats > 0
    ? opts.repeats
    : 3;

  const passThreshold = Number.isFinite(opts.passThreshold) ? opts.passThreshold : 0.82;

  return {
    rubricId: 'granular_llm_verifier',
    criteria,
    granularity,
    repeats,
    scoring: 'probability_weighted_average',
    passThreshold,
    caveats: [
      'calibrate against held-out human labels before production blocking',
      'fall back to coarse scores when model cannot expose score-token probabilities',
      'never use verifier score alone for destructive actions',
    ],
  };
}
/**
 * Aggregate repeated per-criterion verifier samples into a single score and
 * an allow/warn decision.
 *
 * Each entry of `scores` is expected to carry a `repeats` array of numeric
 * samples. A sample greater than 1 is treated as a raw value on the rubric's
 * `granularity` scale and divided by it; a sample of 1 or less is treated as
 * already normalized. (A raw score of exactly 1 on a 0..granularity scale is
 * therefore indistinguishable from a normalized 1.0.)
 *
 * The result is `allow` only when the mean normalized score reaches
 * `rubric.passThreshold` and no issue was recorded; every other outcome is
 * `warn`.
 *
 * @param {object} [input]
 * @param {Array<{repeats?: number[]}>} [input.scores] One entry per criterion.
 * @param {object} [input.rubric] Rubric with `criteria`, `granularity`,
 *   `repeats` and `passThreshold`; defaults to the standard rubric.
 * @returns {{score: number, decision: 'allow'|'warn', issues: string[]}}
 */
function computeVerifierScore({ scores = [], rubric = buildVerifierScoringRubric() } = {}) {
  // Tolerate a non-array `scores` and null/primitive entries instead of
  // throwing on property access.
  const entries = Array.isArray(scores) ? scores : [];
  const samplesPerEntry = entries.map((criterion) => {
    const hasRepeats = criterion !== null
      && typeof criterion === 'object'
      && Array.isArray(criterion.repeats);
    return hasRepeats ? criterion.repeats.filter((value) => Number.isFinite(value)) : [];
  });
  const flattened = samplesPerEntry.flat();
  if (flattened.length === 0) {
    return {
      score: 0,
      decision: 'warn',
      issues: ['missing_verifier_scores'],
    };
  }

  // A rubric without a criteria list, or without a usable scale when raw
  // samples need scaling, cannot produce a trustworthy score. Fail to `warn`
  // rather than throwing or letting a division by zero yield Infinity, which
  // would compare as passing.
  const rubricIsObject = rubric !== null && typeof rubric === 'object';
  const hasCriteria = rubricIsObject && Array.isArray(rubric.criteria);
  const hasScale = rubricIsObject
    && Number.isFinite(rubric.granularity)
    && rubric.granularity > 0;
  const needsScale = flattened.some((value) => value > 1);
  if (!hasCriteria || (needsScale && !hasScale)) {
    return {
      score: 0,
      decision: 'warn',
      issues: ['invalid_rubric'],
    };
  }

  // Clamp every sample into [0, 1] so a single out-of-range value cannot
  // outweigh genuinely low samples in the mean.
  const normalized = flattened.map((value) => {
    const fraction = value > 1 ? value / rubric.granularity : value;
    return Math.min(1, Math.max(0, fraction));
  });
  const score = normalized.reduce((sum, value) => sum + value, 0) / normalized.length;

  // A rubric without a numeric repeat count imposes no repeat requirement.
  const expectedRepeats = Number.isFinite(rubric.repeats) ? rubric.repeats : 0;
  const issues = [];
  if (entries.length < rubric.criteria.length) issues.push('missing_criteria_scores');
  // Check the total AND each entry: an over-sampled criterion must not hide
  // another criterion that was verified too few times.
  const totalShort = flattened.length < rubric.criteria.length * expectedRepeats;
  const anyEntryShort = samplesPerEntry.some((samples) => samples.length < expectedRepeats);
  if (totalShort || anyEntryShort) issues.push('missing_repeat_verifications');

  return {
    score: Number(score.toFixed(4)),
    decision: score >= rubric.passThreshold && issues.length === 0 ? 'allow' : 'warn',
    issues,
  };
}
/**
 * Check whether a verifier configuration meets the minimum requirements.
 *
 * Recorded issues:
 * - `too_few_criteria`: `criteria` is not an array of at least 3 items.
 * - `repeat_verification_required`: `repeats` is not a finite number >= 2.
 * - `heldout_calibration_required`: `heldoutCalibration` is falsy.
 * - `human_review_required_for_destructive_action`: `destructiveAction` is
 *   truthy while `humanReview` is falsy.
 *
 * @param {object} [setup]
 * @param {string[]} [setup.criteria]
 * @param {number} [setup.repeats]
 * @param {*} [setup.heldoutCalibration]
 * @param {*} [setup.destructiveAction]
 * @param {*} [setup.humanReview]
 * @returns {{decision: 'allow'|'warn', issues: string[]}} `allow` only when
 *   no issue was recorded.
 */
function evaluateVerifierSetup(setup = {}) {
  // The default parameter only covers `undefined`; an explicit `null` (or a
  // primitive) is treated as an empty setup instead of throwing.
  const config = setup !== null && typeof setup === 'object' ? setup : {};
  const issues = [];

  // Require a real array: a string would otherwise pass on its `.length`.
  const criteriaCount = Array.isArray(config.criteria) ? config.criteria.length : 0;
  if (criteriaCount < 3) issues.push('too_few_criteria');

  // Require a real number: a non-numeric string compares as NaN, and
  // `NaN < 2` is false, which would let an invalid repeat count pass.
  const hasEnoughRepeats = Number.isFinite(config.repeats) && config.repeats >= 2;
  if (!hasEnoughRepeats) issues.push('repeat_verification_required');

  if (!config.heldoutCalibration) issues.push('heldout_calibration_required');
  if (config.destructiveAction && !config.humanReview) {
    issues.push('human_review_required_for_destructive_action');
  }

  return {
    decision: issues.length ? 'warn' : 'allow',
    issues,
  };
}
+module.exports = {
+  buildVerifierScoringRubric,
+  computeVerifierScore,
+  evaluateVerifierSetup,
+};