npm - @mcptoolshop/research-os - Versions diffs - 0.4.0 → 0.5.0 - Mend

@mcptoolshop/research-os 0.4.0 → 0.5.0

This diff shows the changes between publicly available versions of the package that have been released to one of the supported registries. It is provided for informational purposes only and reflects the differences between the package versions as they appear in their respective public registries.

Files changed (27)

package/CHANGELOG.md +134 -0
package/README.es.md +25 -2
package/README.fr.md +24 -1
package/README.hi.md +39 -1
package/README.it.md +25 -2
package/README.ja.md +24 -1
package/README.md +37 -1
package/README.pt-BR.md +24 -1
package/README.zh.md +25 -2
package/dist/calibration/aggregate-receipt-schema.d.ts +509 -0
package/dist/calibration/aggregate-receipt-schema.js +143 -0
package/dist/calibration/aggregate-receipt-schema.js.map +1 -0
package/dist/calibration/aggregate.d.ts +35 -0
package/dist/calibration/aggregate.js +454 -0
package/dist/calibration/aggregate.js.map +1 -0
package/dist/calibration/receipt-schema.d.ts +317 -0
package/dist/calibration/receipt-schema.js +68 -0
package/dist/calibration/receipt-schema.js.map +1 -0
package/dist/calibration/receipt.d.ts +31 -0
package/dist/calibration/receipt.js +151 -0
package/dist/calibration/receipt.js.map +1 -0
package/dist/cli.js +136 -9
package/dist/cli.js.map +1 -1
package/dist/index.d.ts +10 -1
package/dist/index.js +13 -6
package/dist/index.js.map +1 -1
package/package.json +1 -1

package/dist/cli.js CHANGED

@@ -3922,7 +3922,11 @@ var init_schema9 = __esm({
       finding_ids: z11.array(z11.string()),
       reviewer: ReviewerNameSchema,
       review_method: z11.string().min(1),
-      created_at: z11.string()
+      created_at: z11.string(),
+      // v0.5: optional profile lineage. Additive-optional — pre-v0.5 records
+      // without this field parse cleanly. Frozen packs unaffected (Zod .optional()
+      // with no .default() leaves absent keys absent on round-trip).
+      profile: z11.string().optional()
     });
     ReviewSnapshotSchema = z11.object({
       section_id: z11.string().regex(/^[0-9]{2}-[a-z0-9-]+$/),
@@ -5925,7 +5929,7 @@ function pickHighestPriority(decisions) {
   return "accepted_for_synthesis";
 }
 function deriveClaimReviews(args) {
-  const { claims, findings, reviewer, reviewMethod, activeSectionWaivers } = args;
+  const { claims, findings, reviewer, reviewMethod, activeSectionWaivers, profile } = args;
   const reviews = [];
   const now = (/* @__PURE__ */ new Date()).toISOString();
   const monopolyWaived = Array.isArray(activeSectionWaivers) && activeSectionWaivers.some((w) => w.scope === "min_independent_publishers");
@@ -5940,7 +5944,8 @@ function deriveClaimReviews(args) {
         finding_ids: [],
         reviewer,
         review_method: reviewMethod,
-        created_at: now
+        created_at: now,
+        ...profile !== void 0 ? { profile } : {}
       });
       continue;
     }
@@ -5974,7 +5979,8 @@ function deriveClaimReviews(args) {
       finding_ids: claimFindings.map((f) => f.finding_id),
       reviewer,
       review_method: reviewMethod,
-      created_at: now
+      created_at: now,
+      ...profile !== void 0 ? { profile } : {}
     });
   }
   return reviews;
@@ -6470,7 +6476,8 @@ async function finalizeReview(args) {
     findings: dedupedFindings,
     reviewer: args.reviewer,
     reviewMethod: args.reviewMethod,
-    activeSectionWaivers
+    activeSectionWaivers,
+    profile: args.profile !== DEFAULT_PROFILE ? args.profile : void 0
   });
   const decisionCounts = {
     accepted_for_synthesis: 0,
@@ -7543,8 +7550,8 @@ async function syncRepoKnowledge(options) {
     };
   }
   const exportResult = await exportRepoKnowledge({ packPath });
-  const { readFile: readFile26 } = await import("fs/promises");
-  const text = await readFile26(exportResult.outPath, "utf8");
+  const { readFile: readFile27 } = await import("fs/promises");
+  const text = await readFile27(exportResult.outPath, "utf8");
   const facts = text.split(/\r?\n/).filter((l) => l.trim().length > 0).map((l) => JSON.parse(l));
   try {
     const r = await rk.ingestFacts({ facts, namespace: "research-os" });
@@ -12192,7 +12199,7 @@ var init_src = __esm({
     init_triage();
     init_discover();
     init_errors();
-    RESEARCH_OS_VERSION = "0.4.0";
+    RESEARCH_OS_VERSION = "0.5.0";
   }
 });
@@ -13406,6 +13413,115 @@ async function applySourceCardOverrides(packPath, fromFile) {
 // src/cli.ts
 init_errors();
 init_src();
+// src/calibration/lookup.ts
+import { existsSync as existsSync33 } from "fs";
+import { readFile as readFile26 } from "fs/promises";
+import { join as join34 } from "path";
+// src/calibration/receipt-schema.ts
+import { z as z25 } from "zod";
+var StatusLabelSchema = z25.enum([
+  "trusted_baseline",
+  "conditional_pass",
+  "failed",
+  "comparison_only"
+]);
+var ArchitectureSchema = z25.enum(["single-pass", "two-pass"]);
+var RecallSchema = z25.object({
+  matched: z25.number().int().nonnegative(),
+  total: z25.number().int().nonnegative(),
+  ratio: z25.number().min(0).max(1)
+});
+var PerCategoryRecallSchema = z25.record(z25.string(), RecallSchema);
+var PassFailSchema = z25.object({
+  fp_ceiling: z25.enum(["PASS", "FAIL"]),
+  any_flag_recall_floor: z25.enum(["PASS", "FAIL"]),
+  per_category_any_flag_floor: z25.enum(["PASS", "FAIL"]),
+  strict_recall_floor: z25.enum(["PASS", "FAIL"]),
+  decision_vocab_completeness: z25.enum(["PASS", "FAIL"]),
+  latency_soft: z25.enum(["PASS", "WARN"]),
+  latency_hard: z25.enum(["PASS", "FAIL"]),
+  empty_or_malformed: z25.enum(["PASS", "FAIL"]),
+  overall: z25.enum(["PASS", "FAIL"])
+});
+var DecisionVocabBarSchema = z25.object({
+  architecture: ArchitectureSchema,
+  required: z25.number().int().positive(),
+  produced: z25.number().int().nonnegative(),
+  passed: z25.boolean()
+});
+var CalibrationReceiptSchema = z25.object({
+  schema_version: z25.literal(1),
+  profile_name: z25.string(),
+  status: StatusLabelSchema,
+  model: z25.string(),
+  architecture: ArchitectureSchema,
+  fixture: z25.string(),
+  fixture_total_claims: z25.number().int().positive(),
+  fixture_good_claims: z25.number().int().nonnegative(),
+  fixture_bad_claims: z25.number().int().nonnegative(),
+  calibrated_at: z25.string(),
+  research_os_version: z25.string(),
+  runtime_ms: z25.number().int().nonnegative(),
+  good_fp_count: z25.number().int().nonnegative(),
+  any_flag_recall: RecallSchema,
+  strict_recall: RecallSchema,
+  per_category_any_flag: PerCategoryRecallSchema,
+  per_category_strict: PerCategoryRecallSchema,
+  decision_vocabulary: z25.record(z25.string(), z25.number().int().nonnegative()),
+  decisions_produced_count: z25.number().int().nonnegative(),
+  decision_vocab_bar: DecisionVocabBarSchema,
+  unreachable_decisions: z25.array(z25.string()),
+  empty_or_malformed_responses: z25.number().int().nonnegative(),
+  pass_fail: PassFailSchema,
+  notes: z25.array(z25.string())
+});
+// src/calibration/receipt.ts
+function receiptToCalibrationSummary(receipt) {
+  const fp = receipt.good_fp_count;
+  const fpTotal = receipt.fixture_good_claims;
+  const fpPct = fpTotal > 0 ? Math.round(fp / fpTotal * 100) : 0;
+  const af = receipt.any_flag_recall;
+  const sr = receipt.strict_recall;
+  const unsupported = receipt.per_category_any_flag["unsupported_claim"];
+  return {
+    fixture: receipt.fixture,
+    good_false_positive_rate: `${fp}/${fpTotal} (${fpPct}%)`,
+    bad_any_flag_recall: `${af.matched}/${af.total} (${Math.round(af.ratio * 100)}%)`,
+    strict_category_recall: `${sr.matched}/${sr.total} (${Math.round(sr.ratio * 100)}%)`,
+    unsupported_claim_recall: unsupported ? `${unsupported.matched}/${unsupported.total} (${Math.round(unsupported.ratio * 100)}%)` : null,
+    notes: `status=${receipt.status} model=${receipt.model} arch=${receipt.architecture} overall=${receipt.pass_fail.overall} decisions=${receipt.decisions_produced_count}/6`
+  };
+}
+// src/calibration/lookup.ts
+async function loadReceiptForPack(packDir, profile) {
+  const receiptPath = receiptPathForPack(packDir, profile);
+  if (!existsSync33(receiptPath)) return null;
+  let raw;
+  try {
+    raw = JSON.parse(await readFile26(receiptPath, "utf8"));
+  } catch (err) {
+    throw new Error(
+      `Invalid calibration receipt at ${receiptPath}: ${err.message}`,
+      { cause: err }
+    );
+  }
+  const result = CalibrationReceiptSchema.safeParse(raw);
+  if (!result.success) {
+    throw new Error(
+      `Invalid calibration receipt at ${receiptPath}: ${result.error.message}`
+    );
+  }
+  return receiptToCalibrationSummary(result.data);
+}
+function receiptPathForPack(packDir, profile) {
+  return join34(packDir, "calibration", "reviewer-profiles", profile, "seeded-v1.json");
+}
+// src/cli.ts
 function reportError(err) {
   if (err instanceof ResearchOSError) {
     process.stderr.write(`research-os: ${err.code}: ${err.message}
@@ -14435,7 +14551,8 @@ program.command("review-promote").description(
   false
 ).action(async (section, opts) => {
   try {
-    const calibration = opts.calibrationFixture || opts.goodFp || opts.anyFlagRecall || opts.strictCatRecall || opts.unsupportedRecall || opts.calibrationNotes ? {
+    const explicitCalibration = opts.calibrationFixture || opts.goodFp || opts.anyFlagRecall || opts.strictCatRecall || opts.unsupportedRecall || opts.calibrationNotes;
+    let calibration = explicitCalibration ? {
       fixture: opts.calibrationFixture ?? null,
       good_false_positive_rate: opts.goodFp ?? null,
       bad_any_flag_recall: opts.anyFlagRecall ?? null,
@@ -14443,6 +14560,16 @@ program.command("review-promote").description(
       unsupported_claim_recall: opts.unsupportedRecall ?? null,
       notes: opts.calibrationNotes ?? null
     } : null;
+    if (!explicitCalibration) {
+      const summary = await loadReceiptForPack(opts.pack, opts.profile);
+      if (summary !== null) {
+        calibration = summary;
+        process.stdout.write(
+          `  [auto] calibration_summary populated from ${receiptPathForPack(opts.pack, opts.profile)}
+`
+        );
+      }
+    }
     const result = await promote({
       sectionId: section,
       packPath: opts.pack,