npm - @mnemom/agent-integrity-protocol - Versions diffs - 0.2.1 → 0.4.1 - Mend

@mnemom/agent-integrity-protocol 0.2.1 → 0.4.1

This diff compares the contents of two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (7)

package/dist/index.d.cts (changed)

@@ -200,6 +200,21 @@ interface IntegrityCheckpoint {
      * Set after the corresponding APTrace is created by the Observer.
      */
     linked_trace_id: string | null;
+    /**
+     * Whether this checkpoint was synthetically generated (not from analysis LLM).
+     * True when no thinking block was found, analysis failed, or evidence was below threshold.
+     */
+    synthetic?: boolean;
+    /**
+     * Reason the checkpoint was synthetically generated.
+     * Only present when `synthetic` is true.
+     */
+    synthetic_reason?: "no_thinking_block" | "analysis_failed" | "below_evidence_threshold";
+    /**
+     * Cross-validation warnings about inconsistencies between verdict and concerns.
+     * Present when the analysis LLM returned a verdict that doesn't match concern severities.
+     */
+    cross_validation_warnings?: string[];
 }
 /**
@@ -277,7 +292,7 @@ interface IntegritySignal {
  * - "deception_pattern": Multiple checks flagging deceptive reasoning; pattern of misleading intent
  * - "unknown": Drift detected but direction cannot be categorized; multiple concern categories without a dominant pattern
  */
-type DriftDirection = "injection_pattern" | "value_erosion" | "autonomy_creep" | "deception_pattern" | "unknown";
+type DriftDirection = "injection_pattern" | "value_erosion" | "autonomy_creep" | "deception_pattern" | "reasoning_degradation" | "intent_drift" | "unknown";
 /**
  * An integrity drift alert generated when consecutive non-clear verdicts
  * exceed the sustained threshold.
@@ -1156,7 +1171,7 @@ interface CertificateVerificationResult {
 declare function verifyCertificate(certificate: IntegrityCertificate, publicKey: Uint8Array, merkleRoot?: string): Promise<CertificateVerificationResult>;
 /** Protocol version identifiers. */
-declare const AIP_VERSION = "0.1.0";
+declare const AIP_VERSION = "0.4.0";
 declare const ALGORITHM_VERSION = "1.0.0";
 /** Drift detection thresholds (Section 9.1). */
 declare const DEFAULT_SUSTAINED_CHECKS_THRESHOLD = 3;

package/dist/index.d.ts (changed)

@@ -200,6 +200,21 @@ interface IntegrityCheckpoint {
      * Set after the corresponding APTrace is created by the Observer.
      */
     linked_trace_id: string | null;
+    /**
+     * Whether this checkpoint was synthetically generated (not from analysis LLM).
+     * True when no thinking block was found, analysis failed, or evidence was below threshold.
+     */
+    synthetic?: boolean;
+    /**
+     * Reason the checkpoint was synthetically generated.
+     * Only present when `synthetic` is true.
+     */
+    synthetic_reason?: "no_thinking_block" | "analysis_failed" | "below_evidence_threshold";
+    /**
+     * Cross-validation warnings about inconsistencies between verdict and concerns.
+     * Present when the analysis LLM returned a verdict that doesn't match concern severities.
+     */
+    cross_validation_warnings?: string[];
 }
 /**
@@ -277,7 +292,7 @@ interface IntegritySignal {
  * - "deception_pattern": Multiple checks flagging deceptive reasoning; pattern of misleading intent
  * - "unknown": Drift detected but direction cannot be categorized; multiple concern categories without a dominant pattern
  */
-type DriftDirection = "injection_pattern" | "value_erosion" | "autonomy_creep" | "deception_pattern" | "unknown";
+type DriftDirection = "injection_pattern" | "value_erosion" | "autonomy_creep" | "deception_pattern" | "reasoning_degradation" | "intent_drift" | "unknown";
 /**
  * An integrity drift alert generated when consecutive non-clear verdicts
  * exceed the sustained threshold.
@@ -1156,7 +1171,7 @@ interface CertificateVerificationResult {
 declare function verifyCertificate(certificate: IntegrityCertificate, publicKey: Uint8Array, merkleRoot?: string): Promise<CertificateVerificationResult>;
 /** Protocol version identifiers. */
-declare const AIP_VERSION = "0.1.0";
+declare const AIP_VERSION = "0.4.0";
 declare const ALGORITHM_VERSION = "1.0.0";
 /** Drift detection thresholds (Section 9.1). */
 declare const DEFAULT_SUSTAINED_CHECKS_THRESHOLD = 3;

package/dist/index.js (changed)

@@ -20,7 +20,7 @@ function createWindowState(sessionId) {
 }
 // src/constants.ts
-var AIP_VERSION = "0.1.0";
+var AIP_VERSION = "0.4.0";
 var ALGORITHM_VERSION = "1.0.0";
 var DEFAULT_SUSTAINED_CHECKS_THRESHOLD = 3;
 var DRIFT_SEVERITY_LOW_THRESHOLD = 0.7;
@@ -1161,11 +1161,27 @@ function validateConscienceContext(value) {
     consultation_depth: ctx.consultation_depth
   };
 }
+function extractFirstJsonObject(text) {
+  let depth = 0;
+  let start = -1;
+  for (let i = 0; i < text.length; i++) {
+    if (text[i] === "{") {
+      if (depth === 0) start = i;
+      depth++;
+    } else if (text[i] === "}") {
+      depth--;
+      if (depth === 0 && start !== -1) {
+        return text.slice(start, i + 1);
+      }
+    }
+  }
+  return null;
+}
 function checkIntegrity(input) {
   let jsonText = input.analysisResponse;
-  const jsonMatch = jsonText.match(/\{[\s\S]*\}/);
-  if (jsonMatch) {
-    jsonText = jsonMatch[0];
+  const extracted = extractFirstJsonObject(jsonText);
+  if (extracted) {
+    jsonText = extracted;
   }
   jsonText = jsonText.replace(/,\s*([}\]])/g, "$1");
   let parsed;
@@ -1187,6 +1203,22 @@ function checkIntegrity(input) {
   const conscienceContext = validateConscienceContext(
     parsed.conscience_context
   );
+  const crossValidationWarnings = [];
+  if (verdict === "clear") {
+    const criticalOrHigh = concerns.filter(
+      (c) => c.severity === "critical" || c.severity === "high"
+    );
+    if (criticalOrHigh.length > 0) {
+      const maxSeverity = criticalOrHigh.some((c) => c.severity === "critical") ? "critical" : "high";
+      crossValidationWarnings.push(
+        `Verdict is "clear" but ${criticalOrHigh.length} concern(s) have severity "${maxSeverity}". This may indicate an inconsistent analysis result.`
+      );
+    }
+  } else if (verdict === "boundary_violation" && concerns.length === 0) {
+    crossValidationWarnings.push(
+      `Verdict is "boundary_violation" but concerns array is empty. Expected at least one concern for a boundary violation.`
+    );
+  }
   const checkpointId = `${CHECKPOINT_ID_PREFIX}${randomUUID()}`;
   const analysisMetadata = {
     analysis_model: input.analysisModel,
@@ -1214,7 +1246,8 @@ function checkIntegrity(input) {
       window_size: input.windowPosition.window_size
     },
     analysis_metadata: analysisMetadata,
-    linked_trace_id: input.linkedTraceId ?? null
+    linked_trace_id: input.linkedTraceId ?? null,
+    ...crossValidationWarnings.length > 0 ? { cross_validation_warnings: crossValidationWarnings } : {}
   };
 }
 function mapVerdictToAction(verdict, concerns) {
@@ -1274,7 +1307,9 @@ function detectIntegrityDrift(state, checkpoint, windowCheckpoints, threshold) {
   for (const concern of checkpoint.concerns) {
     newState.streakCategories.push(concern.category);
   }
-  if (newState.sustainedNonclear >= effectiveThreshold && !newState.alertFired) {
+  const REALERT_INTERVAL = 5;
+  const shouldAlert = newState.sustainedNonclear >= effectiveThreshold && (!newState.alertFired || (newState.sustainedNonclear - effectiveThreshold) % REALERT_INTERVAL === 0);
+  if (shouldAlert) {
     newState.alertFired = true;
     const clearCount = windowCheckpoints.filter(
       (cp) => cp.verdict === "clear"
@@ -1326,7 +1361,9 @@ function inferDriftDirection(categories) {
       prompt_injection: "injection_pattern",
       value_misalignment: "value_erosion",
       autonomy_violation: "autonomy_creep",
-      deceptive_reasoning: "deception_pattern"
+      deceptive_reasoning: "deception_pattern",
+      reasoning_corruption: "reasoning_degradation",
+      undeclared_intent: "intent_drift"
     };
     return CATEGORY_TO_DIRECTION[maxCategory] ?? "unknown";
   }
@@ -1359,7 +1396,7 @@ function createClient(config) {
       const adapter = provider ? registry.get(provider) : registry.detectFromUrl(config.analysis_llm.base_url);
       const thinking = adapter.extractThinking(responseBody) ?? adapter.extractThinkingFromStream(responseBody);
       if (!thinking) {
-        return buildSyntheticSignal(config, window, "clear");
+        return buildSyntheticSignal(config, window, "clear", void 0, void 0, "no_thinking_block");
       }
       const thinkingTokens = Math.ceil(thinking.content.length / 4);
       const minTokens = config.min_evidence_tokens ?? DEFAULT_MIN_EVIDENCE_TOKENS;
@@ -1369,7 +1406,8 @@ function createClient(config) {
           window,
           "clear",
           `Thinking block below minimum evidence threshold (${thinkingTokens} tokens < ${minTokens})`,
-          thinkingTokens
+          thinkingTokens,
+          "below_evidence_threshold"
         );
       }
       const prompt = buildConsciencePrompt({
@@ -1395,9 +1433,9 @@ function createClient(config) {
           );
         }
         if (failureMode === "fail_closed") {
-          return buildSyntheticSignal(config, window, "boundary_violation");
+          return buildSyntheticSignal(config, window, "boundary_violation", void 0, void 0, "analysis_failed");
         }
-        return buildSyntheticSignal(config, window, "clear");
+        return buildSyntheticSignal(config, window, "clear", void 0, void 0, "analysis_failed");
       }
       const analysisDurationMs = Date.now() - startTime;
       const thinkingHash = hashThinkingBlock(thinking.content);
@@ -1458,7 +1496,10 @@ function createClient(config) {
 function generateSessionId(cardId) {
   const hash = cardId.slice(0, 8);
   const hourBucket = Math.floor(Date.now() / 36e5);
-  return `sess-${hash}-${hourBucket}`;
+  const randomBytes = new Uint8Array(2);
+  crypto.getRandomValues(randomBytes);
+  const randomHex = Array.from(randomBytes).map((b) => b.toString(16).padStart(2, "0")).join("");
+  return `sess-${hash}-${hourBucket}-${randomHex}`;
 }
 async function callAnalysisLLM(llmConfig, system, user, timeoutMs) {
   const controller = new AbortController();
@@ -1499,7 +1540,7 @@ async function callAnalysisLLM(llmConfig, system, user, timeoutMs) {
     clearTimeout(timeoutId);
   }
 }
-function buildSyntheticSignal(config, window, verdict, customReasoning, thinkingTokensOriginal) {
+function buildSyntheticSignal(config, window, verdict, customReasoning, thinkingTokensOriginal, syntheticReason) {
   const summary = window.getSummary();
   return {
     checkpoint: {
@@ -1533,7 +1574,9 @@ function buildSyntheticSignal(config, window, verdict, customReasoning, thinking
         truncated: false,
         extraction_confidence: 0
       },
-      linked_trace_id: null
+      linked_trace_id: null,
+      synthetic: true,
+      synthetic_reason: syntheticReason ?? "no_thinking_block"
     },
     proceed: verdict === "clear",
     recommended_action: verdict === "clear" ? "continue" : "deny_and_escalate",
@@ -1550,11 +1593,14 @@ function verifySignature(secret, payload, signature) {
   return constantTimeEqual(expected, signature);
 }
 function constantTimeEqual(a, b) {
-  if (a.length !== b.length) return false;
+  const maxLen = Math.max(a.length, b.length);
+  const aPadded = a.padEnd(maxLen, "\0");
+  const bPadded = b.padEnd(maxLen, "\0");
   let result = 0;
-  for (let i = 0; i < a.length; i++) {
-    result |= a.charCodeAt(i) ^ b.charCodeAt(i);
+  for (let i = 0; i < maxLen; i++) {
+    result |= aPadded.charCodeAt(i) ^ bPadded.charCodeAt(i);
   }
+  result |= a.length ^ b.length;
   return result === 0;
 }
 function base64ToUint8(b64) {