@grainulation/harvest 1.0.1 → 1.0.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/lib/tokens.js ADDED
@@ -0,0 +1,317 @@
1
+ "use strict";
2
+
3
+ /**
4
+ * Token cost tracking and attribution.
5
+ *
6
+ * Tracks token consumption from Agent SDK data per sprint, per user, per model.
7
+ * Computes cost-per-verified-claim as the key efficiency metric.
8
+ *
9
+ * Agent SDK exposes: total_cost_usd, input_tokens, output_tokens,
10
+ * cache_creation_input_tokens, cache_read_input_tokens per query() call.
11
+ *
12
+ * Pricing (per MTok, Opus 4.6 defaults):
13
+ * input: $5.00
14
+ * output: $25.00
15
+ * cache_read: $0.50 (90% discount on input)
16
+ * cache_write: $6.25 (1.25x input)
17
+ */
18
+
19
/**
 * Per-MTok pricing table, keyed by model identifier.
 * Deep-frozen: this object is exported and shared, so the rate card must not
 * be mutated by consumers (use the `customPricing` parameter of computeCost
 * to override rates instead).
 */
const DEFAULT_PRICING = Object.freeze({
  "claude-opus-4-6": Object.freeze({
    input: 5.0,
    output: 25.0,
    cacheRead: 0.5,
    cacheWrite: 6.25,
  }),
  "claude-sonnet-4-6": Object.freeze({
    input: 3.0,
    output: 15.0,
    cacheRead: 0.3,
    cacheWrite: 3.75,
  }),
  "claude-haiku-4-5": Object.freeze({
    input: 0.8,
    output: 4.0,
    cacheRead: 0.08,
    cacheWrite: 1.0,
  }),
});

// Fallback model when a sprint's usage data does not record which model ran.
const DEFAULT_MODEL = "claude-opus-4-6";
41
+
42
/**
 * Compute cost from token counts and pricing.
 * @param {object} usage - { input_tokens, output_tokens, cache_read_input_tokens, cache_creation_input_tokens }
 * @param {string} [model] - Model identifier
 * @param {object} [customPricing] - Override pricing
 * @returns {object} - { totalCostUsd, breakdown, tokens }
 */
function computeCost(usage, model, customPricing) {
  // Resolve the rate card: caller overrides win, then the built-in table,
  // then the default model's rates as a last resort.
  const pricing =
    (customPricing && customPricing[model]) ||
    DEFAULT_PRICING[model] ||
    DEFAULT_PRICING[DEFAULT_MODEL];

  // Normalize missing counters to zero so partial usage records still price.
  const tokens = {
    input: usage.input_tokens || 0,
    output: usage.output_tokens || 0,
    cacheRead: usage.cache_read_input_tokens || 0,
    cacheWrite: usage.cache_creation_input_tokens || 0,
  };
  tokens.total =
    tokens.input + tokens.output + tokens.cacheRead + tokens.cacheWrite;

  // Rates are quoted per million tokens (MTok).
  const dollars = (count, ratePerMTok) => (count / 1_000_000) * ratePerMTok;
  const inputCost = dollars(tokens.input, pricing.input);
  const outputCost = dollars(tokens.output, pricing.output);
  const cacheReadCost = dollars(tokens.cacheRead, pricing.cacheRead);
  const cacheWriteCost = dollars(tokens.cacheWrite, pricing.cacheWrite);

  // Sum the unrounded components, then round once, to match per-field rounding.
  return {
    totalCostUsd: round6(
      inputCost + outputCost + cacheReadCost + cacheWriteCost,
    ),
    breakdown: {
      input: round6(inputCost),
      output: round6(outputCost),
      cacheRead: round6(cacheReadCost),
      cacheWrite: round6(cacheWriteCost),
    },
    tokens,
  };
}
85
+
86
/**
 * Analyze token economics across sprints.
 *
 * Each sprint may have a `tokenUsage` field (from Agent SDK interception)
 * or a `compilation.tokenUsage` field. Format:
 *   { input_tokens, output_tokens, cache_read_input_tokens,
 *     cache_creation_input_tokens, model, total_cost_usd }
 *
 * @param {Array} sprints - Sprint objects
 * @returns {object} - Token economics report: { summary, perSprint, insight }
 */
function analyzeTokens(sprints) {
  const sprintCosts = [];
  let totalCostUsd = 0;
  let totalTokens = 0;
  let totalClaims = 0;
  let totalVerifiedClaims = 0;

  for (const sprint of sprints) {
    const usage = extractUsage(sprint);
    // Guard: a sprint without a claims array must not crash the whole report.
    const claimCount = (sprint.claims || []).length;
    const verifiedCount = countVerifiedClaims(sprint);

    totalClaims += claimCount;
    totalVerifiedClaims += verifiedCount;

    if (!usage) {
      // No SDK usage data: record claim counts but leave cost fields null so
      // consumers can distinguish "unknown" from "$0".
      sprintCosts.push({
        sprint: sprint.name,
        cost: null,
        tokens: null,
        claimCount,
        verifiedClaims: verifiedCount,
        costPerClaim: null,
        costPerVerifiedClaim: null,
      });
      continue;
    }

    const model = usage.model || DEFAULT_MODEL;
    // Trust the SDK-reported total when present; otherwise derive it from
    // token counts and the pricing table. The breakdown only exists when
    // the cost was derived locally.
    const cost =
      usage.total_cost_usd != null
        ? {
            totalCostUsd: usage.total_cost_usd,
            breakdown: null,
            tokens: tokenSummary(usage),
          }
        : computeCost(usage, model);

    totalCostUsd += cost.totalCostUsd;
    totalTokens += cost.tokens.total;

    const costPerClaim =
      claimCount > 0 ? round6(cost.totalCostUsd / claimCount) : null;
    const costPerVerifiedClaim =
      verifiedCount > 0 ? round6(cost.totalCostUsd / verifiedCount) : null;

    sprintCosts.push({
      sprint: sprint.name,
      model,
      cost: cost.totalCostUsd,
      breakdown: cost.breakdown,
      tokens: cost.tokens,
      claimCount,
      verifiedClaims: verifiedCount,
      costPerClaim,
      costPerVerifiedClaim,
    });
  }

  // Cache efficiency: share of all input-side tokens that were cache reads.
  const totalCacheReads = sprintCosts.reduce(
    (a, s) => a + (s.tokens ? s.tokens.cacheRead : 0),
    0,
  );
  const totalInput = sprintCosts.reduce(
    (a, s) =>
      a +
      (s.tokens
        ? s.tokens.input + s.tokens.cacheRead + s.tokens.cacheWrite
        : 0),
    0,
  );
  const cacheHitRate =
    totalInput > 0 ? Math.round((totalCacheReads / totalInput) * 100) : null;

  // Averages are computed over sprints that actually had usage data.
  const sprintsWithCost = sprintCosts.filter((s) => s.cost !== null);
  const avgCostPerSprint =
    sprintsWithCost.length > 0
      ? round6(totalCostUsd / sprintsWithCost.length)
      : null;
  const costPerVerifiedClaim =
    totalVerifiedClaims > 0 ? round6(totalCostUsd / totalVerifiedClaims) : null;
  const costPerClaim =
    totalClaims > 0 ? round6(totalCostUsd / totalClaims) : null;

  return {
    summary: {
      totalSprints: sprints.length,
      sprintsWithUsageData: sprintsWithCost.length,
      totalCostUsd: round6(totalCostUsd),
      totalTokens,
      totalClaims,
      totalVerifiedClaims,
      costPerClaim,
      costPerVerifiedClaim,
      avgCostPerSprint,
      cacheHitRate,
    },
    perSprint: sprintCosts,
    insight: generateTokenInsight(
      sprintCosts,
      costPerVerifiedClaim,
      cacheHitRate,
    ),
  };
}
203
+
204
/**
 * Extract token usage data from a sprint.
 *
 * Checks three locations in priority order: the sprint itself, the
 * compilation metadata, then compilation.meta.
 * @param {object} sprint - Sprint object
 * @returns {object|null} - Usage record, or null when none is attached
 */
function extractUsage(sprint) {
  return (
    sprint.tokenUsage ||
    sprint.compilation?.tokenUsage ||
    sprint.compilation?.meta?.tokenUsage ||
    null
  );
}
223
+
224
/**
 * Count claims that survived compilation (verified).
 * A claim is "verified" if it has evidence >= documented, or status is active/resolved.
 * @param {object} sprint - Sprint object
 * @returns {number} - Verified claim count (0 when the sprint has no claims)
 */
function countVerifiedClaims(sprint) {
  // Compiled claim list is authoritative when present.
  if (sprint.compilation && sprint.compilation.claims) {
    return sprint.compilation.claims.length;
  }
  // Fallback: count claims with evidence better than stated/web.
  // Guard: sprints may lack a claims array entirely; treat that as zero
  // rather than throwing (the original crashed with a TypeError here).
  const claims = sprint.claims || [];
  return claims.filter((c) => {
    const tier = c.evidence || "stated";
    return tier !== "stated" && tier !== "web";
  }).length;
}
238
+
239
/**
 * Build a normalized token-count summary from a raw SDK usage record.
 * @param {object} usage - Raw usage record with snake_case counter fields
 * @returns {object} - { input, output, cacheRead, cacheWrite, total }
 */
function tokenSummary(usage) {
  // `|| 0` keeps null/undefined counters out of the arithmetic.
  const count = (v) => v || 0;
  const input = count(usage.input_tokens);
  const output = count(usage.output_tokens);
  const cacheRead = count(usage.cache_read_input_tokens);
  const cacheWrite = count(usage.cache_creation_input_tokens);
  return {
    input,
    output,
    cacheRead,
    cacheWrite,
    total: input + output + cacheRead + cacheWrite,
  };
}
252
+
253
/**
 * Turn per-sprint cost data into a short human-readable insight string.
 * @param {Array} sprintCosts - Per-sprint cost records (cost may be null)
 * @param {number|null} costPerVerified - Aggregate cost per verified claim
 * @param {number|null} cacheHitRate - Cache read share of input, in percent
 * @returns {string} - One or more sentences joined with spaces
 */
function generateTokenInsight(sprintCosts, costPerVerified, cacheHitRate) {
  const priced = sprintCosts.filter((s) => s.cost !== null);
  // Guard clause: without any usage data there is nothing to report on.
  if (priced.length === 0) {
    return "No token usage data found. Token tracking requires Agent SDK integration.";
  }

  const mean = (xs) =>
    xs.length > 0 ? xs.reduce((sum, x) => sum + x, 0) / xs.length : null;

  const parts = [];

  if (costPerVerified !== null) {
    const dollars = costPerVerified.toFixed(4);
    if (costPerVerified < 0.01) {
      parts.push(`Excellent efficiency: $${dollars} per verified claim.`);
    } else if (costPerVerified < 0.05) {
      parts.push(`Good efficiency: $${dollars} per verified claim.`);
    } else {
      parts.push(
        `Cost per verified claim: $${dollars}. Consider improving cache usage or reducing exploratory queries.`,
      );
    }
  }

  // Below 20% cache hit rate, no message is emitted at all.
  if (cacheHitRate !== null && cacheHitRate > 20) {
    parts.push(
      cacheHitRate > 50
        ? `Strong cache utilization at ${cacheHitRate}% -- prompt caching is working well.`
        : `Cache hit rate: ${cacheHitRate}%. Room to improve by reusing system prompts across operations.`,
    );
  }

  // Trend: compare average cost-per-claim of the earlier half of sprints
  // against the later half; a >=15% drop counts as "getting cheaper".
  if (priced.length >= 3) {
    const mid = Math.floor(priced.length / 2);
    const earlier = mean(
      priced.slice(0, mid).map((s) => s.costPerClaim).filter(Boolean),
    );
    const later = mean(
      priced.slice(mid).map((s) => s.costPerClaim).filter(Boolean),
    );
    if (earlier && later && later < earlier * 0.85) {
      parts.push(
        "Research is getting cheaper: cost per claim is trending down across recent sprints.",
      );
    }
  }

  return parts.length > 0
    ? parts.join(" ")
    : "Token usage tracked across sprints.";
}
308
+
309
/**
 * Arithmetic mean of a numeric array; null for an empty array.
 * @param {number[]} arr
 * @returns {number|null}
 */
function avg(arr) {
  if (arr.length === 0) return null;
  let sum = 0;
  for (const value of arr) {
    sum += value;
  }
  return sum / arr.length;
}
312
+
313
/**
 * Round to six decimal places — enough resolution for USD micro-costs.
 * @param {number} n
 * @returns {number}
 */
function round6(n) {
  const SCALE = 1e6;
  return Math.round(n * SCALE) / SCALE;
}
316
+
317
+ module.exports = { analyzeTokens, computeCost, DEFAULT_PRICING };
package/lib/velocity.js CHANGED
@@ -1,4 +1,4 @@
1
- 'use strict';
1
+ "use strict";
2
2
 
3
3
  /**
4
4
  * Sprint timing and phase analysis.
@@ -11,15 +11,15 @@
11
11
  */
12
12
 
13
13
  const PHASE_PREFIXES = {
14
- cal: 'calibration',
15
- burn: 'control-burn',
16
- d: 'define',
17
- r: 'research',
18
- p: 'prototype',
19
- e: 'evaluate',
20
- f: 'feedback',
21
- x: 'challenge',
22
- w: 'witness',
14
+ cal: "calibration",
15
+ burn: "control-burn",
16
+ d: "define",
17
+ r: "research",
18
+ p: "prototype",
19
+ e: "evaluate",
20
+ f: "feedback",
21
+ x: "challenge",
22
+ w: "witness",
23
23
  };
24
24
 
25
25
  function measureVelocity(sprints) {
@@ -31,16 +31,16 @@ function measureVelocity(sprints) {
31
31
 
32
32
  // Extract timestamps from claims
33
33
  const claimDates = claims
34
- .map(c => c.created || c.date || c.timestamp)
34
+ .map((c) => c.created || c.date || c.timestamp)
35
35
  .filter(Boolean)
36
- .map(d => new Date(d))
37
- .filter(d => !isNaN(d.getTime()))
36
+ .map((d) => new Date(d))
37
+ .filter((d) => !isNaN(d.getTime()))
38
38
  .sort((a, b) => a - b);
39
39
 
40
40
  // Extract timestamps from git log
41
41
  const gitDates = gitLog
42
- .map(g => new Date(g.date))
43
- .filter(d => !isNaN(d.getTime()))
42
+ .map((g) => new Date(g.date))
43
+ .filter((d) => !isNaN(d.getTime()))
44
44
  .sort((a, b) => a - b);
45
45
 
46
46
  // Use whichever source has data
@@ -53,15 +53,18 @@ function measureVelocity(sprints) {
53
53
  claimsPerDay: null,
54
54
  phases: extractPhaseTimings(claims),
55
55
  stalls: [],
56
- note: 'Insufficient timestamp data.',
56
+ note: "Insufficient timestamp data.",
57
57
  });
58
58
  continue;
59
59
  }
60
60
 
61
61
  const startDate = allDates[0];
62
62
  const endDate = allDates[allDates.length - 1];
63
- const durationDays = Math.max(1, Math.ceil((endDate - startDate) / (1000 * 60 * 60 * 24)));
64
- const claimsPerDay = Math.round(claims.length / durationDays * 10) / 10;
63
+ const durationDays = Math.max(
64
+ 1,
65
+ Math.ceil((endDate - startDate) / (1000 * 60 * 60 * 24)),
66
+ );
67
+ const claimsPerDay = Math.round((claims.length / durationDays) * 10) / 10;
65
68
 
66
69
  // Detect stalls: gaps > 2 days between consecutive activity
67
70
  const stalls = [];
@@ -69,8 +72,8 @@ function measureVelocity(sprints) {
69
72
  const gap = (allDates[i] - allDates[i - 1]) / (1000 * 60 * 60 * 24);
70
73
  if (gap > 2) {
71
74
  stalls.push({
72
- afterDate: allDates[i - 1].toISOString().split('T')[0],
73
- beforeDate: allDates[i].toISOString().split('T')[0],
75
+ afterDate: allDates[i - 1].toISOString().split("T")[0],
76
+ beforeDate: allDates[i].toISOString().split("T")[0],
74
77
  gapDays: Math.round(gap * 10) / 10,
75
78
  });
76
79
  }
@@ -78,8 +81,8 @@ function measureVelocity(sprints) {
78
81
 
79
82
  results.push({
80
83
  sprint: sprint.name,
81
- startDate: startDate.toISOString().split('T')[0],
82
- endDate: endDate.toISOString().split('T')[0],
84
+ startDate: startDate.toISOString().split("T")[0],
85
+ endDate: endDate.toISOString().split("T")[0],
83
86
  durationDays,
84
87
  totalClaims: claims.length,
85
88
  claimsPerDay,
@@ -90,13 +93,23 @@ function measureVelocity(sprints) {
90
93
  }
91
94
 
92
95
  // Aggregate stats
93
- const validResults = results.filter(r => r.durationDays !== null);
94
- const avgDuration = validResults.length > 0
95
- ? Math.round(validResults.reduce((a, r) => a + r.durationDays, 0) / validResults.length * 10) / 10
96
- : null;
97
- const avgClaimsPerDay = validResults.length > 0
98
- ? Math.round(validResults.reduce((a, r) => a + r.claimsPerDay, 0) / validResults.length * 10) / 10
99
- : null;
96
+ const validResults = results.filter((r) => r.durationDays !== null);
97
+ const avgDuration =
98
+ validResults.length > 0
99
+ ? Math.round(
100
+ (validResults.reduce((a, r) => a + r.durationDays, 0) /
101
+ validResults.length) *
102
+ 10,
103
+ ) / 10
104
+ : null;
105
+ const avgClaimsPerDay =
106
+ validResults.length > 0
107
+ ? Math.round(
108
+ (validResults.reduce((a, r) => a + r.claimsPerDay, 0) /
109
+ validResults.length) *
110
+ 10,
111
+ ) / 10
112
+ : null;
100
113
  const totalStalls = results.reduce((a, r) => a + r.stalls.length, 0);
101
114
 
102
115
  return {
@@ -120,7 +133,9 @@ function extractPhaseTimings(claims) {
120
133
  const match = claim.id.match(/^([a-z]+)/);
121
134
  if (!match) continue;
122
135
  const letters = match[1];
123
- const prefix = Object.keys(PHASE_PREFIXES).find(k => letters.startsWith(k)) || letters.charAt(0);
136
+ const prefix =
137
+ Object.keys(PHASE_PREFIXES).find((k) => letters.startsWith(k)) ||
138
+ letters.charAt(0);
124
139
  const phaseName = PHASE_PREFIXES[prefix] || prefix;
125
140
 
126
141
  if (!phases[phaseName]) {
@@ -132,11 +147,17 @@ function extractPhaseTimings(claims) {
132
147
  if (date) {
133
148
  const d = new Date(date);
134
149
  if (!isNaN(d.getTime())) {
135
- if (!phases[phaseName].firstDate || d < new Date(phases[phaseName].firstDate)) {
136
- phases[phaseName].firstDate = d.toISOString().split('T')[0];
150
+ if (
151
+ !phases[phaseName].firstDate ||
152
+ d < new Date(phases[phaseName].firstDate)
153
+ ) {
154
+ phases[phaseName].firstDate = d.toISOString().split("T")[0];
137
155
  }
138
- if (!phases[phaseName].lastDate || d > new Date(phases[phaseName].lastDate)) {
139
- phases[phaseName].lastDate = d.toISOString().split('T')[0];
156
+ if (
157
+ !phases[phaseName].lastDate ||
158
+ d > new Date(phases[phaseName].lastDate)
159
+ ) {
160
+ phases[phaseName].lastDate = d.toISOString().split("T")[0];
140
161
  }
141
162
  }
142
163
  }
@@ -149,14 +170,19 @@ function generateVelocityInsight(results, totalStalls) {
149
170
  const parts = [];
150
171
 
151
172
  if (results.length === 0) {
152
- return 'No sprint timing data available.';
173
+ return "No sprint timing data available.";
153
174
  }
154
175
 
155
- const avgDuration = results.reduce((a, r) => a + r.durationDays, 0) / results.length;
156
- parts.push(`Average sprint duration: ${Math.round(avgDuration * 10) / 10} days.`);
176
+ const avgDuration =
177
+ results.reduce((a, r) => a + r.durationDays, 0) / results.length;
178
+ parts.push(
179
+ `Average sprint duration: ${Math.round(avgDuration * 10) / 10} days.`,
180
+ );
157
181
 
158
182
  if (totalStalls > 0) {
159
- parts.push(`${totalStalls} stall(s) detected across sprints (gaps > 2 days between activity).`);
183
+ parts.push(
184
+ `${totalStalls} stall(s) detected across sprints (gaps > 2 days between activity).`,
185
+ );
160
186
  }
161
187
 
162
188
  // Find the slowest phase across all sprints
@@ -168,10 +194,12 @@ function generateVelocityInsight(results, totalStalls) {
168
194
  }
169
195
  const topPhase = Object.entries(phaseTotals).sort((a, b) => b[1] - a[1])[0];
170
196
  if (topPhase) {
171
- parts.push(`Most active phase: ${topPhase[0]} (${topPhase[1]} claims across all sprints).`);
197
+ parts.push(
198
+ `Most active phase: ${topPhase[0]} (${topPhase[1]} claims across all sprints).`,
199
+ );
172
200
  }
173
201
 
174
- return parts.join(' ');
202
+ return parts.join(" ");
175
203
  }
176
204
 
177
205
  module.exports = { measureVelocity };