npm - task-summary-extractor - Versions diffs - 8.1.0 - Mend

task-summary-extractor 8.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (38) hide show

package/ARCHITECTURE.md +605 -0
package/EXPLORATION.md +451 -0
package/QUICK_START.md +272 -0
package/README.md +544 -0
package/bin/taskex.js +64 -0
package/package.json +63 -0
package/process_and_upload.js +107 -0
package/prompt.json +265 -0
package/setup.js +505 -0
package/src/config.js +327 -0
package/src/logger.js +355 -0
package/src/pipeline.js +2006 -0
package/src/renderers/markdown.js +968 -0
package/src/services/firebase.js +106 -0
package/src/services/gemini.js +779 -0
package/src/services/git.js +329 -0
package/src/services/video.js +305 -0
package/src/utils/adaptive-budget.js +266 -0
package/src/utils/change-detector.js +466 -0
package/src/utils/cli.js +415 -0
package/src/utils/context-manager.js +499 -0
package/src/utils/cost-tracker.js +156 -0
package/src/utils/deep-dive.js +549 -0
package/src/utils/diff-engine.js +315 -0
package/src/utils/dynamic-mode.js +567 -0
package/src/utils/focused-reanalysis.js +317 -0
package/src/utils/format.js +32 -0
package/src/utils/fs.js +39 -0
package/src/utils/global-config.js +315 -0
package/src/utils/health-dashboard.js +216 -0
package/src/utils/inject-cli-flags.js +58 -0
package/src/utils/json-parser.js +245 -0
package/src/utils/learning-loop.js +301 -0
package/src/utils/progress-updater.js +451 -0
package/src/utils/progress.js +166 -0
package/src/utils/prompt.js +32 -0
package/src/utils/quality-gate.js +429 -0
package/src/utils/retry.js +129 -0

package/src/utils/quality-gate.js ADDED Viewed

@@ -0,0 +1,429 @@
+/**
+ * Quality Gate — validates AI analysis output quality and determines
+ * whether a segment needs re-analysis.
+ *
+ * Scoring dimensions:
+ *  - Structural completeness (required fields present)
+ *  - Content density (meaningful data extracted)
+ *  - Parse integrity (JSON parsed successfully, no truncation)
+ *  - Cross-reference consistency (IDs, timestamps, references make sense)
+ *
+ * Returns a quality report with a numeric score (0-100) and actionable
+ * diagnostics for retry decisions.
+ */
+'use strict';
+// ======================== QUALITY THRESHOLDS ========================
+const THRESHOLDS = {
+  /** Minimum score to PASS without retry (0-100) */
+  PASS: 45,
+  /** Score range for WARNING — will pass but flag issues (45-65 is typical) */
+  WARN: 65,
+  /** Maximum retries per segment */
+  MAX_RETRIES: 1,
+};
+// Required top-level fields in a valid analysis
+const REQUIRED_FIELDS = [
+  'tickets',
+  'action_items',
+  'change_requests',
+  'summary',
+];
+// Optional but valuable fields (boost score when present)
+const VALUED_FIELDS = [
+  'blockers',
+  'scope_changes',
+  'file_references',
+  'your_tasks',
+];
+// ======================== SCORING FUNCTIONS ========================
+/**
+ * Score structural completeness: are the required fields present and non-empty?
+ * @param {object} analysis - Parsed analysis
+ * @returns {{ score: number, issues: string[] }} - 0-100 score + issues
+ */
+function scoreStructure(analysis) {
+  if (!analysis || typeof analysis !== 'object') {
+    return { score: 0, issues: ['Analysis is null or not an object'] };
+  }
+  const issues = [];
+  let present = 0;
+  for (const field of REQUIRED_FIELDS) {
+    if (analysis[field] === undefined || analysis[field] === null) {
+      issues.push(`Missing required field: "${field}"`);
+    } else {
+      present++;
+    }
+  }
+  // Bonus for valued optional fields
+  let bonus = 0;
+  for (const field of VALUED_FIELDS) {
+    if (analysis[field] !== undefined && analysis[field] !== null) {
+      bonus += 3; // up to 12 bonus points
+    }
+  }
+  const baseScore = (present / REQUIRED_FIELDS.length) * 80;
+  return { score: Math.min(100, baseScore + bonus), issues };
+}
+/**
+ * Score content density: how much meaningful data was extracted?
+ * Empty arrays are valid but sparse; we want to reward rich extraction.
+ * Also scores confidence field coverage.
+ * @param {object} analysis
+ * @returns {{ score: number, issues: string[] }}
+ */
+function scoreDensity(analysis) {
+  if (!analysis || typeof analysis !== 'object') {
+    return { score: 0, issues: ['No analysis to score'] };
+  }
+  const issues = [];
+  let points = 0;
+  let maxPoints = 0;
+  // Tickets
+  maxPoints += 25;
+  const tickets = analysis.tickets || [];
+  if (tickets.length > 0) {
+    points += 12;
+    const richTickets = tickets.filter(t =>
+      t.ticket_id && t.discussed_state && (t.comments?.length > 0 || t.code_changes?.length > 0)
+    );
+    points += Math.min(13, (richTickets.length / Math.max(tickets.length, 1)) * 13);
+  } else {
+    issues.push('No tickets extracted — verify if segment discusses tickets');
+  }
+  // Action items
+  maxPoints += 17;
+  const actions = analysis.action_items || [];
+  if (actions.length > 0) {
+    points += 8;
+    const richActions = actions.filter(a => a.assigned_to && a.description);
+    points += Math.min(9, (richActions.length / Math.max(actions.length, 1)) * 9);
+  }
+  // Change requests
+  maxPoints += 17;
+  const crs = analysis.change_requests || [];
+  if (crs.length > 0) {
+    points += 8;
+    const richCrs = crs.filter(cr => cr.where && cr.what);
+    points += Math.min(9, (richCrs.length / Math.max(crs.length, 1)) * 9);
+  }
+  // Summary
+  maxPoints += 13;
+  const summary = analysis.summary || '';
+  if (summary.length > 50) {
+    points += 13;
+  } else if (summary.length > 0) {
+    points += 6;
+    issues.push('Summary is very short (< 50 chars)');
+  } else {
+    issues.push('No summary extracted');
+  }
+  // your_tasks
+  maxPoints += 13;
+  const tasks = analysis.your_tasks;
+  if (tasks) {
+    const taskCount =
+      (tasks.tasks_todo?.length || 0) +
+      (tasks.tasks_waiting_on_others?.length || 0) +
+      (tasks.decisions_needed?.length || 0) +
+      (tasks.completed_in_call?.length || 0);
+    if (taskCount > 0) {
+      points += 13;
+    } else {
+      points += 4;
+    }
+  }
+  // Confidence coverage — reward items that have confidence fields
+  maxPoints += 15;
+  const allItems = [
+    ...tickets,
+    ...actions,
+    ...crs,
+    ...(analysis.blockers || []),
+    ...(analysis.scope_changes || []),
+  ];
+  if (allItems.length > 0) {
+    const withConfidence = allItems.filter(item =>
+      item.confidence && ['HIGH', 'MEDIUM', 'LOW'].includes(item.confidence)
+    );
+    const coverageRatio = withConfidence.length / allItems.length;
+    points += Math.round(coverageRatio * 15);
+    if (coverageRatio < 0.5) {
+      issues.push(`Low confidence coverage: only ${withConfidence.length}/${allItems.length} items have confidence fields`);
+    }
+    // Bonus check: confidence distribution shouldn't be all the same
+    if (withConfidence.length >= 3) {
+      const levels = new Set(withConfidence.map(i => i.confidence));
+      if (levels.size === 1) {
+        issues.push(`All items have same confidence (${[...levels][0]}) — suspicious uniformity`);
+      }
+    }
+  } else {
+    points += 5; // No items to score — neutral
+  }
+  const score = Math.round((points / maxPoints) * 100);
+  return { score, issues };
+}
+/**
+ * Score parse integrity: did the JSON parse cleanly?
+ * @param {object} parseContext - { parseSuccess, rawLength, parsedKeys }
+ * @returns {{ score: number, issues: string[] }}
+ */
+function scoreIntegrity(parseContext) {
+  const { parseSuccess, rawLength = 0, truncated = false } = parseContext;
+  const issues = [];
+  if (!parseSuccess) {
+    issues.push('JSON parse failed — output could not be parsed');
+    return { score: 0, issues };
+  }
+  let score = 80;
+  if (truncated) {
+    issues.push('Output was truncated — data may be incomplete');
+    score -= 30;
+  }
+  // Very short raw output suggests the model didn't produce enough
+  if (rawLength < 500) {
+    issues.push(`Raw output very short (${rawLength} chars) — may be minimal`);
+    score -= 20;
+  } else if (rawLength < 2000) {
+    issues.push(`Raw output is short (${rawLength} chars)`);
+    score -= 10;
+  }
+  return { score: Math.max(0, score), issues };
+}
+/**
+ * Score cross-reference consistency within the analysis.
+ * @param {object} analysis
+ * @returns {{ score: number, issues: string[] }}
+ */
+function scoreCrossReferences(analysis) {
+  if (!analysis || typeof analysis !== 'object') {
+    return { score: 50, issues: [] }; // neutral if no analysis
+  }
+  const issues = [];
+  let score = 100;
+  // Check: ticket IDs should be unique
+  const tickets = analysis.tickets || [];
+  const ticketIds = tickets.map(t => t.ticket_id).filter(Boolean);
+  const uniqueIds = new Set(ticketIds);
+  if (ticketIds.length > 0 && uniqueIds.size < ticketIds.length) {
+    issues.push(`Duplicate ticket IDs found: ${ticketIds.length - uniqueIds.size} duplicate(s)`);
+    score -= 15;
+  }
+  // Check: action item IDs should be sequential and unique
+  const actions = analysis.action_items || [];
+  const actionIds = actions.map(a => a.id).filter(Boolean);
+  const uniqueActionIds = new Set(actionIds);
+  if (actionIds.length > 0 && uniqueActionIds.size < actionIds.length) {
+    issues.push(`Duplicate action item IDs: ${actionIds.length - uniqueActionIds.size} duplicate(s)`);
+    score -= 10;
+  }
+  // Check: change request IDs should reference real tickets
+  const crs = analysis.change_requests || [];
+  for (const cr of crs) {
+    if (cr.ticket_id && !uniqueIds.has(cr.ticket_id) && tickets.length > 0) {
+      issues.push(`CR "${cr.id}" references unknown ticket "${cr.ticket_id}"`);
+      score -= 5;
+    }
+  }
+  return { score: Math.max(0, score), issues };
+}
+// ======================== MAIN QUALITY GATE ========================
+/**
+ * Run the full quality gate on a segment analysis.
+ *
+ * @param {object} analysis - The parsed analysis object
+ * @param {object} context - Additional context for scoring
+ * @param {boolean} context.parseSuccess - Whether JSON parsing succeeded
+ * @param {number} context.rawLength - Length of raw AI output
+ * @param {boolean} [context.truncated] - Whether output was truncated during repair
+ * @param {number} [context.segmentIndex] - Which segment (0-based)
+ * @param {number} [context.totalSegments] - Total segments
+ * @returns {QualityReport}
+ */
+function assessQuality(analysis, context = {}) {
+  const structure = scoreStructure(analysis);
+  const density = scoreDensity(analysis);
+  const integrity = scoreIntegrity(context);
+  const crossRef = scoreCrossReferences(analysis);
+  // Weighted composite score
+  const weights = { structure: 0.25, density: 0.35, integrity: 0.25, crossRef: 0.15 };
+  const compositeScore = Math.round(
+    structure.score * weights.structure +
+    density.score * weights.density +
+    integrity.score * weights.integrity +
+    crossRef.score * weights.crossRef
+  );
+  const allIssues = [
+    ...structure.issues.map(i => `[structure] ${i}`),
+    ...density.issues.map(i => `[density] ${i}`),
+    ...integrity.issues.map(i => `[integrity] ${i}`),
+    ...crossRef.issues.map(i => `[consistency] ${i}`),
+  ];
+  let grade;
+  if (compositeScore >= THRESHOLDS.WARN) {
+    grade = 'PASS';
+  } else if (compositeScore >= THRESHOLDS.PASS) {
+    grade = 'WARN';
+  } else {
+    grade = 'FAIL';
+  }
+  return {
+    grade,
+    score: compositeScore,
+    dimensions: {
+      structure: { score: structure.score, weight: weights.structure },
+      density: { score: density.score, weight: weights.density },
+      integrity: { score: integrity.score, weight: weights.integrity },
+      crossRef: { score: crossRef.score, weight: weights.crossRef },
+    },
+    issues: allIssues,
+    shouldRetry: grade === 'FAIL',
+    retryHints: grade === 'FAIL' ? buildRetryHints(analysis, allIssues) : [],
+  };
+}
+/**
+ * Build retry hints — specific instructions to inject into the retry prompt
+ * to address the quality issues found.
+ * @param {object} analysis
+ * @param {string[]} issues
+ * @returns {string[]}
+ */
+function buildRetryHints(analysis, issues) {
+  const hints = [];
+  if (issues.some(i => i.includes('Missing required field'))) {
+    hints.push('CRITICAL: Your previous response was missing required fields. You MUST include ALL of: tickets, action_items, change_requests, summary. Use empty arrays [] if no items exist.');
+  }
+  if (issues.some(i => i.includes('JSON parse failed'))) {
+    hints.push('CRITICAL: Your previous response could not be parsed as JSON. Respond with ONLY valid JSON — no markdown fences, no extra text before or after the JSON object. Start with { and end with }.');
+  }
+  if (issues.some(i => i.includes('truncated'))) {
+    hints.push('Your previous response was truncated. Be more concise — use shorter descriptions, fewer comments per ticket (max 3), and compact formatting to fit within the output limit.');
+  }
+  if (issues.some(i => i.includes('No tickets extracted'))) {
+    hints.push('Your previous response contained no tickets. Listen carefully to the video — if specific work items, bugs, features, or tasks are discussed, extract them as tickets with IDs.');
+  }
+  if (issues.some(i => i.includes('No summary'))) {
+    hints.push('Your previous response was missing a summary. Include a 2-4 sentence executive summary of what was discussed in this segment.');
+  }
+  if (issues.some(i => i.includes('very short'))) {
+    hints.push('Your previous response was too brief. Analyze the video more thoroughly — extract ALL tickets, action items, changes discussed, and blockers mentioned.');
+  }
+  if (issues.some(i => i.includes('confidence coverage'))) {
+    hints.push('Your previous response was missing confidence fields. Every ticket, action_item, change_request, blocker, and scope_change MUST have "confidence": "HIGH|MEDIUM|LOW" and "confidence_reason" explaining why.');
+  }
+  if (issues.some(i => i.includes('suspicious uniformity'))) {
+    hints.push('Your previous response had all items at the same confidence level. Differentiate: use HIGH for items explicitly discussed + corroborated by docs, MEDIUM for partial evidence, LOW for inferred items.');
+  }
+  return hints;
+}
+/**
+ * Generate a human-readable quality summary line.
+ * @param {QualityReport} report
+ * @param {string} segmentName
+ * @returns {string}
+ */
+function formatQualityLine(report, segmentName) {
+  const icon = report.grade === 'PASS' ? '✓' : report.grade === 'WARN' ? '⚠' : '✗';
+  const dims = report.dimensions;
+  return `    ${icon} Quality: ${report.score}/100 (${report.grade}) — ` +
+    `struct:${dims.structure.score} density:${dims.density.score} ` +
+    `integrity:${dims.integrity.score} xref:${dims.crossRef.score}`;
+}
+/**
+ * Extract confidence distribution statistics from an analysis.
+ * @param {object} analysis
+ * @returns {{ total: number, high: number, medium: number, low: number, missing: number, coverage: number }}
+ */
+function getConfidenceStats(analysis) {
+  if (!analysis || typeof analysis !== 'object') {
+    return { total: 0, high: 0, medium: 0, low: 0, missing: 0, coverage: 0 };
+  }
+  const allItems = [
+    ...(analysis.tickets || []),
+    ...(analysis.action_items || []),
+    ...(analysis.change_requests || []),
+    ...(analysis.blockers || []),
+    ...(analysis.scope_changes || []),
+  ];
+  const total = allItems.length;
+  if (total === 0) return { total: 0, high: 0, medium: 0, low: 0, missing: 0, coverage: 1 };
+  let high = 0, medium = 0, low = 0, missing = 0;
+  for (const item of allItems) {
+    switch (item.confidence) {
+      case 'HIGH': high++; break;
+      case 'MEDIUM': medium++; break;
+      case 'LOW': low++; break;
+      default: missing++; break;
+    }
+  }
+  return { total, high, medium, low, missing, coverage: Math.round(((total - missing) / total) * 100) };
+}
+module.exports = { // gate entry point, report helpers and thresholds
+  assessQuality,
+  formatQualityLine,
+  buildRetryHints,
+  getConfidenceStats,
+  THRESHOLDS,
+  // Individual scoring dimensions, exposed for testing
+  scoreStructure,
+  scoreDensity,
+  scoreIntegrity,
+  scoreCrossReferences,
+};

package/src/utils/retry.js ADDED Viewed

@@ -0,0 +1,129 @@
+/**
+ * Retry utility — exponential backoff with jitter for transient failures.
+ *
+ * Used for Gemini API calls and Firebase operations that may fail
+ * due to rate limits, network issues, or temporary outages.
+ */
+'use strict';
+const { MAX_RETRIES, RETRY_BASE_DELAY_MS } = require('../config');
+/**
+ * Known transient error patterns that should be retried.
+ */
+const TRANSIENT_PATTERNS = [
+  /429/i,                       // Rate limited
+  /too many requests/i,
+  /quota exceeded/i,
+  /resource exhausted/i,
+  /ECONNRESET/i,
+  /ETIMEDOUT/i,
+  /ENOTFOUND/i,
+  /EPIPE/i,
+  /socket hang up/i,
+  /network/i,
+  /503/i,                       // Service unavailable
+  /502/i,                       // Bad gateway
+  /500/i,                       // Internal server error (sometimes transient)
+  /UNAVAILABLE/i,
+  /INTERNAL/i,
+  /overloaded/i,
+  /capacity/i,
+];
+/**
+ * Determine if an error is likely transient and worth retrying.
+ * @param {Error} err
+ * @returns {boolean}
+ */
+function isTransientError(err) {
+  const msg = err.message || '';
+  const code = err.code || '';
+  const status = err.status || err.statusCode || 0;
+  // HTTP status codes that are transient
+  if ([429, 500, 502, 503, 504].includes(status)) return true;
+  // Check message against known patterns
+  const combined = `${msg} ${code}`;
+  return TRANSIENT_PATTERNS.some(p => p.test(combined));
+}
+/**
+ * Execute an async function with exponential backoff retry.
+ *
+ * @param {Function} fn - Async function to execute
+ * @param {object} [opts]
+ * @param {number} [opts.maxRetries] - Max retry attempts (default from config)
+ * @param {number} [opts.baseDelay] - Base delay in ms (default from config)
+ * @param {string} [opts.label] - Human-readable label for log messages
+ * @param {Function} [opts.onRetry] - Called with (attempt, delay, err) before each retry
+ * @param {Function} [opts.shouldRetry] - Custom predicate (err) → boolean
+ * @returns {Promise<any>} Result of fn()
+ */
+async function withRetry(fn, opts = {}) {
+  const maxRetries = opts.maxRetries ?? MAX_RETRIES;
+  const baseDelay = opts.baseDelay ?? RETRY_BASE_DELAY_MS;
+  const label = opts.label || 'operation';
+  const shouldRetry = opts.shouldRetry || isTransientError;
+  const onRetry = opts.onRetry || null;
+  let lastError;
+  for (let attempt = 0; attempt <= maxRetries; attempt++) {
+    try {
+      return await fn();
+    } catch (err) {
+      lastError = err;
+      if (attempt >= maxRetries || !shouldRetry(err)) {
+        throw err;
+      }
+      // Exponential backoff with jitter: baseDelay * 2^attempt * (0.5-1.5)
+      const jitter = 0.5 + Math.random();
+      const delay = Math.min(baseDelay * Math.pow(2, attempt) * jitter, 60000);
+      if (onRetry) {
+        onRetry(attempt + 1, delay, err);
+      } else {
+        const msg = err.message || String(err);
+        console.warn(`  ⚠ ${label} failed (attempt ${attempt + 1}/${maxRetries + 1}): ${msg.slice(0, 120)}`);
+        console.warn(`    → Retrying in ${(delay / 1000).toFixed(1)}s...`);
+      }
+      await new Promise(r => setTimeout(r, delay));
+    }
+  }
+  throw lastError;
+}
+/**
+ * Run multiple async tasks with a concurrency limit.
+ *
+ * @param {Array} items - Items to process
+ * @param {Function} fn - Async function (item, index) → result
+ * @param {number} [concurrency=3] - Max concurrent tasks
+ * @returns {Promise<Array>} Results in original order
+ */
+async function parallelMap(items, fn, concurrency = 3) {
+  const results = new Array(items.length);
+  let nextIndex = 0;
+  async function worker() {
+    while (nextIndex < items.length) {
+      const idx = nextIndex++;
+      results[idx] = await fn(items[idx], idx);
+    }
+  }
+  const workers = Array.from(
+    { length: Math.min(concurrency, items.length) },
+    () => worker()
+  );
+  await Promise.all(workers);
+  return results;
+}
+module.exports = { withRetry, parallelMap, isTransientError }; // backoff retry wrapper, concurrency-limited map, default retry predicate