npm - task-summary-extractor - Versions diffs - 8.1.0 → 8.3.0 - Mend

task-summary-extractor 8.1.0 → 8.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (24)

package/ARCHITECTURE.md +17 -12
package/EXPLORATION.md +25 -21
package/README.md +23 -15
package/package.json +2 -2
package/process_and_upload.js +7 -100
package/prompt.json +199 -131
package/src/{utils → modes}/deep-dive.js +2 -2
package/src/{utils → modes}/dynamic-mode.js +2 -2
package/src/{utils → modes}/focused-reanalysis.js +2 -2
package/src/{utils → modes}/progress-updater.js +1 -1
package/src/pipeline.js +9 -8
package/src/services/gemini.js +4 -4
package/src/services/git.js +0 -29
package/src/utils/adaptive-budget.js +0 -2
package/src/utils/cli.js +30 -3
package/src/utils/context-manager.js +0 -4
package/src/utils/diff-engine.js +0 -3
package/src/utils/json-parser.js +1 -1
package/src/utils/learning-loop.js +0 -1
package/src/utils/quality-gate.js +0 -6
package/src/utils/retry.js +10 -4
package/src/utils/prompt.js +0 -32
package/src/{utils → modes}/change-detector.js +0 -0
package/src/utils/{progress.js → checkpoint.js} +0 -0

package/ARCHITECTURE.md CHANGED Viewed

@@ -76,20 +76,23 @@ flowchart TB
         GIT["git.js"]
     end
-    subgraph Utils["Utilities — 19 modules"]
+    subgraph Utils["Utilities"]
         QG["quality-gate"]
-        FR["focused-reanalysis"]
         LL["learning-loop"]
         DE["diff-engine"]
-        CD["change-detector"]
-        PU["progress-updater"]
         CM["context-manager"]
         JP["json-parser"]
         AB["adaptive-budget"]
         HD["health-dashboard"]
+        OT["+ 7 more"]
+    end
+    subgraph Modes["Modes — AI pipeline phases"]
+        FR["focused-reanalysis"]
+        CD["change-detector"]
+        PU["progress-updater"]
         DD["deep-dive"]
         DM["dynamic-mode"]
-        OT["+ 7 more"]
     end
     subgraph Renderers["Renderers"]
@@ -101,6 +104,7 @@ flowchart TB
     P1 -.->|"--dynamic"| DYN
     Pipeline --> Services
     Pipeline --> Utils
+    Pipeline --> Modes
     Pipeline --> Renderers
     UP --> GIT
     UP --> CD
@@ -115,7 +119,7 @@ flowchart TB
 | Phase | Name | What Happens |
 |-------|------|-------------|
 | 1 | **Init** | CLI parsing, interactive folder selection (if no arg), config validation, logger setup, load learning insights, route to dynamic/progress mode |
-| 2 | **Discover** | Find videos, discover documents, resolve user name, check resume state |
+| 2 | **Discover** | Find videos/audio, discover documents, resolve user name, check resume state |
 | 3 | **Services** | Firebase auth, Gemini init, prepare document parts |
 | 4 | **Process** | Compress → Upload → Analyze → Quality Gate → Retry → Focused Pass |
 | 5 | **Compile** | Cross-segment compilation, diff engine comparison |
@@ -294,17 +298,17 @@ flowchart TB
 ## Extraction Schema
-The AI extracts 6 structured categories from each meeting. The categories are content-adaptive — the AI populates whichever fields are relevant to the actual discussion.
+The AI extracts 6 structured categories from any content source (video, audio, documents, or mixed). The prompt auto-detects the input type and adapts: temporal content (video/audio) gets timestamps; document-only content uses section references and null timestamps. All field names remain identical regardless of input type for backward compatibility.
 ### Categories
 | Category | Key Fields | Adapts To |
 |----------|-----------|----------|
-| **Tickets / Items** | `ticket_id`, `title`, `status`, `assignee`, `reviewer`, `video_segments` with timestamps, `speaker_comments`, `details` with priority, confidence | Sprint items, requirements, interview topics, incident items |
-| **Change Requests** | `WHERE` (target: file, system, process, scope), `WHAT` (specific change), `HOW` (approach), `WHY` (justification), `dependencies`, `blocked_by`, confidence | Code changes, requirement changes, process changes, scope adjustments |
-| **References** | `name`, `type`, `role`, cross-refs to tickets & CRs, `context_doc_match` | Files, documents, URLs, tools, systems, resources mentioned |
-| **Action Items** | `description`, `assigned_to`, `status`, `deadline`, `dependencies`, related tickets & CRs, confidence | Any follow-up work discussed |
-| **Blockers** | `description`, `severity`, `owner`, `status`, `proposed_resolution`, confidence | Technical blockers, approval gates, resource constraints |
+| **Tickets / Items** | `ticket_id`, `title`, `status`, `assignee`, `reviewer`, `video_segments` with timestamps (or null for docs), `speaker_comments`, `details` with priority, confidence | Sprint items, requirements, interview topics, incident items, legal matters, deals |
+| **Change Requests** | `WHERE` (target: file, system, process, scope), `WHAT` (specific change), `HOW` (approach), `WHY` (justification), `dependencies`, `blocked_by`, confidence | Code changes, requirement changes, process changes, scope adjustments, contract revisions, policy updates |
+| **References** | `name`, `type`, `role`, cross-refs to tickets & CRs, `context_doc_match` | Files, documents, URLs, tools, systems, resources, contracts, reports mentioned |
+| **Action Items** | `description`, `assigned_to`, `status`, `deadline`, `dependencies`, related tickets & CRs, confidence | Any follow-up work discussed or documented |
+| **Blockers** | `description`, `severity`, `owner`, `status`, `proposed_resolution`, confidence | Technical blockers, approval gates, resource constraints, legal reviews, budget approvals |
 | **Scope Changes** | `type` (added/removed/deferred), `original` vs `new` scope, `decided_by`, `impact`, confidence | Feature scope, project scope, contract scope, training scope |
 ### Personalized Task Section
@@ -500,6 +504,7 @@ taskex --dynamic --request "Document this microservices architecture"
 |-----------|--------|-------------|
 | `.vtt` `.srt` `.txt` `.md` `.csv` | Inline text | Read and passed directly as text parts |
 | `.pdf` | Gemini File API | Uploaded as binary, Gemini processes natively |
+| `.mp3` `.wav` `.ogg` `.m4a` | Gemini File API | Uploaded as audio, Gemini processes natively |
 | `.docx` `.doc` | Firebase only | Uploaded for archival, not processable by Gemini |
 Directories skipped during recursive discovery: `node_modules`, `.git`, `compressed`, `logs`, `gemini_runs`, `runs`

package/EXPLORATION.md CHANGED Viewed

@@ -1,6 +1,6 @@
 # Task Summary Extractor — Where We Are & Where We Can Go
-> **Version 8.1.0** — February 2026
+> **Version 8.3.0** — February 2026
 > Module map, codebase stats, and future roadmap.
 > For setup and CLI reference, see [README.md](README.md) · [Quick Start](QUICK_START.md)
 > For architecture diagrams and algorithms, see [ARCHITECTURE.md](ARCHITECTURE.md)
@@ -66,7 +66,7 @@
 | Config + Logger | 2 | 578 |
 | Entry points (taskex + legacy) | 2 | 165 |
 | Setup script | 1 | 505 |
-| Prompt (JSON) | 1 | 265 |
+| Prompt (JSON) | 1 | 308 |
 | **Total** | **33 files** | **~10,600 lines** |
 ### Version History
@@ -85,6 +85,8 @@
 | **v7.2.1** | Storage URL + Audit | Firebase Storage URLs as Gemini External URLs (skip File API upload), 3-strategy file resolution, URI reuse for retry/focused pass, Gemini file cleanup, confidence % fix, logger/firebase/git/version fixes |
 | **v7.2.2** | Upload Control | `--force-upload` to re-upload existing files, `--no-storage-url` to force Gemini File API, production-ready docs |
 | **v8.1.0** | Smart Global Config | Persistent `~/.taskexrc` config, `taskex config` subcommand, first-run API key prompting, 5-level config resolution, production audit (14 fixes), shared CLI flag injection, boolean flag parser fix |
+| **v8.2.0** | Architecture Cleanup | `src/modes/` for AI pipeline phases, `retry.js` self-contained defaults, dead code removal, export trimming, `process_and_upload.js` slim shim, `progress.js` → `checkpoint.js`, merged `prompt.js` into `cli.js` |
+| **v8.3.0** | Universal Content Analysis | prompt.json v4.0.0 — input type auto-detection (video/audio/document/mixed), timestamps conditional, domain-adaptive extraction for any content source, gemini.js bridge text generalized |
 | **v8.0.0** | npm Package | Global CLI (`taskex`), `--gemini-key`/`--firebase-*` config flags, CWD-based path resolution, CWD-first `.env`, `bin/taskex.js` entry point, npm publish-ready `package.json` |
 | **v7.2.3** | Production Hardening | Cross-platform ffmpeg detection, shell injection fix (spawnSync), auto git init for `--update-progress`, `runs/` excluded from doc discovery, entry point docs updated |
@@ -176,7 +178,7 @@ The logger now writes **three parallel outputs**:
 | Adaptive Thinking Budget | `adaptive-budget.js` | Segment position, complexity, context docs → dynamic 8K–32K range |
 | Smart Boundary Detection | `context-manager.js` | Mid-conversation detection, open ticket carry-forward, continuity hints |
 | Health Dashboard | `health-dashboard.js` | Quality scores, extraction density bars, retry stats, efficiency metrics |
-| Enhanced Prompt | `prompt.json` | Timestamp accuracy, dedup rules, self-verification checklist, retry hints |
+| Enhanced Prompt | `prompt.json` | Universal content analysis (v4.0.0): input type detection, timestamps conditional on content type, domain-adaptive extraction, self-verification checklist |
 ### Current Capabilities
@@ -270,36 +272,38 @@ src/
 ├── config.js                277 ln  Central config, env vars, model registry, validation
 ├── logger.js                306 ln  ★ v6 — Triple output: detailed + minimal + structured JSONL, phase spans, metrics
 ├── pipeline.js            1,985 ln  Multi-mode orchestrator with Storage URL optimization, upload control flags, learning loop, focused re-analysis, diff engine, deep-dive, dynamic, auto git init
+├── modes/                          ★ v8.2.0 — AI-heavy pipeline phase modules
+│   ├── change-detector.js   417 ln  Git-based change correlation engine
+│   ├── deep-dive.js         473 ln  ★ v6.2 — Topic discovery, parallel doc generation, index builder
+│   ├── dynamic-mode.js      494 ln  ★ v7.0 — Context-only doc generation, topic planning, parallel writing
+│   ├── focused-reanalysis.js 268 ln ★ v6 — Weakness detection, targeted second pass, intelligent merge
+│   └── progress-updater.js  402 ln  ★ v6.1 — AI-powered progress assessment, status report generation
 ├── renderers/
 │   └── markdown.js          879 ln  ★ v6 — Confidence badges (🟢🟡🔴), confidence distribution table, diff section
 ├── services/
 │   ├── firebase.js           92 ln  Init, upload, exists check (with retry, async I/O)
 │   ├── gemini.js            677 ln  ★ v7.2.1 — 3-strategy file resolution, External URL support, cleanup, doc prep, analysis, compilation
-│   ├── git.js               330 ln  ★ v7.2.3 — Git CLI wrapper: log, diff, status, changed files, auto-init
+│   ├── git.js               310 ln  ★ v7.2.3 — Git CLI wrapper: log, diff, status, changed files, auto-init
 │   └── video.js             285 ln  ★ v7.2.3 — ffmpeg compress, segment, probe (cross-platform, spawnSync)
-└── utils/
+└── utils/                          Pure utilities — parsing, retry, budget, config
     ├── adaptive-budget.js   232 ln  ★ v5 — Transcript complexity → dynamic budget
-    ├── change-detector.js   417 ln  ★ v6.1 — Git-based change correlation engine
-    ├── cli.js               391 ln  ★ v8.0.0 — Interactive prompts, model selector, folder picker, config flags, taskex help
+    ├── checkpoint.js        145 ln  Checkpoint/resume persistence (renamed from progress.js in v8.2.0)
+    ├── cli.js               415 ln  ★ v8.0.0 — Interactive prompts, model selector, folder picker, config flags, taskex help
     ├── context-manager.js   424 ln  4-tier priority, VTT slicing, progressive context, boundary detection
     ├── cost-tracker.js      140 ln  Token counting, USD cost estimation (+ focused pass tracking)
-    ├── deep-dive.js         473 ln  ★ v6.2 — Topic discovery, parallel doc generation, index builder
     ├── diff-engine.js       280 ln  ★ v6 — Cross-run delta: new/removed/changed items, Markdown rendering
-    ├── dynamic-mode.js      494 ln  ★ v7.0 — Context-only doc generation, topic planning, parallel writing
-    ├── focused-reanalysis.js 268 ln ★ v6 — Weakness detection, targeted second pass, intelligent merge
     ├── format.js             27 ln  Duration, bytes formatting
     ├── fs.js                 40 ln  Recursive doc finder (skips runs/)
+    ├── global-config.js     320 ln  ★ v8.1.0 — ~/.taskexrc persistent config, interactive setup
     ├── health-dashboard.js  191 ln  ★ v5 — Quality report, density bars, efficiency metrics
+    ├── inject-cli-flags.js   58 ln  ★ v8.1.0 — CLI flag → env var injection
     ├── json-parser.js       216 ln  5-strategy JSON extraction + repair
     ├── learning-loop.js     270 ln  ★ v6 — History I/O, trend analysis, budget auto-tuning, recommendations
-    ├── progress.js          145 ln  Checkpoint/resume persistence
-    ├── progress-updater.js  402 ln  ★ v6.1 — AI-powered progress assessment, status report generation
-    ├── prompt.js             28 ln  Interactive user prompts
     ├── quality-gate.js      372 ln  ★ v6 — 4+1 dimension scoring (+ confidence coverage), retry hints
-    └── retry.js             112 ln  Exponential backoff, parallel map
+    └── retry.js             112 ln  Exponential backoff, parallel map (self-contained defaults)
-prompt.json                  265 ln  ★ v6 — Confidence scoring instructions, evidence-based schema
-process_and_upload.js        115 ln  Backward-compatible entry point with config flag injection (v8.0.0)
+prompt.json                  308 ln  ★ v4.0.0 — Universal content analysis: video, audio, documents, mixed input; auto-detects input type + domain
+process_and_upload.js         14 ln  Backward-compatible shim — delegates to bin/taskex.js
 setup.js                     505 ln  Automated first-time setup & environment validation (v8.0.0)
 ```
@@ -314,14 +318,14 @@ The following features from the original exploration have been **fully implement
 | Feature | Status | Implemented In |
 |---------|--------|----------------|
 | 📊 Confidence Scoring Per Extracted Item | ✅ Done | `prompt.json`, `quality-gate.js`, `markdown.js` |
-| 🔄 Multi-Pass Analysis (Focused Re-extraction) | ✅ Done | `focused-reanalysis.js` (268 ln), pipeline integration |
+| 🔄 Multi-Pass Analysis (Focused Re-extraction) | ✅ Done | `modes/focused-reanalysis.js` (268 ln), pipeline integration |
 | 🧠 Learning & Improvement Loop | ✅ Done | `learning-loop.js` (270 ln), pipeline init + save |
 | 📝 Diff-Aware Compilation | ✅ Done | `diff-engine.js` (280 ln), pipeline output + MD |
 | 🔍 Structured Logging & Observability | ✅ Done | `logger.js` rewritten (303 ln), JSONL + spans + metrics |
 | Parallel segment analysis (via CLI) | ✅ Done | `--parallel-analysis` flag, pipeline batching |
-| 🔎 Smart Change Detection & Progress Tracking | ✅ Done | `git.js` (258 ln), `change-detector.js` (417 ln), `progress-updater.js` (402 ln), pipeline `--update-progress` mode |
-| 🗓️ Deep Dive Document Generation | ✅ Done | `deep-dive.js` (473 ln), pipeline phase 9 |
-| 📝 Dynamic Mode (doc-only generation) | ✅ Done | `dynamic-mode.js` (494 ln), pipeline `--dynamic` route |
+| 🔎 Smart Change Detection & Progress Tracking | ✅ Done | `git.js` (310 ln), `modes/change-detector.js` (417 ln), `modes/progress-updater.js` (402 ln), pipeline `--update-progress` mode |
+| 🗓️ Deep Dive Document Generation | ✅ Done | `modes/deep-dive.js` (473 ln), pipeline phase 9 |
+| 📝 Dynamic Mode (doc-only generation) | ✅ Done | `modes/dynamic-mode.js` (494 ln), pipeline `--dynamic` route |
 | 🤖 Runtime Model Selection | ✅ Done | `config.js` model registry, `cli.js` selector, `--model` flag |
 ---
@@ -416,7 +420,7 @@ The following features from the original exploration have been **fully implement
 | **Slack webhook** — post summary to a channel | ~1 hr | Team-wide visibility |
 | **Segment preview** — show first 3 VTT lines per segment before analyzing | ~30 min | Better UX during processing |
 | **Custom output templates** — Handlebars/Mustache for MD output | ~4 hrs | Teams customize report format |
-| **Audio-only mode** — support .mp3/.wav without video | ~2 hrs | Works for phone calls, podcasts |
+| **~~Audio-only mode~~** | ~~Done~~ | prompt.json v4.0.0 supports audio/doc/mixed — pipeline video requirement is next |
 | **Watch mode** — monitor a folder and auto-process new recordings | ~3 hrs | Hands-free automation |
 | **Git integration** — auto-commit results to repo | ~1 hr | Version-controlled meeting history |
 | **Confidence threshold filter** — CLI flag to exclude LOW confidence items from output | ~1 hr | Cleaner reports on demand |

package/README.md CHANGED Viewed

@@ -1,16 +1,16 @@
 # Task Summary Extractor
-> **v8.1.0** — AI-powered meeting analysis & document generation CLI. Install globally, run anywhere.
+> **v8.3.0** — AI-powered content analysis CLI — meetings, recordings, documents, or any mix. Install globally, run anywhere.
 <p align="center">
   <img src="https://img.shields.io/badge/node-%3E%3D18.0.0-green" alt="Node.js" />
   <img src="https://img.shields.io/badge/gemini-2.5--flash-blue" alt="Gemini" />
   <img src="https://img.shields.io/badge/firebase-11.x-orange" alt="Firebase" />
-  <img src="https://img.shields.io/badge/version-8.1.0-brightgreen" alt="Version" />
+  <img src="https://img.shields.io/badge/version-8.3.0-brightgreen" alt="Version" />
   <img src="https://img.shields.io/badge/npm-task--summary--extractor-red" alt="npm" />
 </p>
-**Record a meeting → get a structured task document.** Or point it at any folder and generate docs from context.
+**Analyze any content → get a structured task document.** Feed it meeting recordings, audio files, documents, or any mix — it extracts work items, action items, blockers, and more. Or point it at any folder and generate docs from context.
 📖 **New here?** Jump to [Setup (3 steps)](#setup-3-steps) — you'll be running in under 5 minutes.
@@ -18,9 +18,9 @@
 ## What It Does
-### 🎥 Video Analysis (default mode)
+### 🎥 Content Analysis (default mode)
-Drop a recording in a folder → run the tool → get a Markdown task document with:
+Drop a recording (video/audio) or documents in a folder → run the tool → get a Markdown task document with:
 - **Tickets** — ID, title, status, assignee, confidence score
 - **Change Requests** — what changed, where, how, why
@@ -191,7 +191,7 @@ Choose what the tool does. Only use one at a time:
 | Flag | Mode | What You Get |
 |------|------|-------------|
-| *(none)* | **Video analysis** | `results.md` — structured task document |
+| *(none)* | **Content analysis** | `results.md` — structured task document |
 | `--dynamic` | **Doc generation** | `INDEX.md` + 3–15 topic documents |
 | `--deep-dive` | **Topic explainers** | `INDEX.md` + per-topic deep-dive docs |
 | `--update-progress` | **Progress check** | `progress.md` — item status via git |
@@ -271,7 +271,7 @@ INFO       --help (-h)  --version (-v)
 ## Output
-### Video Analysis
+### Content Analysis
 ```
 my-meeting/runs/{timestamp}/
@@ -312,12 +312,12 @@ my-meeting/runs/{timestamp}/
 ## Folder Setup Tips
-Drop docs alongside your video to give the AI context. **More context = better extraction.**
+Drop content files and supporting docs in a folder. **More context = better extraction.**
 ```
 my-meeting/
-├── Recording.mp4                  ← Video (required for video mode)
-├── Recording.vtt                  ← Subtitles (highly recommended)
+├── Recording.mp4                  ← Video recording (primary for video mode)
+├── Recording.vtt                  ← Subtitles (highly recommended for recordings)
 ├── agenda.md                      ← Loose docs at root are fine
 │
 ├── .tasks/                        ← Gets priority weighting (optional)
@@ -328,7 +328,7 @@ my-meeting/
     └── requirements.md
 ```
-**Supported formats:** `.mp4` `.mkv` `.webm` `.avi` `.mov` (video) · `.vtt` `.srt` `.txt` `.md` `.csv` `.pdf` (docs)
+**Supported formats:** `.mp4` `.mkv` `.webm` `.avi` `.mov` (video) · `.mp3` `.wav` `.ogg` `.m4a` (audio) · `.vtt` `.srt` `.txt` `.md` `.csv` `.pdf` (docs)
 The tool **recursively scans all subfolders**. `.tasks/` gets highest priority weighting but everything is included.
@@ -406,7 +406,7 @@ GEMINI_API_KEY=your-key-here
 | Feature | Description |
 |---------|-------------|
-| **Video Compression** | H.264 CRF 24, text-optimized sharpening, configurable speed |
+| **Video/Audio Compression** | H.264 CRF 24, text-optimized sharpening, configurable speed |
 | **Smart Segmentation** | ≤5 min chunks with boundary-aware splitting |
 | **Cross-Segment Continuity** | Ticket IDs, names, and context carry forward |
 | **Document Discovery** | Auto-finds docs in all subfolders |
@@ -468,7 +468,7 @@ Your call folders, `.env`, logs, and videos are all `.gitignore`d — nothing ge
 task-summary-extractor/
 ├── bin/
 │   └── taskex.js               Global CLI entry point
-├── process_and_upload.js       Backward-compatible entry point
+├── process_and_upload.js       Backward-compatible entry (delegates to bin/taskex)
 ├── setup.js                    First-time setup & validation
 ├── package.json                Dependencies, scripts, bin config
 ├── prompt.json                 Gemini extraction prompt
@@ -476,15 +476,21 @@ task-summary-extractor/
 ├── src/
 │   ├── config.js               Config, model registry, env vars
 │   ├── logger.js               Structured JSONL logger (triple output)
-│   ├── pipeline.js             Multi-mode orchestrator (1,985 lines)
+│   ├── pipeline.js             Multi-mode orchestrator (~2,000 lines)
 │   ├── services/
 │   │   ├── gemini.js           Gemini AI — 3-strategy file resolution + External URL support
 │   │   ├── firebase.js         Firebase Storage (async I/O)
 │   │   ├── video.js            ffmpeg compression
 │   │   └── git.js              Git CLI wrapper
+│   ├── modes/                  AI-heavy pipeline phase modules
+│   │   ├── deep-dive.js        Topic discovery & deep-dive doc generation
+│   │   ├── dynamic-mode.js     Dynamic document planning & generation
+│   │   ├── focused-reanalysis.js  Targeted reanalysis of weak segments
+│   │   ├── progress-updater.js Git-based progress assessment
+│   │   └── change-detector.js  Git change correlation engine
 │   ├── renderers/
 │   │   └── markdown.js         Report renderer
-│   └── utils/                  21 modules — see ARCHITECTURE.md
+│   └── utils/                  Pure utilities — parsing, retry, budget, config
 │
 ├── QUICK_START.md              Step-by-step setup guide
 ├── ARCHITECTURE.md             Technical deep dive
@@ -512,6 +518,8 @@ task-summary-extractor/
 | Version | Highlights |
 |---------|-----------|
+| **v8.3.0** | **Universal content analysis** — prompt v4.0.0 supports video, audio, documents, and mixed content; input type auto-detection; timestamps conditional on content type; gemini.js bridge text generalized; all markdown docs updated |
+| **v8.2.0** | **Architecture cleanup** — `src/modes/` for AI pipeline phases, `retry.js` self-contained defaults, dead code removal, export trimming, `process_and_upload.js` slim shim, `progress.js` → `checkpoint.js`, merged `prompt.js` into `cli.js` |
 | **v8.1.0** | **Smart global config** — `taskex config` persistent setup (`~/.taskexrc`), first-run prompting, 5-level config resolution, production audit fixes, shared CLI flag injection, boolean flag parser fix |
 | **v8.0.0** | **npm package** — `npm i -g task-summary-extractor`, `taskex` global CLI, `--gemini-key` / `--firebase-*` config flags, run from anywhere, CWD-first `.env` resolution |
 | **v7.2.3** | Production hardening — cross-platform ffmpeg, shell injection fix, auto git init for progress tracking, `runs/` excluded from doc discovery |

package/package.json CHANGED Viewed

@@ -1,10 +1,10 @@
 {
   "name": "task-summary-extractor",
-  "version": "8.1.0",
+  "version": "8.3.0",
   "description": "AI-powered meeting analysis & document generation CLI — video + document processing, deep dive docs, dynamic mode, interactive CLI with model selection, confidence scoring, learning loop, git progress tracking",
   "main": "process_and_upload.js",
   "bin": {
-    "taskex": "./bin/taskex.js"
+    "taskex": "bin/taskex.js"
   },
   "files": [
     "bin/",

package/process_and_upload.js CHANGED Viewed

@@ -1,107 +1,14 @@
 #!/usr/bin/env node
 /**
- * taskex — AI-powered meeting analysis & document generation.
+ * Backward-compatible entry point — delegates to bin/taskex.js.
  *
- * Backward-compatible entry point — delegates to src/pipeline.js.
- * For global installs, use the `taskex` command directly.
+ * For global installs, use the `taskex` CLI command directly.
+ * This file exists for `node process_and_upload.js` and `npm start` compatibility.
  *
  * Usage:
- *   taskex [options] [folder]
- *   node process_and_upload.js [options] "C:\path\to\call folder"
+ *   taskex [options] [folder]                      (recommended)
+ *   node process_and_upload.js [options] [folder]   (legacy)
  *
- * Config flags (override .env):
- *   --gemini-key <key>          Gemini API key
- *   --firebase-key <key>        Firebase API key
- *   --firebase-project <id>     Firebase project ID
- *   --firebase-bucket <bucket>  Firebase storage bucket
- *   --firebase-domain <domain>  Firebase auth domain
- *
- * Options:
- *   --name <name>              Your name (skips interactive prompt)
- *   --model <id>               Gemini model (default: gemini-2.5-flash)
- *   --skip-upload              Skip Firebase Storage uploads
- *   --force-upload             Upload even if remote file exists
- *   --no-storage-url           Disable Storage URL strategy for Gemini
- *   --skip-compression         Skip video compression (use existing segments)
- *   --skip-gemini              Skip Gemini AI analysis
- *   --resume                   Resume from last checkpoint
- *   --reanalyze                Force re-analysis of all segments
- *   --parallel <n>             Max parallel uploads (default: 3)
- *   --parallel-analysis <n>    Max concurrent Gemini analyses (default: 2)
- *   --thinking-budget <n>      Gemini thinking token budget
- *   --compilation-thinking-budget <n>  Compilation thinking budget
- *   --log-level <level>        Log level: debug, info, warn, error
- *   --output <dir>             Custom output directory
- *   --dry-run                  Show what would be done without executing
- *   --dynamic                  Document-only mode (no video required)
- *   --deep-dive                Generate deep-dive documents after analysis
- *   --request <text>           Custom research prompt for deep-dive/dynamic
- *   --update-progress          Smart change detection & progress update
- *   --repo <path>              Git repo path for progress tracking
- *   --no-focused-pass          Disable focused re-analysis pass
- *   --no-learning              Disable learning loop
- *   --no-diff                  Disable diff against previous run
- *   --help, -h                 Show help
- *   --version, -v              Show version
- *
- * Project structure:
- *   src/
- *     config.js               — Environment-based config with validation
- *     logger.js               — Buffered dual-file logger with levels
- *     pipeline.js             — Main orchestrator with CLI flags & progress
- *     services/
- *       firebase.js           — Firebase init, upload with retry, exists checks
- *       gemini.js             — Gemini init, segment analysis with retry
- *       git.js                — Git CLI wrapper for change detection
- *       video.js              — ffmpeg compression, segmentation, probing
- *     renderers/
- *       markdown.js           — Action-focused Markdown renderer
- *     utils/
- *       adaptive-budget.js    — Transcript complexity → thinking budget
- *       change-detector.js    — Git + document change correlation engine
- *       cli.js                — CLI argument parser & interactive prompts
- *       context-manager.js    — Smart context prioritization for Gemini
- *       cost-tracker.js       — Model-specific token cost tracking
- *       deep-dive.js          — AI topic discovery & document generation
- *       diff-engine.js        — Compilation diff between runs
- *       dynamic-mode.js       — Document-only analysis mode
- *       focused-reanalysis.js — Second-pass extraction for weak dimensions
- *       format.js             — Duration/size formatting helpers
- *       fs.js                 — Recursive file discovery
- *       health-dashboard.js   — Quality report builder
- *       json-parser.js        — Robust JSON extraction from AI output
- *       learning-loop.js      — Cross-run history & trend analysis
- *       progress.js           — Pipeline checkpoint/resume persistence
- *       progress-updater.js   — Smart progress assessment & rendering
- *       prompt.js             — Interactive CLI prompts (stdin/stdout)
- *       quality-gate.js       — Multi-dimension confidence scoring
- *       retry.js              — Exponential backoff retry with parallelMap
+ * Run `taskex --help` for full CLI reference.
  */
-'use strict';
-// ── Inject CLI config flags into process.env ──────────────────────────────
-// Must run BEFORE any require() that touches config.js / dotenv
-const { injectCliFlags } = require('./src/utils/inject-cli-flags');
-injectCliFlags();
-// ── Delegate to pipeline ──────────────────────────────────────────────────
-const { run, getLog } = require('./src/pipeline');
-run().catch(err => {
-  // showHelp() throws with code HELP_SHOWN — clean exit, not an error
-  if (err.code === 'HELP_SHOWN' || err.code === 'VERSION_SHOWN') {
-    process.exit(0);
-  }
-  const log = getLog();
-  if (log) {
-    log.error(`FATAL: ${err.message || err}`);
-    log.error(err.stack || '');
-    log.step('FAILED');
-    log.close();
-  }
-  process.stderr.write(`\nFATAL: ${err.message || err}\n`);
-  process.stderr.write(`${err.stack || ''}\n`);
-  process.exit(1);
-});
+require('./bin/taskex');