escribano 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (124)
  1. package/LICENSE +21 -0
  2. package/README.md +297 -0
  3. package/dist/0_types.js +279 -0
  4. package/dist/actions/classify-session.js +77 -0
  5. package/dist/actions/create-contexts.js +44 -0
  6. package/dist/actions/create-topic-blocks.js +68 -0
  7. package/dist/actions/extract-metadata.js +24 -0
  8. package/dist/actions/generate-artifact-v3.js +296 -0
  9. package/dist/actions/generate-artifact.js +61 -0
  10. package/dist/actions/generate-summary-v3.js +260 -0
  11. package/dist/actions/outline-index.js +204 -0
  12. package/dist/actions/process-recording-v2.js +494 -0
  13. package/dist/actions/process-recording-v3.js +412 -0
  14. package/dist/actions/process-session.js +183 -0
  15. package/dist/actions/publish-summary-v3.js +303 -0
  16. package/dist/actions/sync-to-outline.js +196 -0
  17. package/dist/adapters/audio.silero.adapter.js +69 -0
  18. package/dist/adapters/cap.adapter.js +94 -0
  19. package/dist/adapters/capture.cap.adapter.js +107 -0
  20. package/dist/adapters/capture.filesystem.adapter.js +124 -0
  21. package/dist/adapters/embedding.ollama.adapter.js +141 -0
  22. package/dist/adapters/intelligence.adapter.js +202 -0
  23. package/dist/adapters/intelligence.mlx.adapter.js +395 -0
  24. package/dist/adapters/intelligence.ollama.adapter.js +741 -0
  25. package/dist/adapters/publishing.outline.adapter.js +75 -0
  26. package/dist/adapters/storage.adapter.js +81 -0
  27. package/dist/adapters/storage.fs.adapter.js +83 -0
  28. package/dist/adapters/transcription.whisper.adapter.js +206 -0
  29. package/dist/adapters/video.ffmpeg.adapter.js +405 -0
  30. package/dist/adapters/whisper.adapter.js +168 -0
  31. package/dist/batch-context.js +329 -0
  32. package/dist/db/helpers.js +50 -0
  33. package/dist/db/index.js +95 -0
  34. package/dist/db/migrate.js +80 -0
  35. package/dist/db/repositories/artifact.sqlite.js +77 -0
  36. package/dist/db/repositories/cluster.sqlite.js +92 -0
  37. package/dist/db/repositories/context.sqlite.js +75 -0
  38. package/dist/db/repositories/index.js +10 -0
  39. package/dist/db/repositories/observation.sqlite.js +70 -0
  40. package/dist/db/repositories/recording.sqlite.js +56 -0
  41. package/dist/db/repositories/subject.sqlite.js +64 -0
  42. package/dist/db/repositories/topic-block.sqlite.js +45 -0
  43. package/dist/db/types.js +4 -0
  44. package/dist/domain/classification.js +60 -0
  45. package/dist/domain/context.js +97 -0
  46. package/dist/domain/index.js +2 -0
  47. package/dist/domain/observation.js +17 -0
  48. package/dist/domain/recording.js +41 -0
  49. package/dist/domain/segment.js +93 -0
  50. package/dist/domain/session.js +93 -0
  51. package/dist/domain/time-range.js +38 -0
  52. package/dist/domain/transcript.js +79 -0
  53. package/dist/index.js +173 -0
  54. package/dist/pipeline/context.js +162 -0
  55. package/dist/pipeline/events.js +2 -0
  56. package/dist/prerequisites.js +226 -0
  57. package/dist/scripts/rebuild-index.js +53 -0
  58. package/dist/scripts/seed-fixtures.js +290 -0
  59. package/dist/services/activity-segmentation.js +333 -0
  60. package/dist/services/activity-segmentation.test.js +191 -0
  61. package/dist/services/app-normalization.js +212 -0
  62. package/dist/services/cluster-merge.js +69 -0
  63. package/dist/services/clustering.js +237 -0
  64. package/dist/services/debug.js +58 -0
  65. package/dist/services/frame-sampling.js +318 -0
  66. package/dist/services/signal-extraction.js +106 -0
  67. package/dist/services/subject-grouping.js +342 -0
  68. package/dist/services/temporal-alignment.js +99 -0
  69. package/dist/services/vlm-enrichment.js +84 -0
  70. package/dist/services/vlm-service.js +130 -0
  71. package/dist/stats/index.js +3 -0
  72. package/dist/stats/observer.js +65 -0
  73. package/dist/stats/repository.js +36 -0
  74. package/dist/stats/resource-tracker.js +86 -0
  75. package/dist/stats/types.js +1 -0
  76. package/dist/test-classification-prompts.js +181 -0
  77. package/dist/tests/cap.adapter.test.js +75 -0
  78. package/dist/tests/capture.cap.adapter.test.js +69 -0
  79. package/dist/tests/classify-session.test.js +140 -0
  80. package/dist/tests/db/repositories.test.js +243 -0
  81. package/dist/tests/domain/time-range.test.js +31 -0
  82. package/dist/tests/integration.test.js +84 -0
  83. package/dist/tests/intelligence.adapter.test.js +102 -0
  84. package/dist/tests/intelligence.ollama.adapter.test.js +178 -0
  85. package/dist/tests/process-v2.test.js +90 -0
  86. package/dist/tests/services/clustering.test.js +112 -0
  87. package/dist/tests/services/frame-sampling.test.js +152 -0
  88. package/dist/tests/utils/ocr.test.js +76 -0
  89. package/dist/tests/utils/parallel.test.js +57 -0
  90. package/dist/tests/visual-observer.test.js +175 -0
  91. package/dist/utils/id-normalization.js +15 -0
  92. package/dist/utils/index.js +9 -0
  93. package/dist/utils/model-detector.js +154 -0
  94. package/dist/utils/ocr.js +80 -0
  95. package/dist/utils/parallel.js +32 -0
  96. package/migrations/001_initial.sql +109 -0
  97. package/migrations/002_clusters.sql +41 -0
  98. package/migrations/003_observations_vlm_fields.sql +14 -0
  99. package/migrations/004_observations_unique.sql +18 -0
  100. package/migrations/005_processing_stats.sql +29 -0
  101. package/migrations/006_vlm_raw_response.sql +6 -0
  102. package/migrations/007_subjects.sql +23 -0
  103. package/migrations/008_artifacts_recording.sql +6 -0
  104. package/migrations/009_artifact_subjects.sql +10 -0
  105. package/package.json +82 -0
  106. package/prompts/action-items.md +55 -0
  107. package/prompts/blog-draft.md +54 -0
  108. package/prompts/blog-research.md +87 -0
  109. package/prompts/card.md +54 -0
  110. package/prompts/classify-segment.md +38 -0
  111. package/prompts/classify.md +37 -0
  112. package/prompts/code-snippets.md +163 -0
  113. package/prompts/extract-metadata.md +149 -0
  114. package/prompts/notes.md +83 -0
  115. package/prompts/runbook.md +123 -0
  116. package/prompts/standup.md +50 -0
  117. package/prompts/step-by-step.md +125 -0
  118. package/prompts/subject-grouping.md +31 -0
  119. package/prompts/summary-v3.md +89 -0
  120. package/prompts/summary.md +77 -0
  121. package/prompts/topic-classifier.md +24 -0
  122. package/prompts/topic-extract.md +13 -0
  123. package/prompts/vlm-batch.md +21 -0
  124. package/prompts/vlm-single.md +19 -0
@@ -0,0 +1,83 @@
+ # Session Notes
+
+ You are a technical researcher/student taking detailed, research-backed notes from a session.
+
+ ## Context
+ Metadata: {{METADATA}}
+ Visual Log: {{VISUAL_LOG}}
+ Detected Language: {{LANGUAGE}}
+
+ ## Visual Integration Rule
+ Include screenshots to illustrate complex concepts or UI layouts using `[SCREENSHOT: timestamp]`.
+
+ ## Language Rule
+ Use English for all headings, structural elements, and organizational labels. The technical content, step-by-step explanations, research findings, and core concepts must be written in the original language ({{LANGUAGE}}).
+
+ ## Structure
+
+ ### 1. Session Overview (Summary)
+ Write a concise 3-5 sentence summary synthesizing the key themes, objectives, and outcomes of this session. This is your "bottom of the page" Cornell-style summary—capture the essence in your own words.
+
+ ### 2. Key Questions & Cues
+ List 5-8 questions or keywords that capture the main themes and can serve as recall triggers when reviewing these notes later. Frame them as questions where possible (e.g., "What is...", "Why does...", "How to...").
+
+ Example format:
+ - **What**: [core concept name]
+ - **Why**: [rationale/purpose]
+ - **How**: [implementation or process]
+ - **Key Terms**: [important technical terms]
+
+ ### 3. Main Concepts & Atomic Ideas
+ For each significant concept discussed, create a focused section with:
+ - **Concept Name** (English heading)
+ - **Definition**: What it is, in original language ({{LANGUAGE}})
+ - **Why It Matters**: The purpose, problem solved, or relevance
+ - **Key Details**: Specific technical aspects, constraints, or considerations
+ - **Connections**: How this relates to other concepts in this session
+
+ Organize these as distinct "atomic notes"—one clear idea per section.
+
+ ### 4. Technical Details & Examples
+ Capture specific technical information with context:
+
+ **Commands & Code**
+ - Code snippets or commands (in original language {{LANGUAGE}})
+ - Purpose/what it does
+ - Parameters and their meanings
+ - Example usage scenarios
+
+ **Problems & Solutions**
+ - Challenge or issue described
+ - Troubleshooting approach taken
+ - Resolution and why it worked
+ - Alternative approaches mentioned
+
+ **Architectural Decisions**
+ - Design choices made
+ - Trade-offs considered
+ - Rationale for final decision
+
+ ### 5. References & Resources
+ List all references mentioned with context:
+ - Documentation links (with brief description of relevance)
+ - Tools, libraries, or frameworks (with version info if mentioned)
+ - Related reading or follow-up research
+ - Dependencies or prerequisites
+
+ ### 6. Action Items & Next Steps
+ Capture concrete actions identified during the session:
+ - Tasks to complete
+ - Experiments to try
+ - Topics to research further
+ - Decisions requiring follow-up
+
+ ## Guidelines for Effective Notes
+ - **Paraphrase, Don't Transcribe**: Rewrite ideas in your own words rather than copying verbatim.
+ - **Be Specific**: Include actual code, command output, or technical details rather than vague descriptions.
+ - **Capture the "Why"**: Always explain why something matters, not just what it is.
+ - **Use Examples**: Include concrete examples discussed or referenced.
+ - **Note Uncertainties**: Mark areas that were unclear or require further investigation.
+ - **Link Ideas**: When concepts relate, explicitly state the connection.
+
+ ## Transcript
+ {{TRANSCRIPT_ALL}}
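All of these prompt templates rely on double-brace placeholders ({{METADATA}}, {{VISUAL_LOG}}, {{TRANSCRIPT_ALL}}, and so on). The substitution step can be sketched roughly as below; this is a minimal illustration assuming plain string replacement with no escaping, and `renderPrompt` is a hypothetical helper, not the package's actual renderer.

```javascript
// Replace {{NAME}} placeholders in a prompt template with provided values.
// Throws on placeholders left unfilled, so a missing variable fails loudly
// instead of leaking literal "{{NAME}}" text into the LLM prompt.
function renderPrompt(template, vars) {
  const rendered = template.replace(/\{\{(\w+)\}\}/g, (whole, name) =>
    name in vars ? String(vars[name]) : whole
  );
  const leftover = rendered.match(/\{\{\w+\}\}/g);
  if (leftover) {
    throw new Error(`Unfilled placeholders: ${[...new Set(leftover)].join(", ")}`);
  }
  return rendered;
}
```

The fail-loud check matters here because several templates only differ by which variables they expect (e.g., {{TECHNICAL_TERMS}} appears only in the runbook prompt).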
@@ -0,0 +1,123 @@
+ # Debugging Runbook
+ You are a senior engineer documenting a troubleshooting session.
+
+ ## Context
+ Metadata: {{METADATA}}
+ Visual Log: {{VISUAL_LOG}}
+ Detected Language: {{LANGUAGE}}
+
+ ## Instructions
+
+ ### Visual Integration Rule
+ You MUST illustrate the runbook by requesting screenshots at critical moments (e.g., when an error message appears, when a fix is verified). Use the tag `[SCREENSHOT: timestamp]` where timestamp is the exact seconds.
+
+ Example: "The console showed a 404 error [SCREENSHOT: 45.5]."
+
+ ### Language Rule
+ Use English for all headings, structural elements, and section labels. All technical details, error messages, specific troubleshooting steps, resolution explanations, and code examples must remain in the original language ({{LANGUAGE}}).
+
+ ### Blameless Documentation Principle
+ Focus on systems, processes, and contributing factors—not on individuals or teams. Assume everyone involved had good intentions and acted with the information available at the time. Document what happened, why it happened systemically, and how to prevent it—not who is to blame.
+
+ ## Structure
+
+ ### 1. Summary
+ **Provide a concise, high-level overview of the troubleshooting session.**
+ - What was broken or failing?
+ - What was the primary symptom observed?
+ - What was the final outcome?
+
+ ### 2. Impact Assessment
+ **Document the effect of the issue.**
+ - What was affected? (e.g., users, services, features, data)
+ - How severe was the impact? (e.g., critical degradation, partial outage, localized issue)
+ - Any quantifiable metrics? (e.g., error rate, latency, affected users)
+
+ ### 3. Detection
+ **How was the issue discovered?**
+ - What monitoring, alerting, or user report identified the problem?
+ - When was it first noticed?
+ - What triggered the investigation?
+
+ ### 4. Timeline
+ **Chronological account of key events during troubleshooting.**
+ - Use timestamps where available from the transcript
+ - Include major actions taken and decisions made
+ - Note any shifts in investigation direction or hypothesis
+ - Format: `[Time/Sequence] — Actor/Context — Action/Observation`
+
+ ### 5. Problem Description
+ **Detailed description of what was broken or failing.**
+ - Expected behavior vs. actual behavior
+ - Specific error messages from {{TECHNICAL_TERMS}}
+ - Symptoms observed (e.g., latency, errors, incorrect results)
+ - Scope of the issue (how widespread?)
+
+ ### 6. Investigation Steps
+ **Document the path taken to identify the root cause.**
+ - What hypotheses were formed and tested?
+ - What diagnostic tools or approaches were used?
+ - Which paths were explored and ruled out?
+ - How did the investigation narrow down to the cause?
+
+ ### 7. Root Cause(s)
+ **Identify the underlying issue(s) that caused the problem.**
+ - Primary root cause (most direct cause)
+ - Contributing factors (if applicable—e.g., configuration issues, system interactions, recent changes)
+ - Use "5 Whys" approach if helpful: trace back from symptom to deeper systemic cause
+
+ ### 8. Trigger (if applicable)
+ **If the issue was triggered by a specific event, identify it.**
+ - What latent bug was activated?
+ - What change, event, or condition triggered the failure?
+ - Distinguish between the trigger (what activated it) and the root cause (the underlying flaw)
+
+ ### 9. Resolution
+ **How the issue was fixed or the solution applied.**
+ - Specific steps taken to resolve the issue
+ - Immediate mitigation vs. long-term fix
+ - Any configuration changes, code changes, or workarounds
+
+ ### 10. Verification
+ **How to verify the fix is working.**
+ - What tests or checks confirm the issue is resolved?
+ - What metrics or behaviors should return to normal?
+ - How to ensure no regressions?
+
+ ### 11. Lessons Learned
+ **Reflect on what the session revealed about the system and process.**
+
+ **What Went Well:**
+ - What worked effectively during troubleshooting?
+ - What tools, processes, or approaches helped resolve the issue quickly?
+ - What should be replicated in future sessions?
+
+ **What Went Wrong:**
+ - What could have been done better or faster?
+ - What information was missing or delayed?
+ - What made investigation difficult?
+
+ **Where We Got Lucky (Near Misses):**
+ - What prevented this from being worse?
+ - What fortunate circumstances helped resolution?
+
+ ### 12. Action Items
+ **Concrete follow-up items to prevent recurrence or improve future troubleshooting.**
+
+ | Action Item | Type | Owner | Status |
+ |-------------|------|-------|--------|
+ | [Specific action] | [Prevent/Mitigate/Improve] | [Responsible person/team] | [TODO/DONE/In Progress] |
+
+ **Types:**
+ - **Prevent**: Changes to eliminate this root cause
+ - **Mitigate**: Measures to reduce impact if it recurs
+ - **Improve**: Process/tooling improvements for faster troubleshooting
+
+ ### 13. Supporting Evidence
+ **Links or references to additional context.**
+ - Logs, metrics, screenshots, or monitoring dashboards referenced
+ - Documentation, playbooks, or runbooks consulted
+ - Related bugs, issues, or pull requests
+
+ ## Transcript
+ {{TRANSCRIPT_ALL}}
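Several of these prompts instruct the model to emit `[SCREENSHOT: timestamp]` tags, which implies a post-processing pass that swaps each tag for an extracted frame. A rough sketch of that pass follows; the file-naming scheme (`frames/<seconds>.jpg`) and the `resolveScreenshotTags` helper are assumptions for illustration, not the package's actual artifact pipeline.

```javascript
// Resolve [SCREENSHOT: 45.5] tags in generated markdown into image links,
// assuming frames were extracted to files named by timestamp in seconds.
function resolveScreenshotTags(markdown, frameDir = "frames") {
  return markdown.replace(/\[SCREENSHOT:\s*([\d.]+)\]/g, (tag, ts) => {
    const seconds = Number(ts);
    if (Number.isNaN(seconds)) return tag; // leave malformed tags untouched
    return `![Screenshot at ${seconds}s](${frameDir}/${seconds.toFixed(1)}.jpg)`;
  });
}
```

Keeping the tag format machine-trivial to find with a regex is presumably why the prompts insist on the exact `[SCREENSHOT: timestamp]` spelling.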
@@ -0,0 +1,50 @@
+ # Standup Format - Bullet-Point Status Update
+
+ You are generating a standup-style status update from a work session. Focus on what was accomplished and what's next.
+
+ ## Session Metadata
+ - **Duration:** {{SESSION_DURATION}}
+ - **Date:** {{SESSION_DATE}}
+
+ ## Work Done
+
+ {{WORK_SUBJECTS}}
+
+ ---
+
+ ## Instructions
+
+ Generate a concise standup update with three sections:
+
+ 1. **What I did** - 3-5 bullet points of main activities
+ 2. **Key outcomes** - 2-3 concrete results or progress
+ 3. **Next steps** - 1-3 items for next session
+
+ **Format example:**
+
+ ```markdown
+ ## Standup - Feb 25, 2026
+
+ **What I did:**
+ - Optimized Escribano scene detection pipeline
+ - Fixed LLM truncation and database constraint errors
+ - Benchmarked MLX vs Ollama VLM models
+ - Reviewed competitor architecture (Screenpipe)
+
+ **Key outcomes:**
+ - Scene detection reduced from 6119s to 166s (20.6x speedup)
+ - VLM batch inference working with new skip-frame strategy
+ - Identified qwen3_next as candidate for inference improvements
+
+ **Next:**
+ - Merge perf/scene-detection-skip-keyframes branch
+ - Test qwen3_next model for inference improvements
+ - Add unit tests for mlx_bridge.py
+ ```
+
+ **Rules:**
+ - Maximum 10-12 lines total
+ - Be specific, not generic
+ - Focus on accomplishments, not activities
+ - Skip personal content entirely
+ - Use present tense
@@ -0,0 +1,125 @@
+ # Step-by-Step Guide
+ You are a technical writer creating a **how-to guide** (goal-oriented procedural documentation) from a demonstration session. This guide helps users who already know what they want to achieve by providing clear, actionable steps.
+
+ ## Context
+ Metadata: {{METADATA}}
+ Visual Log: {{VISUAL_LOG}}
+ Detected Language: {{LANGUAGE}}
+
+ ## Visual Integration Rule
+ You MUST illustrate each major step by requesting a screenshot. Use the tag `[SCREENSHOT: timestamp]` where timestamp is the seconds from the Metadata or Visual Log.
+
+ Example:
+ 1. Open the project configuration [SCREENSHOT: 12.0].
+ 2. Update the API endpoint in `.env`.
+
+ ## Language Rule
+ Use English for headings, structural elements, and section labels. The actual instructions, technical explanations, command descriptions, and all procedural content must remain in the original language ({{LANGUAGE}}).
+
+ ## Structure Requirements
+
+ ### 1. Problem Statement (What This Guide Solves)
+ Begin with a clear statement of the problem or task this guide addresses. Answer: "What will the reader accomplish?"
+
+ ### 2. Prerequisites
+ List requirements in a bulleted list. Include:
+ - Software, tools, or versions needed
+ - Access or permissions required
+ - Prior knowledge or skills assumed
+ - Files or resources to have ready
+
+ ### 3. Step-by-Step Instructions
+ Follow these strict formatting rules:
+
+ **Introductory Sentence**: Provide context that isn't in the heading. Don't repeat the heading.
+
+ **Step Format**:
+ - Each step must start with an **imperative verb**
+ - Use **complete sentences**
+ - Maintain **parallel structure** (consistent verb form)
+ - **State the goal before the action** when it clarifies purpose
+ - **State the location/context before the action** (e.g., "In the terminal, run...")
+ - **State the action first, then the result** or justification
+
+ **Multi-Action Steps**: Combine small related actions using angle brackets: `Click **File > New > Document**`
+
+ **Sub-steps**:
+ - Use lowercase letters for sub-steps
+ - Use lowercase Roman numerals for sub-sub-steps
+ - End parent step with colon or period
+
+ **Optional Steps**: Prefix with "Optional:" (not "(Optional)")
+
+ **Single-Step Procedures**: Format as bullet list, not numbered
+
+ **Command Steps**: Follow this order:
+ 1. Describe what the command does (imperative)
+ 2. Show the command in code block
+ 3. Explain placeholders (e.g., "Replace `NAME` with...")
+ 4. Explain the command's function if necessary
+ 5. Show expected output
+ 6. Explain the result
+
+ **Example**:
+ ```
+ 1. Plan the Terraform deployment:
+
+ terraform plan -out=NAME
+
+ Replace `NAME` with the name of your Terraform plan.
+
+ The `terraform plan` command creates an execution plan showing what resources will be added, changed, or destroyed.
+
+ The output is similar to the following:
+
+ Plan: 26 to add, 0 to change, 0 to destroy.
+
+ This output shows what resources to add, change, or destroy.
+ ```
+
+ ### 4. Expected Result
+ Describe what success looks like after completing all steps. Include:
+ - What the reader should see or have
+ - How to verify the result
+ - What the reader can do next
+
+ ### 5. Troubleshooting
+ Address common issues mentioned in the transcript. For each issue:
+ - State the problem clearly
+ - Provide the solution
+ - Explain why it occurred (briefly)
+
+ ## Writing Principles (Anti-patterns to Avoid)
+
+ ❌ **Don't** use directional language ("above", "below", "right-hand side")
+ ❌ **Don't** say "please"
+ ❌ **Don't** say "run the following command" (focus on what it does)
+ ❌ **Don't** include keyboard shortcuts (just say what to do)
+ ❌ **Don't** give alternate ways to complete a task (pick the best one)
+ ❌ **Don't** over-explain or include unnecessary background (this is a how-to guide, not a tutorial or explanation)
+ ❌ **Don't** repeat procedure headings in introductory sentences
+ ❌ **Don't** make steps too long—split if needed
+
+ ✅ **Do** focus on concrete, actionable steps
+ ✅ **Do** provide visible results early and often
+ ✅ **Do** maintain flow and rhythm between steps
+ ✅ **Do** include exact expected output when helpful
+ ✅ **Do** explain placeholders clearly
+ ✅ **Do** ensure the guide works reliably every time
+
+ ## Quality Checklist
+ - [ ] Each step starts with an imperative verb
+ - [ ] All steps use complete sentences
+ - [ ] Parallel structure is maintained
+ - [ ] Context/location appears before action
+ - [ ] Optional steps are marked "Optional:"
+ - [ ] No directional language used
+ - [ ] No "please" included
+ - [ ] Commands are explained, not introduced with "run"
+ - [ ] Expected output is shown for commands
+ - [ ] Problem statement is clear
+ - [ ] Prerequisites are complete
+ - [ ] Troubleshooting addresses common issues
+
+ ## Transcript
+ {{TRANSCRIPT_ALL}}
@@ -0,0 +1,31 @@
+ You are analyzing a work session that has been divided into {{BLOCK_COUNT}} segments (TopicBlocks).
+
+ Your task is to group these segments into 1-6 coherent SUBJECTS. A subject represents a distinct thread of work (e.g., "Escribano pipeline optimization", "Personal time", "Email and admin", "Research on competitors").
+
+ GROUPING RULES:
+ 1. Group segments that belong to the same work thread, even if they're not consecutive in time
+ 2. Personal activities (WhatsApp, Instagram, social media, personal calls) should be grouped into a "Personal" subject
+ 3. Email/calendar/admin is only its own group when email IS the primary activity — not just because an email app was open in the background
+ 4. Deep work on the same project/codebase should be grouped together
+ 5. Research sessions should be grouped separately from coding sessions unless clearly related
+
+ RULE PRIORITY (when in doubt):
+ - Classify by primary ACTIVITY TYPE and project context, not by which apps happened to be open
+ - If all segments are about the same project, one group is correct — do not invent artificial splits
+
+ SEGMENTS TO GROUP:
+ {{BLOCK_DESCRIPTIONS}}
+
+ For each group, output ONE line in this EXACT format:
+ Group 1: label: [Descriptive subject name] | blockIds: [uuid1, uuid2, uuid3]
+
+ Example output:
+ Group 1: label: Escribano VLM Integration | blockIds: [{{EXAMPLE_BLOCK_IDS}}]
+
+ CRITICAL REQUIREMENTS:
+ - Each group MUST have "label" and "blockIds"
+ - Block IDs are the UUIDs shown in each BLOCK above (copy them exactly)
+ - Include ALL {{BLOCK_COUNT}} block IDs across all groups (every block must be assigned exactly once)
+ - Create 1-6 groups (one group is fine if all work is the same project)
+ - Use clear, descriptive labels for each subject
+ - Output ONLY the group lines — no explanation, no preamble, no markdown
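The `Group N: label: ... | blockIds: [...]` line format above is strict enough to parse with a single regular expression, and the "every block assigned exactly once" requirement is mechanically checkable. A minimal sketch of what a consumer of this prompt's output might do; `parseGroupLine` and `validateCoverage` are hypothetical helpers, not code shown in this diff.

```javascript
// Parse one "Group N: label: ... | blockIds: [...]" line from the model output.
// Returns null for lines that do not match, so callers can retry or surface
// a validation error instead of silently dropping blocks.
function parseGroupLine(line) {
  const m = line.match(/^Group\s+(\d+):\s*label:\s*(.+?)\s*\|\s*blockIds:\s*\[(.*)\]\s*$/);
  if (!m) return null;
  return {
    index: Number(m[1]),
    label: m[2],
    blockIds: m[3].split(",").map((id) => id.trim()).filter(Boolean),
  };
}

// Enforce the critical requirement: every block assigned exactly once.
function validateCoverage(groups, expectedBlockIds) {
  const seen = groups.flatMap((g) => g.blockIds);
  return (
    seen.length === expectedBlockIds.length &&
    new Set(seen).size === seen.length &&
    expectedBlockIds.every((id) => seen.includes(id))
  );
}
```

A failed `validateCoverage` check is a natural trigger for re-prompting, which may be why the prompt repeats the coverage rule under CRITICAL REQUIREMENTS.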
@@ -0,0 +1,89 @@
+ You are a productivity assistant analyzing a developer's work session recording.
+
+ Generate a detailed narrative summary of this work session, organized by themes rather than strict chronology.
+
+ ## Session Metadata
+ - **Duration:** {{SESSION_DURATION}} minutes
+ - **Date:** {{SESSION_DATE}}
+ - **Activities Identified:** {{ACTIVITY_COUNT}}
+
+ ## Activity Timeline
+
+ {{ACTIVITY_TIMELINE}}
+
+ ## Apps & Pages Used
+
+ ### Applications
+ {{APPS_LIST}}
+
+ ### Websites Visited
+ {{URLS_LIST}}
+
+ ## Instructions
+
+ Write a comprehensive yet readable summary that:
+
+ 1. **Groups activities by theme** — combine related work (e.g., all terminal work together, all research together)
+ 2. **Describes the session as a work log** — what was being worked on, with transitions between themes
+ 3. **Includes specifics** from the visual descriptions (file names, app names, error messages, URLs)
+ 4. **Incorporates audio transcript quotes** when they add context (decisions made, explanations spoken)
+ 5. **Uses markdown headers** for major thematic sections (not every activity change)
+ 6. **Ends with structured outcomes** — what was accomplished, what's unresolved, what's next
+
+ Write 500-1500 words depending on session complexity. Be specific, not generic.
+
+ Do NOT include a section listing raw observations — synthesize them into narrative.
+ Do NOT use bullet points for narrative sections — organize into flowing paragraphs.
+ Write in work log style using **FIRST PERSON** present continuous tense:
+ - "Working on..." "Debugging..." "Reviewing..."
+ - "Editing the config file..." "Running tests..." "Checking the logs..."
+ - NOT: "The developer..." "The user was..." "They were..."
+
+ ## Format Example
+
+ ```markdown
+ # Session Summary: [Date]
+
+ ## Overview
+ [Brief 2-3 sentence overview in first person: "Spent 3 hours optimizing the VLM pipeline, achieving a 4x speedup through scene detection and model quantization improvements."]
+
+ ## Timeline
+ * **0:00** (27m): terminal
+ * **27:15** (45m): debugging
+ * **72:00** (30m): research
+ ...
+
+ ## Apps & Pages Used
+
+ ### Applications
+ Terminal, Google Chrome, VS Code
+
+ ### Websites Visited
+ - github.com/owner/repo
+ - docs.example.com/guide
+
+ ## Terminal Work: Model Benchmarking (0:00–27:00)
+ Running benchmark scripts in the terminal to compare VLM model performance. Processing 342 frames through the pipeline and measuring inference speed. The qwen3-vl:4b model shows promising results with 115 tok/s throughput...
+
+ ## Debugging & Optimization (27:00–72:00)
+ Encountering parsing errors in the benchmark script. The JSON output from the VLM is being truncated on later frames. Investigating the root cause by adding debug logging and adjusting the MAX_TOKENS parameter...
+
+ ## Research & Documentation (72:00–102:00)
+ Researching alternative VLM implementations on Google Chrome. Found an arXiv paper comparing vision-language models on standardized benchmarks. Reviewing the GitHub repository for mlx-vlm examples...
+
+ ## Key Outcomes
+
+ ### ✅ Accomplished
+ - Achieved 4x speedup in the processing pipeline
+ - Fixed JSON parsing errors in benchmark script
+ - Documented performance metrics in HTML reports
+
+ ### ⏳ Unresolved
+ - Need to test with larger model (InternVL-14B)
+ - Some frame descriptions still truncated at high batch sizes
+
+ ### ➡️ Next Steps
+ - Integrate 4bit model into production pipeline
+ - Explore continuous batching for parallel processing
+ - Add unit tests for the new adapter
+ ```
@@ -0,0 +1,77 @@
+ # Session Summary
+
+ You are an expert scribe specializing in creating comprehensive, actionable session documentation. Your task is to transform the following transcript into a professional session summary that stakeholders can reference for decision-making and follow-up.
+
+ ## Context
+ **Metadata**: {{METADATA}}
+ **Visual Log**: {{VISUAL_LOG}}
+ **Detected Language**: {{LANGUAGE}}
+
+ ## Visual Integration Rule
+ If the session involves visual demonstrations or screen-sharing, include screenshots of major moments using the tag `[SCREENSHOT: timestamp]`.
+
+ ## Instructions
+
+ ### Language Rule
+ - Use English for all headings, structure, and meta-analysis
+ - All actual discussion content, quotes, and explanations must remain in the original language ({{LANGUAGE}})
+
+ ### Structure Requirements
+
+ Create a summary with the following sections:
+
+ #### 1. Session Overview
+ A concise 2-3 sentence summary answering:
+ - What was the primary purpose of this session?
+ - What was the main outcome or result?
+ - Who participated (if identifiable)?
+
+ #### 2. Attendees & Context
+ - **Participants**: List identified speakers/participants (use speaker labels from transcript if names unavailable)
+ - **Duration**: Note session length if available in metadata
+ - **Type**: Briefly characterize the session (e.g., planning meeting, technical review, brainstorming, 1-on-1)
+
+ #### 3. Key Discussion Points
+ Organize the main topics discussed. For each topic:
+ - **Topic heading** (English)
+ - Brief bullet points of key points covered (in original language)
+ - Include significant questions raised and responses given
+ - Reference timestamp ranges where relevant (e.g., `[12:34-18:45]`)
+
+ #### 4. Decisions Made
+ List clear conclusions or agreements reached. For each decision:
+ - What was decided (concise, actionable)
+ - Who made or agreed to the decision
+ - Approximate timestamp if referenced in discussion
+ - **Format**: Start with a verb (e.g., "Approved", "Decided", "Agreed to")
+
+ #### 5. Action Items
+ Critical: List all tasks or commitments made. For each action item:
+ - **Action**: Specific task description (what needs to be done)
+ - **Owner**: Who is responsible (person or role)
+ - **Due Date**: When it needs to be completed (if specified; otherwise note "TBD")
+ - **Priority**: High/Medium/Low (infer from context if not stated)
+ - **Related Decision**: Link to relevant decision number if applicable
+
+ #### 6. Open Items & Outstanding Issues
+ Identify topics that were:
+ - Discussed but not resolved
+ - Deferred or tabled for later discussion
+ - Requiring additional information or research
+ - Mark as **"Parking Lot"** if explicitly deferred
+
+ #### 7. Next Steps
+ What happens after this session:
+ - **Follow-up Meeting**: Date/time if scheduled
+ - **Immediate Next Actions**: Most urgent items to address
+ - **Dependencies**: What blocks progress on open items
+
+ #### 8. Supporting References
+ - **Links/References**: Any documents, URLs, or resources mentioned
+ - **Key Metrics**: Numbers, dates, or data points highlighted
+ - **Related Sessions**: References to previous or planned future sessions (if mentioned)
+
+ ---
+
+ ## Transcript
+ {{TRANSCRIPT_ALL}}
@@ -0,0 +1,24 @@
+ # Topic Classification Prompt
+
+ You are analyzing a cluster of observations from a screen recording session.
+
+ ## Input
+ A list of observation summaries containing:
+ - OCR text from screenshots
+ - VLM descriptions of visual content
+ - Audio transcripts
+
+ ## Task
+ Generate 1-3 specific, descriptive topic labels that capture what the user was doing.
+
+ ## Rules
+ - Be specific: "debugging whisper hallucinations" not just "debugging"
+ - Be descriptive: "learning Ollama embeddings" not just "learning"
+ - Focus on the USER'S ACTIVITY, not just visible content
+ - Max 3 topics per cluster
+ - Output MUST be valid JSON
+
+ ## Output Format
+ ```json
+ {"topics": ["topic 1", "topic 2"]}
+ ```
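Since the prompt requires valid JSON in a fixed shape, a caller will typically want to validate the model's reply before using it. The following is a hypothetical sketch of such a check (`parseTopics` and its fence-stripping behavior are assumptions for illustration, not this package's actual code); it also enforces the prompt's cap of three topics per cluster.

```typescript
// Hypothetical validator for the {"topics": [...]} reply shape.
type TopicResult = { topics: string[] };

function parseTopics(raw: string): TopicResult {
  // Models sometimes wrap JSON in a markdown fence; strip it defensively.
  const cleaned = raw.replace(/```(?:json)?/g, "").trim();
  const parsed = JSON.parse(cleaned);
  if (
    !Array.isArray(parsed.topics) ||
    parsed.topics.some((t: unknown) => typeof t !== "string")
  ) {
    throw new Error('expected {"topics": string[]}');
  }
  // Enforce the prompt's "max 3 topics per cluster" rule on the caller side too.
  return { topics: parsed.topics.slice(0, 3) };
}
```

Truncating rather than rejecting an over-long list is a design choice: the extra labels are harmless, while a hard failure would force a model retry.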
@@ -0,0 +1,13 @@
+ Analyze these observations from a screen recording session and generate 1-3 descriptive topic labels.
+
+ Observations:
+ {{OBSERVATIONS}}
+
+ Output ONLY a JSON object with this format:
+ {"topics": ["specific topic 1", "specific topic 2"]}
+
+ Rules:
+ - Be specific: "debugging TypeScript errors" not just "debugging"
+ - Be descriptive: "learning React hooks" not just "learning"
+ - Focus on what the user is DOING, not just what's visible
+ - Max 3 topics
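These templates use `{{NAME}}` placeholders (`{{OBSERVATIONS}}`, `{{FRAME_COUNT}}`, `{{TRANSCRIPT_ALL}}`) that must be filled before the prompt is sent. A minimal sketch of that substitution step, assuming a simple token-replace scheme (not necessarily how this package renders its templates):

```typescript
// Fill {{NAME}} tokens from a variable map. Unknown tokens are left
// untouched so a missing variable is visible in the rendered prompt
// rather than silently dropped.
function renderTemplate(template: string, vars: Record<string, string>): string {
  return template.replace(/\{\{(\w+)\}\}/g, (match, name) => vars[name] ?? match);
}
```

For example, `renderTemplate("Observations:\n{{OBSERVATIONS}}", { OBSERVATIONS: "- OCR: npm test output" })` yields the prompt body with the observation list inlined.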
@@ -0,0 +1,21 @@
+ Analyze these {{FRAME_COUNT}} screenshots from a screen recording.
+
+ For each frame, output ONE line in this EXACT format:
+ Frame 1: description: [what user is doing + context/intent] | activity: [one word] | apps: [list] | topics: [list]
+
+ Activity MUST be one of: debugging coding review meeting research reading terminal other
+
+ Good descriptions capture WHAT the user is doing, WHAT they're working on, and WHY:
+ - "Fixing TypeScript type error in the fetch handler after a failed API integration test" (not just "debugging error")
+ - "Reading Qwen3-VL documentation to understand multimodal token format for the VLM adapter" (not just "reading docs")
+ - "Searching Stack Overflow for React useEffect cleanup patterns to fix a memory leak" (not just "browsing")
+ - "Reviewing PR #142 which adds batch processing to the MLX inference pipeline" (not just "reviewing PR")
+ - "Running database migrations in terminal to add the new observations table schema" (not just "in terminal")
+ - "Watching a YouTube tutorial on SQLite query optimization for the frame sampling service" (not just "watching video")
+
+ Example output:
+ Frame 1: description: Fixing TypeScript type error in the fetch handler after a failed API integration test | activity: debugging | apps: [VS Code, Chrome] | topics: [TypeScript, API]
+ Frame 2: description: Reading Qwen3-VL documentation to understand multimodal token format for the VLM adapter | activity: reading | apps: [Chrome] | topics: [Qwen3-VL, VLM]
+ Frame 3: description: Running database migrations in terminal to add the new observations table schema | activity: terminal | apps: [iTerm, VS Code] | topics: [SQLite, migrations]
+
+ Now analyze all {{FRAME_COUNT}} frames:
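The pipe-delimited line format above is effectively a small wire protocol between the VLM and the rest of the pipeline. A hypothetical parser for it might look like this (the `parseFrameLine` name and `FrameObservation` shape are illustrative assumptions, not this package's actual API); it returns `null` on malformed lines so one bad reply does not abort the batch.

```typescript
// Parse one "Frame N: description: ... | activity: ... | apps: [...] | topics: [...]" line.
interface FrameObservation {
  frame: number;
  description: string;
  activity: string;
  apps: string[];
  topics: string[];
}

function parseFrameLine(line: string): FrameObservation | null {
  const m = line.match(
    /^Frame (\d+): description: (.*?) \| activity: (\w+) \| apps: \[(.*?)\] \| topics: \[(.*?)\]$/
  );
  if (!m) return null; // tolerate malformed model output
  const toList = (s: string) =>
    s.split(",").map((x) => x.trim()).filter(Boolean);
  return {
    frame: Number(m[1]),
    description: m[2],
    activity: m[3],
    apps: toList(m[4]),
    topics: toList(m[5]),
  };
}
```

The lazy `(.*?)` before `| activity:` keeps a description containing colons intact, and the `\w+` on activity matches the prompt's one-word constraint.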
@@ -0,0 +1,19 @@
+ Analyze this screenshot from a screen recording.
+
+ Output ONE line in this EXACT format:
+ description: [what user is doing + context/intent] | activity: [one word] | apps: [list] | topics: [list]
+
+ Activity MUST be one of: debugging coding review meeting research reading terminal other
+
+ Good descriptions capture WHAT the user is doing, WHAT they're working on, and WHY:
+ - "Fixing TypeScript type error in the fetch handler after a failed API integration test" (not just "debugging error")
+ - "Reading Qwen3-VL documentation to understand multimodal token format for the VLM adapter" (not just "reading docs")
+ - "Searching Stack Overflow for React useEffect cleanup patterns to fix a memory leak" (not just "browsing")
+ - "Reviewing PR #142 which adds batch processing to the MLX inference pipeline" (not just "reviewing PR")
+ - "Running database migrations in terminal to add the new observations table schema" (not just "in terminal")
+ - "Watching a YouTube tutorial on SQLite query optimization for the frame sampling service" (not just "watching video")
+
+ Example:
+ description: Fixing TypeScript type error in the fetch handler after a failed API integration test | activity: debugging | apps: [VS Code, Chrome] | topics: [TypeScript, API]
+
+ Now analyze the screenshot: