npm - whspr - Versions diffs - 1.0.14 → 1.0.15 - Mend

whspr 1.0.14 → 1.0.15

This diff shows the differences between the contents of two publicly available package versions, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the package versions as they appear in their respective public registries.

Files changed (7)

package/README.md CHANGED Viewed

@@ -43,6 +43,11 @@ whspr
 # With verbose output
 whspr --verbose
+# Pipe output to another command (instead of clipboard)
+whspr --pipe "pbcopy"              # Explicit clipboard
+whspr --pipe "claude"              # Pipe directly to Claude Code
+whspr -p "cat >> notes.txt"        # Append to a file
 ```
 Press **Enter** to stop recording.
@@ -53,9 +58,12 @@ Press **Enter** to stop recording.
 - 15-minute max recording time
 - Transcription via Groq Whisper API
 - AI-powered post-processing to fix transcription errors
+- Progress bar during post-processing
+- Cost tracking for Anthropic models
 - Custom vocabulary support via `WHSPR.md` (global and local)
 - Configurable settings via `~/.whspr/settings.json`
-- Automatic clipboard copy
+- Automatic clipboard copy (or pipe to any command with `--pipe`)
+- Optional auto-save for transcriptions and audio files
 ## Settings
@@ -70,40 +78,46 @@ Create `~/.whspr/settings.json` to customize whspr's behavior:
   "model": "groq:openai/gpt-oss-120b",
   "systemPrompt": "Your task is to clean up transcribed text...",
   "customPromptPrefix": "Here's my custom user prompt:",
-  "transcriptionPrefix": "Here's my raw transcription output:"
+  "transcriptionPrefix": "Here's my raw transcription output:",
+  "alwaysSaveTranscriptions": false,
+  "alwaysSaveAudio": false,
+  "saveTranscriptionsToCwd": false
 }
 ```
-| Option | Type | Default | Description |
-|--------|------|---------|-------------|
-| `verbose` | boolean | `false` | Enable verbose output |
-| `suffix` | string | none | Text appended to all transcriptions |
-| `transcriptionModel` | string | `"whisper-large-v3-turbo"` | Whisper model (`"whisper-large-v3"` or `"whisper-large-v3-turbo"`) |
-| `language` | string | `"en"` | ISO 639-1 language code (e.g., `"en"`, `"zh"`, `"es"`) |
-| `model` | string | `"groq:openai/gpt-oss-120b"` | Post-processing model in `provider:model-name` format (see below) |
-| `systemPrompt` | string | (built-in) | System prompt for AI post-processing |
-| `customPromptPrefix` | string | `"Here's my custom user prompt:"` | Prefix before custom prompt content |
-| `transcriptionPrefix` | string | `"Here's my raw transcription output that I need you to edit:"` | Prefix before raw transcription |
+| Option                     | Type    | Default                                                         | Description                                                                    |
+| -------------------------- | ------- | --------------------------------------------------------------- | ------------------------------------------------------------------------------ |
+| `verbose`                  | boolean | `false`                                                         | Enable verbose output                                                          |
+| `suffix`                   | string  | none                                                            | Text appended to all transcriptions                                            |
+| `transcriptionModel`       | string  | `"whisper-large-v3-turbo"`                                      | Whisper model (`"whisper-large-v3"` or `"whisper-large-v3-turbo"`)             |
+| `language`                 | string  | `"en"`                                                          | ISO 639-1 language code (e.g., `"en"`, `"zh"`, `"es"`)                         |
+| `model`                    | string  | `"groq:openai/gpt-oss-120b"`                                    | Post-processing model in `provider:model-name` format (see below)              |
+| `systemPrompt`             | string  | (built-in)                                                      | System prompt for AI post-processing                                           |
+| `customPromptPrefix`       | string  | `"Here's my custom user prompt:"`                               | Prefix before custom prompt content                                            |
+| `transcriptionPrefix`      | string  | `"Here's my raw transcription output that I need you to edit:"` | Prefix before raw transcription                                                |
+| `alwaysSaveTranscriptions` | boolean | `false`                                                         | Always save transcription text files to `~/.whspr/transcriptions/`             |
+| `alwaysSaveAudio`          | boolean | `false`                                                         | Always save audio MP3 files to `~/.whspr/recordings/`                          |
+| `saveTranscriptionsToCwd`  | boolean | `false`                                                         | Save transcriptions to current directory instead of `~/.whspr/transcriptions/` |
 ### Supported Providers
 The `model` setting uses a `provider:model-name` format. Supported providers:
-| Provider | API Key Required |
-|----------|------------------|
-| `groq` | `GROQ_API_KEY` |
+| Provider    | API Key Required    |
+| ----------- | ------------------- |
+| `groq`      | `GROQ_API_KEY`      |
 | `anthropic` | `ANTHROPIC_API_KEY` |
 ### Common Models
-| Provider | Model | Description |
-|----------|-------|-------------|
-| `anthropic` | `claude-sonnet-4-5` | Balanced speed and quality (recommended) |
-| `anthropic` | `claude-haiku-4-5` | Fastest responses, smaller model |
-| `anthropic` | `claude-opus-4-5` | Best quality, slower and more expensive |
-| `groq` | `openai/gpt-oss-120b` | Default model |
-| `groq` | `llama-3.3-70b-versatile` | Fast, versatile Llama model |
-| `groq` | `moonshotai/kimi-k2-instruct-0905` | Moonshot Kimi model |
+| Provider    | Model                              | Description                              |
+| ----------- | ---------------------------------- | ---------------------------------------- |
+| `anthropic` | `claude-sonnet-4-5`                | Balanced speed and quality (recommended) |
+| `anthropic` | `claude-haiku-4-5`                 | Fastest responses, smaller model         |
+| `anthropic` | `claude-opus-4-5`                  | Best quality, slower and more expensive  |
+| `groq`      | `openai/gpt-oss-120b`              | Default model                            |
+| `groq`      | `llama-3.3-70b-versatile`          | Fast, versatile Llama model              |
+| `groq`      | `moonshotai/kimi-k2-instruct-0905` | Moonshot Kimi model                      |
 > **Note:** Model names are set by the providers and may change at any time. Check [Groq Models](https://console.groq.com/docs/models) and [Anthropic Models](https://docs.anthropic.com/en/docs/about-claude/models) for the latest available models.
@@ -116,6 +130,32 @@ The `model` setting uses a `provider:model-name` format. Supported providers:
 }
 ```
+### Example: Auto-save Transcriptions to Current Directory
+```json
+{
+  "alwaysSaveTranscriptions": true,
+  "saveTranscriptionsToCwd": true
+}
+```
+## Pipe Output
+Use `--pipe` (or `-p`) to send the transcription to any command instead of the clipboard:
+```bash
+# Pipe to Claude Code for further processing
+whspr --pipe "claude"
+# Append to a file
+whspr --pipe "cat >> meeting-notes.txt"
+# Send via curl
+whspr --pipe "xargs -I {} curl -X POST -d 'text={}' https://api.example.com"
+```
+If the pipe command fails, whspr falls back to copying to the clipboard.
 ## Custom Vocabulary
 Create a `WHSPR.md` (or `WHISPER.md`) file to provide custom vocabulary, names, or instructions for the AI post-processor.
@@ -152,9 +192,11 @@ When both exist, they are combined (global first, then local).
 3. Converts the recording to MP3
 4. Sends audio to Groq's Whisper API for transcription
 5. Loads custom prompts from `~/.whspr/WHSPR.md` and/or `./WHSPR.md`
-6. Sends transcription + custom vocabulary to AI for post-processing
+6. Sends transcription + custom vocabulary to AI for post-processing (with progress bar)
 7. Applies suffix (if configured)
-8. Prints result and copies to clipboard
+8. Displays result with word count, character count, and cost estimate
+9. Pipes to command (`--pipe`) or copies to clipboard
+10. Saves transcription/audio files (if configured)
 If transcription fails, the recording is saved to `~/.whspr/recordings/` for manual recovery.

package/dist/index.d.ts CHANGED Viewed

@@ -16,4 +16,7 @@ export interface WhsprSettings {
     systemPrompt?: string;
     customPromptPrefix?: string;
     transcriptionPrefix?: string;
+    alwaysSaveTranscriptions?: boolean;
+    alwaysSaveAudio?: boolean;
+    saveTranscriptionsToCwd?: boolean;
 }

package/dist/index.js CHANGED Viewed

@@ -4,10 +4,11 @@ import { transcribe } from "./transcribe.js";
 import { postprocess } from "./postprocess.js";
 import { copyToClipboard } from "./utils/clipboard.js";
 import { calculateCost, formatCost } from "./utils/pricing.js";
-import { renderStartupHeader, formatCompactStats, formatStatus, colors, BOX } from "./ui.js";
+import { renderStartupHeader, formatCompactStats, formatStatus, colors, BOX, } from "./ui.js";
 import fs from "fs";
 import path from "path";
 import os from "os";
+import { spawn } from "child_process";
 // Default prompts (can be overridden in settings.json)
 export const DEFAULTS = {
     transcriptionModel: "whisper-large-v3-turbo",
@@ -27,6 +28,13 @@ const DEFAULT_SETTINGS = {
 };
 const WHSPR_DIR = path.join(os.homedir(), ".whspr");
 const SETTINGS_PATH = path.join(WHSPR_DIR, "settings.json");
+const TRANSCRIPTIONS_DIR = path.join(WHSPR_DIR, "transcriptions");
+const RECORDINGS_DIR = path.join(WHSPR_DIR, "recordings");
+function generateTimestampedFilename(extension) {
+    const now = new Date();
+    const timestamp = now.toISOString().replace(/[:.]/g, "-").slice(0, 19);
+    return `transcription-${timestamp}${extension}`;
+}
 function parseModelProvider(model) {
     const colonIndex = model.indexOf(":");
     if (colonIndex === -1) {
@@ -98,7 +106,40 @@ function loadCustomPrompt(verbose) {
     return { prompt: combinedPrompt, sources };
 }
 const settings = loadSettings();
-const verbose = settings.verbose || process.argv.includes("--verbose") || process.argv.includes("-v");
+const verbose = settings.verbose ||
+    process.argv.includes("--verbose") ||
+    process.argv.includes("-v");
+// Parse --pipe flag
+function getPipeCommand() {
+    const pipeIndex = process.argv.findIndex((arg) => arg === "--pipe" || arg === "-p");
+    if (pipeIndex !== -1 && process.argv[pipeIndex + 1]) {
+        return process.argv[pipeIndex + 1];
+    }
+    return null;
+}
+const pipeCommand = getPipeCommand();
+// Execute a command with text piped to stdin
+function pipeToCommand(text, command) {
+    return new Promise((resolve, reject) => {
+        const child = spawn(command, [], {
+            shell: true,
+            stdio: ["pipe", "inherit", "inherit"],
+        });
+        child.on("error", (err) => {
+            reject(new Error(`Failed to execute pipe command: ${err.message}`));
+        });
+        child.on("close", (code) => {
+            if (code === 0) {
+                resolve();
+            }
+            else {
+                reject(new Error(`Pipe command exited with code ${code}`));
+            }
+        });
+        child.stdin.write(text);
+        child.stdin.end();
+    });
+}
 function status(message) {
     process.stdout.write(`\x1b[2K\r${formatStatus(message)}`);
 }
@@ -122,14 +163,14 @@ async function main() {
     if (!process.env.GROQ_API_KEY) {
         console.error(colors.error("Error: GROQ_API_KEY environment variable is not set"));
         console.log(colors.metadata("Get your API key at https://console.groq.com/keys"));
-        console.log(colors.metadata("Then run: export GROQ_API_KEY=\"your-api-key\""));
+        console.log(colors.metadata('Then run: export GROQ_API_KEY="your-api-key"'));
         process.exit(1);
     }
     // Check for provider-specific API key for post-processing
     if (provider === "anthropic" && !process.env.ANTHROPIC_API_KEY) {
         console.error(colors.error("Error: ANTHROPIC_API_KEY environment variable is not set"));
         console.log(colors.metadata("Get your API key at https://console.anthropic.com/settings/keys"));
-        console.log(colors.metadata("Then run: export ANTHROPIC_API_KEY=\"your-api-key\""));
+        console.log(colors.metadata('Then run: export ANTHROPIC_API_KEY="your-api-key"'));
         process.exit(1);
     }
     // Load custom prompt early to show in startup header
@@ -180,7 +221,10 @@ async function main() {
             // 6. Output and copy
             clearStatus();
             const processTime = ((Date.now() - processStart) / 1000).toFixed(1);
-            const wordCount = fixedText.trim().split(/\s+/).filter(w => w.length > 0).length;
+            const wordCount = fixedText
+                .trim()
+                .split(/\s+/)
+                .filter((w) => w.length > 0).length;
             const charCount = fixedText.length;
             // Calculate cost if usage info is available
             let costString;
@@ -192,7 +236,9 @@ async function main() {
             const termWidth = Math.min(process.stdout.columns || 60, 80);
             const lineWidth = termWidth - 2;
             const label = " TRANSCRIPT ";
-            console.log(colors.dim(BOX.topLeft + BOX.horizontal) + colors.header.bold(label) + colors.dim(BOX.horizontal.repeat(lineWidth - label.length - 1) + BOX.topRight));
+            console.log(colors.dim(BOX.topLeft + BOX.horizontal) +
+                colors.header.bold(label) +
+                colors.dim(BOX.horizontal.repeat(lineWidth - label.length - 1) + BOX.topRight));
             const lines = fixedText.split("\n");
             for (const line of lines) {
                 // Wrap long lines
@@ -200,31 +246,79 @@ async function main() {
                 while (remaining.length > 0) {
                     const chunk = remaining.slice(0, lineWidth - 2);
                     remaining = remaining.slice(lineWidth - 2);
-                    console.log(colors.dim(BOX.vertical + " ") + colors.white(chunk.padEnd(lineWidth - 2)) + colors.dim(" " + BOX.vertical));
+                    console.log(colors.dim(BOX.vertical + " ") +
+                        colors.white(chunk.padEnd(lineWidth - 2)) +
+                        colors.dim(" " + BOX.vertical));
                 }
                 if (line.length === 0) {
-                    console.log(colors.dim(BOX.vertical + " " + " ".repeat(lineWidth - 2) + " " + BOX.vertical));
+                    console.log(colors.dim(BOX.vertical +
+                        " " +
+                        " ".repeat(lineWidth - 2) +
+                        " " +
+                        BOX.vertical));
                 }
             }
             const stats = ` ${wordCount} words \u2022 ${charCount} chars `;
             const bottomLine = BOX.horizontal.repeat(lineWidth - stats.length - 1) + " ";
-            console.log(colors.dim(BOX.bottomLeft + bottomLine) + colors.metadata(stats) + colors.dim(BOX.bottomRight));
-            await copyToClipboard(fixedText);
+            console.log(colors.dim(BOX.bottomLeft + bottomLine) +
+                colors.metadata(stats) +
+                colors.dim(BOX.bottomRight));
             console.log(formatCompactStats({
                 audioDuration: formatDuration(recording.durationSeconds),
                 processingTime: processTime + "s",
                 cost: costString,
             }));
-            console.log(colors.success("\u2713") + colors.metadata(" Copied to clipboard"));
-            // 7. Clean up
+            // Either pipe to command or copy to clipboard
+            if (pipeCommand) {
+                try {
+                    await pipeToCommand(fixedText, pipeCommand);
+                    console.log(colors.success("\u2713") +
+                        colors.metadata(` Piped to: ${pipeCommand}`));
+                }
+                catch (err) {
+                    console.error(colors.error(`Pipe failed: ${err}`));
+                    // Fall back to clipboard
+                    await copyToClipboard(fixedText);
+                    console.log(colors.success("\u2713") +
+                        colors.metadata(" Copied to clipboard (pipe failed)"));
+                }
+            }
+            else {
+                await copyToClipboard(fixedText);
+                console.log(colors.success("\u2713") + colors.metadata(" Copied to clipboard"));
+            }
+            // 7. Save transcription if configured
+            if (settings.alwaysSaveTranscriptions) {
+                const filename = generateTimestampedFilename(".txt");
+                let savePath;
+                if (settings.saveTranscriptionsToCwd) {
+                    savePath = path.join(process.cwd(), filename);
+                }
+                else {
+                    fs.mkdirSync(TRANSCRIPTIONS_DIR, { recursive: true });
+                    savePath = path.join(TRANSCRIPTIONS_DIR, filename);
+                }
+                fs.writeFileSync(savePath, fixedText, "utf-8");
+                console.log(colors.success("\u2713") +
+                    colors.metadata(` Saved transcription to: ${savePath}`));
+            }
+            // 8. Save audio if configured
+            if (settings.alwaysSaveAudio) {
+                fs.mkdirSync(RECORDINGS_DIR, { recursive: true });
+                const audioFilename = generateTimestampedFilename(".mp3");
+                const audioSavePath = path.join(RECORDINGS_DIR, audioFilename);
+                fs.copyFileSync(mp3Path, audioSavePath);
+                console.log(colors.success("\u2713") +
+                    colors.metadata(` Saved audio to: ${audioSavePath}`));
+            }
+            // 9. Clean up
             fs.unlinkSync(mp3Path);
         }
         catch (error) {
             clearStatus();
-            // Save recording on failure
-            const backupDir = path.join(os.homedir(), ".whspr", "recordings");
-            fs.mkdirSync(backupDir, { recursive: true });
-            const backupPath = path.join(backupDir, `recording-${Date.now()}.mp3`);
+            // Save recording on failure (post-processing failed, save audio only)
+            fs.mkdirSync(RECORDINGS_DIR, { recursive: true });
+            const backupPath = path.join(RECORDINGS_DIR, `recording-${Date.now()}.mp3`);
             fs.renameSync(mp3Path, backupPath);
             console.error(colors.error(`Error: ${error}`));
             console.log(colors.info(`Recording saved to: ${backupPath}`));

package/dist/postprocess.js CHANGED Viewed

@@ -10,7 +10,8 @@ export async function postprocess(rawTranscription, customPrompt, options) {
             messages: [
                 {
                     role: "system",
-                    content: systemPrompt + "\n\nIMPORTANT: Output ONLY the corrected transcription text. Do not wrap it in JSON, markdown code blocks, or any other formatting. Just output the fixed text directly.",
+                    content: systemPrompt +
+                        "\n\nIMPORTANT: Output ONLY the corrected transcription text. Do not wrap it in JSON, markdown code blocks, or any other formatting. Just output the fixed text directly.",
                 },
                 {
                     role: "user",

package/dist/ui.js CHANGED Viewed

@@ -25,7 +25,9 @@ export function renderStartupHeader(config) {
     const termWidth = Math.min(process.stdout.columns || 60, 66);
     const innerWidth = termWidth - 4; // Account for "│  " and " │"
     const headerLabel = " WHSPR ";
-    const topLine = BOX.topLeft + BOX.horizontal + colors.header.bold(headerLabel) +
+    const topLine = BOX.topLeft +
+        BOX.horizontal +
+        colors.header.bold(headerLabel) +
         colors.dim(BOX.horizontal.repeat(termWidth - headerLabel.length - 3) + BOX.topRight);
     console.log(topLine);
     // Model line
@@ -33,7 +35,8 @@ export function renderStartupHeader(config) {
     const modelValue = config.model;
     const modelLine = `${modelLabel}${modelValue}`;
     console.log(colors.dim(BOX.vertical + "  ") +
-        colors.metadata(modelLabel) + colors.white(modelValue) +
+        colors.metadata(modelLabel) +
+        colors.white(modelValue) +
         " ".repeat(Math.max(0, innerWidth - modelLine.length)) +
         colors.dim(" " + BOX.vertical));
     // Vocab line (only show if sources exist)
@@ -42,7 +45,8 @@ export function renderStartupHeader(config) {
         const vocabValue = config.vocabSources.join(" + ");
         const vocabLine = `${vocabLabel}${vocabValue}`;
         console.log(colors.dim(BOX.vertical + "  ") +
-            colors.metadata(vocabLabel) + colors.info(vocabValue) +
+            colors.metadata(vocabLabel) +
+            colors.info(vocabValue) +
             " ".repeat(Math.max(0, innerWidth - vocabLine.length)) +
             colors.dim(" " + BOX.vertical));
     }
@@ -51,8 +55,10 @@ export function renderStartupHeader(config) {
     console.log(); // Empty line after header
 }
 export function formatCompactStats(stats) {
-    let result = colors.metadata("Audio: ") + colors.white(stats.audioDuration) +
-        colors.metadata(" \u2022 Processing: ") + colors.white(stats.processingTime);
+    let result = colors.metadata("Audio: ") +
+        colors.white(stats.audioDuration) +
+        colors.metadata(" \u2022 Processing: ") +
+        colors.white(stats.processingTime);
     if (stats.cost) {
         result += colors.metadata(" \u2022 Cost: ") + colors.white(stats.cost);
     }

package/dist/utils/pricing.js CHANGED Viewed

@@ -1,10 +1,10 @@
 export const MODEL_PRICING = {
     // Groq models
-    "openai/gpt-oss-120b": { input: 0.00, output: 0.00 }, // Free tier pricing
+    "openai/gpt-oss-120b": { input: 0.0, output: 0.0 }, // Free tier pricing
     // Anthropic models
-    "claude-sonnet-4-5": { input: 3.00, output: 15.00 },
-    "claude-haiku-4-5": { input: 0.80, output: 4.00 },
-    "claude-opus-4-5": { input: 15.00, output: 75.00 },
+    "claude-sonnet-4-5": { input: 3.0, output: 15.0 },
+    "claude-haiku-4-5": { input: 0.8, output: 4.0 },
+    "claude-opus-4-5": { input: 15.0, output: 75.0 },
 };
 export function calculateCost(modelName, usage) {
     const pricing = MODEL_PRICING[modelName];

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "whspr",
-  "version": "1.0.14",
+  "version": "1.0.15",
   "description": "CLI tool for audio transcription with Groq Whisper API",
   "type": "module",
   "bin": {