npm - whspr - Version diff - 1.0.6 → 1.0.10 - Mend

whspr 1.0.6 → 1.0.10

This diff shows the contents of publicly available package versions as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (8)

package/dist/index.d.ts CHANGED Viewed

@@ -2,6 +2,7 @@
 export declare const DEFAULTS: {
     transcriptionModel: "whisper-large-v3-turbo";
     language: string;
+    model: "groq:openai/gpt-oss-120b";
     systemPrompt: string;
     customPromptPrefix: string;
     transcriptionPrefix: string;
@@ -11,6 +12,7 @@ export interface WhsprSettings {
     suffix?: string;
     transcriptionModel?: "whisper-large-v3" | "whisper-large-v3-turbo";
     language?: string;
+    model?: string;
     systemPrompt?: string;
     customPromptPrefix?: string;
     transcriptionPrefix?: string;

package/dist/index.js CHANGED Viewed

@@ -11,18 +11,46 @@ import os from "os";
 export const DEFAULTS = {
     transcriptionModel: "whisper-large-v3-turbo",
     language: "en",
-    systemPrompt: 'Your task is to clean up/fix transcribed text generated from mic input by the user according to the user\'s own prompt, this prompt may contain custom vocabulary, instructions, etc. Please return the user\'s transcription with the fixes made (e.g. the AI might hear "PostgreSQL" as "post crest QL" you need to use your own reasoning to fix these mistakes in the transcription)',
+    model: "groq:openai/gpt-oss-120b",
+    systemPrompt: `Your task is to fix spelling errors and proper names in transcribed text.
+IMPORTANT: Only correct spelling mistakes and proper nouns (names, places, technical terms).
+Do NOT change wording, phrasing, or sentence structure.
+Do NOT rephrase or rewrite any part of the transcription.
+Preserve the original voice and speaking style exactly as transcribed.`,
     customPromptPrefix: "Here's my custom user prompt:",
     transcriptionPrefix: "Here's my raw transcription output that I need you to edit:",
 };
+// Default settings that will be written to settings.json
+const DEFAULT_SETTINGS = {
+    model: DEFAULTS.model,
+};
 const WHSPR_DIR = path.join(os.homedir(), ".whspr");
 const SETTINGS_PATH = path.join(WHSPR_DIR, "settings.json");
+function parseModelProvider(model) {
+    const colonIndex = model.indexOf(":");
+    if (colonIndex === -1) {
+        throw new Error(`Invalid model format: "${model}". Expected "provider:model-name" (e.g., "groq:openai/gpt-oss-120b")`);
+    }
+    const provider = model.slice(0, colonIndex);
+    const modelName = model.slice(colonIndex + 1);
+    if (provider !== "groq" && provider !== "anthropic") {
+        throw new Error(`Unknown provider: "${provider}". Supported providers: groq, anthropic`);
+    }
+    return { provider, modelName };
+}
 function loadSettings() {
     try {
-        if (fs.existsSync(SETTINGS_PATH)) {
-            const content = fs.readFileSync(SETTINGS_PATH, "utf-8");
-            return JSON.parse(content);
+        // Ensure ~/.whspr/ directory exists
+        if (!fs.existsSync(WHSPR_DIR)) {
+            fs.mkdirSync(WHSPR_DIR, { recursive: true });
         }
+        // Create settings.json with defaults if it doesn't exist
+        if (!fs.existsSync(SETTINGS_PATH)) {
+            fs.writeFileSync(SETTINGS_PATH, JSON.stringify(DEFAULT_SETTINGS, null, 2) + "\n", "utf-8");
+            return { ...DEFAULT_SETTINGS };
+        }
+        const content = fs.readFileSync(SETTINGS_PATH, "utf-8");
+        return JSON.parse(content);
     }
     catch (error) {
         // Silently ignore invalid settings file
@@ -85,13 +113,24 @@ function formatDuration(seconds) {
     return `${secs}s`;
 }
 async function main() {
-    // Check for API key before recording
+    // Parse model configuration
+    const modelConfig = settings.model ?? DEFAULTS.model;
+    const { provider, modelName } = parseModelProvider(modelConfig);
+    // Check for required API keys before recording
+    // Always need GROQ_API_KEY for Whisper transcription
     if (!process.env.GROQ_API_KEY) {
         console.error(chalk.red("Error: GROQ_API_KEY environment variable is not set"));
         console.log(chalk.gray("Get your API key at https://console.groq.com/keys"));
         console.log(chalk.gray("Then run: export GROQ_API_KEY=\"your-api-key\""));
         process.exit(1);
     }
+    // Check for provider-specific API key for post-processing
+    if (provider === "anthropic" && !process.env.ANTHROPIC_API_KEY) {
+        console.error(chalk.red("Error: ANTHROPIC_API_KEY environment variable is not set"));
+        console.log(chalk.gray("Get your API key at https://console.anthropic.com/settings/keys"));
+        console.log(chalk.gray("Then run: export ANTHROPIC_API_KEY=\"your-api-key\""));
+        process.exit(1);
+    }
     try {
         // 1. Record audio
         const recording = await record(verbose);
@@ -115,6 +154,8 @@ async function main() {
             // 5. Post-process
             status("Post-processing...");
             let fixedText = await postprocess(rawText, customPrompt, {
+                provider,
+                modelName,
                 systemPrompt: settings.systemPrompt ?? DEFAULTS.systemPrompt,
                 customPromptPrefix: settings.customPromptPrefix ?? DEFAULTS.customPromptPrefix,
                 transcriptionPrefix: settings.transcriptionPrefix ?? DEFAULTS.transcriptionPrefix,

package/dist/postprocess.d.ts CHANGED Viewed

@@ -1,4 +1,7 @@
+import { ProviderType } from "./utils/providers.js";
 export interface PostprocessOptions {
+    provider: ProviderType;
+    modelName: string;
     systemPrompt: string;
     customPromptPrefix: string;
     transcriptionPrefix: string;

package/dist/postprocess.js CHANGED Viewed

@@ -1,17 +1,19 @@
-import { generateObject } from "ai";
+import { generateText, Output } from "ai";
 import { z } from "zod";
 import { withRetry } from "./utils/retry.js";
-import { groq } from "./utils/groq.js";
-const MODEL = "openai/gpt-oss-120b";
+import { getProvider } from "./utils/providers.js";
 const outputSchema = z.object({
     fixed_transcription: z.string(),
 });
 export async function postprocess(rawTranscription, customPrompt, options) {
-    const { systemPrompt, customPromptPrefix, transcriptionPrefix } = options;
+    const { provider, modelName, systemPrompt, customPromptPrefix, transcriptionPrefix, } = options;
+    const providerInstance = getProvider(provider);
     const result = await withRetry(async () => {
-        const response = await generateObject({
-            model: groq(MODEL),
-            schema: outputSchema,
+        const response = await generateText({
+            model: providerInstance(modelName),
+            output: Output.object({
+                schema: outputSchema,
+            }),
             messages: [
                 {
                     role: "system",
@@ -31,7 +33,7 @@ export async function postprocess(rawTranscription, customPrompt, options) {
                 },
             ],
         });
-        return response.object;
+        return response.output;
     }, 3, "postprocess");
     return result.fixed_transcription;
 }

package/dist/recorder.js CHANGED Viewed

@@ -32,7 +32,7 @@ export async function record(verbose = false) {
     return new Promise((resolve, reject) => {
         // Initialize waveform buffer
         let waveWidth = getWaveWidth();
-        const waveBuffer = new Array(waveWidth).fill(" ");
+        const waveBuffer = new Array(waveWidth).fill(WAVE_CHARS[0]);
         let currentDb = -60;
         let cancelled = false;
         // Spawn FFmpeg with ebur128 filter to get volume levels

package/dist/utils/providers.d.ts ADDED Viewed

@@ -0,0 +1,4 @@
+export declare const groq: import("@ai-sdk/groq").GroqProvider;
+export declare const anthropic: import("@ai-sdk/anthropic").AnthropicProvider;
+export type ProviderType = "groq" | "anthropic";
+export declare function getProvider(provider: ProviderType): import("@ai-sdk/groq").GroqProvider | import("@ai-sdk/anthropic").AnthropicProvider;

package/dist/utils/providers.js ADDED Viewed

@@ -0,0 +1,14 @@
+import { createGroq } from "@ai-sdk/groq";
+import { createAnthropic } from "@ai-sdk/anthropic";
+export const groq = createGroq();
+export const anthropic = createAnthropic();
+export function getProvider(provider) {
+    switch (provider) {
+        case "groq":
+            return groq;
+        case "anthropic":
+            return anthropic;
+        default:
+            throw new Error(`Unknown provider: ${provider}`);
+    }
+}

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "whspr",
-  "version": "1.0.6",
+  "version": "1.0.10",
   "description": "CLI tool for audio transcription with Groq Whisper API",
   "type": "module",
   "bin": {
@@ -29,8 +29,9 @@
     "prepublishOnly": "npm run build"
   },
   "dependencies": {
-    "@ai-sdk/groq": "^1.x",
-    "ai": "^4.x",
+    "@ai-sdk/anthropic": "^3.0.15",
+    "@ai-sdk/groq": "^3.0.11",
+    "ai": "^6.0.41",
     "chalk": "^5.x",
     "clipboardy": "^4.x",
     "groq-sdk": "^0.x",