npm - agentvibes - Versions diffs - 4.5.7 → 4.6.2 - Mend

agentvibes 4.5.7 → 4.6.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (22) hide show

package/.claude/config/audio-effects.cfg +1 -1
package/.claude/config/tts-pretext.txt +1 -0
package/.claude/hooks/audio-processor.sh +1 -1
package/.claude/hooks/bmad-party-speak.sh +175 -0
package/.claude/hooks-windows/bmad-party-speak.ps1 +207 -0
package/.claude/hooks-windows/bmad-speak.ps1 +32 -7
package/.claude/hooks-windows/play-tts-piper.ps1 +43 -6
package/.claude/hooks-windows/play-tts.ps1 +57 -30
package/.mcp.json +7 -0
package/README.md +64 -2
package/RELEASE_NOTES.md +42 -0
package/bin/agent-vibes +1 -1
package/bin/agentvibes-voice-browser.js +1 -1
package/bin/mcp-server.js +1 -1
package/bin/test-bmad-pr +1 -1
package/package.json +110 -110
package/src/console/tabs/agents-tab.js +240 -34
package/src/console/tabs/install-tab.js +1 -0
package/src/console/tabs/voices-tab.js +38 -5
package/src/console/widgets/track-picker.js +50 -18
package/src/installer.js +97 -3
package/templates/agentvibes-receiver.sh +1 -1

package/.claude/config/audio-effects.cfg CHANGED Viewed

@@ -17,7 +17,7 @@ bmad-agent-tech-writer||agent_vibes_arabic_v2_loop.mp3|0.70
 # BMAD Agents - each with unique audio personality|||
 |||
 # PM John - upbeat, driving energy|||
-John|gain -1 equalizer 3000 1q +2|agentvibes_soft_flamenco_loop.mp3|0.30
+John|gain -1 equalizer 3000 1q +2|agentvibes_soft_flamenco_loop.mp3|0.20
 |||
 # Architect Winston - deep, authoritative|||
 Winston|reverb 40 50 90 gain -2|agentvibes_soft_flamenco_loop.mp3|0.25

package/.claude/config/tts-pretext.txt ADDED Viewed

@@ -0,0 +1 @@
+AgentVibes

package/.claude/hooks/audio-processor.sh CHANGED Viewed

@@ -310,7 +310,7 @@ mix_background() {
     fi
     ffmpeg -y -i "$voice" -ss "$start_pos" -stream_loop -1 -i "$background" \
-        -filter_complex "[1:a]volume=${volume},afade=t=in:st=0:d=0.3,afade=t=out:st=${bg_fade_out_adjusted}:d=2[bg];[0:a]adelay=${voice_delay_ms}|${voice_delay_ms}[v];[v][bg]amix=inputs=2:duration=longest[out]" \
+        -filter_complex "[1:a]volume=${volume},afade=t=in:st=0:d=0.3,afade=t=out:st=${bg_fade_out_adjusted}:d=2[bg];[0:a]adelay=${voice_delay_ms}|${voice_delay_ms},volume=1.5[v];[v][bg]amix=inputs=2:duration=longest:normalize=0[out]" \
         -map "[out]" $audio_settings -t "$total_duration" "$output" 2>/dev/null || {
         echo "Warning: Background mixing failed, using voice only" >&2
         cp "$voice" "$output"

package/.claude/hooks/bmad-party-speak.sh ADDED Viewed

@@ -0,0 +1,175 @@
+#!/usr/bin/env bash
+#
+# File: ~/.claude/hooks/bmad-party-speak.sh
+#
+# AgentVibes PostToolUse Hook - BMAD Party Mode TTS (Linux / macOS / WSL)
+#
+# Fires after every Agent tool call. Detects BMAD party mode agents by
+# fingerprinting the prompt, extracts the agent display name, maps it to
+# the canonical agent ID via the manifest, then calls bmad-speak.sh.
+# Speech is serialized across processes (no overlapping speech): flock when
+# it is installed, otherwise an atomic mkdir polling lock.
+#
+# Installed globally so it works in any BMAD project.
+# Uses CLAUDE_PROJECT_DIR env var to locate the project manifest at runtime.
+#
+# Input: JSON on stdin (Claude Code PostToolUse payload)
+# Exit:  0 when the payload is not a party-mode Agent call, cannot be parsed,
+#        or the speech queue wait times out (the timeout is logged to stderr).
+#
+set -euo pipefail
+SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
+LOCK_FILE="/tmp/agentvibes-party-queue.lock"
+# --- Read stdin ---
+raw="$(cat)"
+[[ -z "$raw" ]] && exit 0
+# --- Parse all needed fields in one python3 call ---
+# The parser source is held in a variable and run with `python3 -c` so that
+# python's stdin stays connected to the JSON payload. (`python3 - <<HEREDOC`
+# would make the heredoc python's stdin and silently drop the piped payload.)
+# Output: TOOL_NAME|DISPLAY_NAME|RESPONSE_TEXT on a single line.
+parse_script="$(cat <<'PYEOF'
+import sys, json, re
+try:
+    d = json.load(sys.stdin)
+except Exception:
+    print("|||")
+    sys.exit(0)
+tool_name = d.get('tool_name', '')
+prompt = d.get('tool_input', {}).get('prompt', '')
+# Extract display name with Python re (BSD grep on macOS has no -P)
+display_name = ''
+m = re.search(r'You are ([A-Za-z]+)\s*\(', prompt)
+if m:
+    display_name = m.group(1)
+# Extract response text: first content item of type "text"
+response_text = ''
+for item in d.get('tool_response', {}).get('content', []):
+    if item.get('type') == 'text':
+        response_text = item['text']
+        break
+# Strip leading icon + bold name header (e.g. "📊 **Mary:** " or garbled prefix)
+response_text = response_text.strip()
+response_text = re.sub(r'^\S*\s*\*\*[^:]+:\*\*\s*', '', response_text).strip()
+# Flatten to one line for TTS. Done here so a literal backslash-n inside the
+# agent's text is left untouched.
+response_text = response_text.replace('\n', ' ')
+print(f"{tool_name}|{display_name}|{response_text}")
+PYEOF
+)"
+# stderr is silenced inside the substitution; a missing or failing python3
+# leaves $parsed empty and the hook exits quietly.
+parsed="$(printf '%s' "$raw" | python3 -c "$parse_script" 2>/dev/null)" || true
+[[ -z "$parsed" ]] && exit 0
+# Split on the first two '|' only; the response text may itself contain '|'.
+tool_name="${parsed%%|*}"
+rest="${parsed#*|}"
+display_name="${rest%%|*}"
+response_text="${rest#*|}"
+# --- Only handle Agent tool ---
+[[ "$tool_name" != "Agent" ]] && exit 0
+# --- Fingerprint: only fire for BMAD party mode agents (safe string match, no pipe) ---
+[[ "$raw" == *"BMAD agent in a collaborative roundtable"* ]] || exit 0
+[[ -z "$display_name" ]] && exit 0
+[[ -z "$response_text" ]] && exit 0
+# --- Resolve project root ---
+project_root="${CLAUDE_PROJECT_DIR:-}"
+# --- Find bmad-speak.sh (prefer project-local, fall back to global) ---
+bmad_speak=""
+if [[ -n "$project_root" && -f "$project_root/.claude/hooks/bmad-speak.sh" ]]; then
+    bmad_speak="$project_root/.claude/hooks/bmad-speak.sh"
+elif [[ -f "$SCRIPT_DIR/bmad-speak.sh" ]]; then
+    bmad_speak="$SCRIPT_DIR/bmad-speak.sh"
+fi
+[[ -z "$bmad_speak" ]] && exit 0
+# --- Look up canonical agent ID from project manifest ---
+# Python's csv module is used so quoted fields containing commas parse correctly.
+# Here the heredoc is intentionally python's stdin: the inputs travel in argv.
+agent_id="$display_name"  # fallback when there is no manifest or no match
+if [[ -n "$project_root" && -f "$project_root/_bmad/_config/agent-manifest.csv" ]]; then
+    manifest="$project_root/_bmad/_config/agent-manifest.csv"
+    matched="$(python3 - "$manifest" "$display_name" 2>/dev/null <<'PYEOF'
+import sys, csv
+manifest_path, target = sys.argv[1], sys.argv[2].lower()
+try:
+    with open(manifest_path, newline='', encoding='utf-8') as f:
+        for row in csv.DictReader(f):
+            if row.get('displayName', '').lower() == target:
+                print(row.get('name', ''))
+                break
+except Exception:
+    pass
+PYEOF
+)" || true
+    [[ -n "$matched" ]] && agent_id="$matched"
+fi
+# --- Apply verbosity truncation ---
+verbosity="medium"
+# project_root is checked for emptiness so we never probe /.claude/...
+if [[ -n "$project_root" && -f "$project_root/.claude/tts-verbosity.txt" ]]; then
+    v="$(tr -d '[:space:]' < "$project_root/.claude/tts-verbosity.txt")"
+    [[ -n "$v" ]] && verbosity="$v"
+elif [[ -f "$HOME/.claude/tts-verbosity.txt" ]]; then
+    v="$(tr -d '[:space:]' < "$HOME/.claude/tts-verbosity.txt")"
+    [[ -n "$v" ]] && verbosity="$v"
+fi
+case "$verbosity" in
+    low)
+        # First sentence — fall back to full text if no punctuation
+        first="$(printf '%s' "$response_text" | python3 -c "
+import sys, re
+t = sys.stdin.read()
+m = re.match(r'^.*?[.!?]', t)
+print(m.group(0) if m else t)
+" 2>/dev/null || printf '%s' "$response_text")"
+        [[ -n "$first" ]] && response_text="$first"
+        ;;
+    medium)
+        # First 2 sentences — fall back to full text if no punctuation
+        two="$(printf '%s' "$response_text" | python3 -c "
+import sys, re
+t = sys.stdin.read()
+parts = re.findall(r'.*?[.!?]', t)
+print(' '.join(parts[:2]) if parts else t)
+" 2>/dev/null || printf '%s' "$response_text")"
+        [[ -n "$two" ]] && response_text="$two"
+        ;;
+    # high (or any other value) = full text
+esac
+[[ -z "$response_text" ]] && exit 0
+# --- Acquire queue lock, speak, release ---
+if command -v flock &>/dev/null; then
+    # The lock is tied to fd 9, so it goes away when this process exits.
+    exec 9>"$LOCK_FILE"
+    # Test flock explicitly: under `set -e` a bare timeout would abort the hook
+    # with a non-zero status and no message.
+    if ! flock -w 60 9; then
+        echo "[AgentVibes] Party mode TTS queue timeout for agent: $agent_id" >&2
+        exit 0
+    fi
+    "$bmad_speak" "$agent_id" "$response_text" || true
+    flock -u 9
+else
+    # macOS fallback: atomic mkdir polling lock
+    LOCK_DIR="/tmp/agentvibes-party-queue.lock.d"
+    # The EXIT trap is installed up front but only removes the directory once
+    # THIS process owns it. A waiter that times out or is terminated must not
+    # delete a lock that another process is still holding.
+    lock_held=0
+    trap 'if [[ "$lock_held" -eq 1 ]]; then rmdir "$LOCK_DIR" 2>/dev/null || true; fi' EXIT
+    WAITED=0  # number of 0.5 s polls; 120 polls = 60 s
+    while ! mkdir "$LOCK_DIR" 2>/dev/null; do
+        sleep 0.5
+        WAITED=$((WAITED + 1))
+        if [[ $WAITED -ge 120 ]]; then
+            echo "[AgentVibes] Party mode TTS queue timeout for agent: $agent_id" >&2
+            exit 0
+        fi
+    done
+    lock_held=1
+    "$bmad_speak" "$agent_id" "$response_text" || true
+    rmdir "$LOCK_DIR" 2>/dev/null || true
+    lock_held=0
+fi

package/.claude/hooks-windows/bmad-party-speak.ps1 ADDED Viewed

@@ -0,0 +1,207 @@
+#
+# File: ~/.claude/hooks-windows/bmad-party-speak.ps1
+#
+# AgentVibes PostToolUse Hook - BMAD Party Mode TTS
+#
+# Fires after every Agent tool call. Detects BMAD party mode agents by
+# fingerprinting the prompt, extracts the agent display name, maps it to
+# the canonical agent ID via the manifest, then calls bmad-speak.ps1.
+# Speech is serialized across processes with a named mutex; when Piper is
+# available the WAV is synthesized before the mutex is taken.
+#
+# Installed globally so it works in any BMAD project.
+# Uses $env:CLAUDE_PROJECT_DIR to locate the project manifest at runtime.
+#
+# Input: JSON on stdin (Claude Code PostToolUse payload)
+#
+# Resolve the real Piper speaker index for the speaker part of a
+# "voice::SpeakerName" entry. Returns the index as a string, or $null.
+# The trailing number in a speaker name (e.g. "Holly-7") is a disambiguation
+# suffix, NOT the speaker index, so the index is looked up the same way
+# play-tts-piper.ps1 does: voice-assignments.json first, then the
+# speaker_id_map of the voice's .onnx.json.
+function Resolve-PiperSpeakerIndex {
+    param(
+        [string]$SpeakerName,
+        [string]$VoiceName,
+        [string]$VoicesDir,
+        [string]$HookDir
+    )
+    if (-not $SpeakerName) { return $null }
+    # Primary: voice-assignments.json (libritts_speakers keyed by speaker index).
+    # Project root is derived from the hook location: .claude/hooks-windows/ -> project root
+    $root = Split-Path -Parent (Split-Path -Parent $HookDir)
+    $assignmentsPath = Join-Path $root "voice-assignments.json"
+    if (-not (Test-Path $assignmentsPath)) {
+        $assignmentsPath = Join-Path $env:USERPROFILE "AgentVibes\voice-assignments.json"
+    }
+    if (Test-Path $assignmentsPath) {
+        try {
+            $vaData = Get-Content $assignmentsPath -Raw | ConvertFrom-Json
+            foreach ($prop in $vaData.libritts_speakers.PSObject.Properties) {
+                if ($prop.Value.voice_name -eq $SpeakerName) { return [string]$prop.Name }
+            }
+        } catch { }
+    }
+    # Fallback: speaker_id_map in the voice's .onnx.json
+    $onnxJsonPath = Join-Path $VoicesDir "$VoiceName.onnx.json"
+    if (Test-Path $onnxJsonPath) {
+        try {
+            $speakerIdMap = (Get-Content $onnxJsonPath -Raw | ConvertFrom-Json).speaker_id_map
+            if ($speakerIdMap -and $speakerIdMap.PSObject.Properties[$SpeakerName]) {
+                return [string]$speakerIdMap.PSObject.Properties[$SpeakerName].Value
+            }
+        } catch { }
+    }
+    return $null
+}
+try {
+    # --- Read stdin safely ---
+    $raw = [Console]::In.ReadToEnd()
+    if (-not $raw -or $raw.Trim() -eq "") { exit 0 }
+    $data = $raw | ConvertFrom-Json
+    if (-not $data) { exit 0 }
+    # --- Only handle Agent tool ---
+    if ($data.tool_name -ne "Agent") { exit 0 }
+    # --- Extract prompt ---
+    $prompt = $data.tool_input.prompt
+    if (-not $prompt) { exit 0 }
+    # --- Fingerprint: only fire for BMAD party mode agents ---
+    if ($prompt -notmatch "BMAD agent in a collaborative roundtable") { exit 0 }
+    # --- Extract display name from "You are {Name} (" ---
+    if ($prompt -notmatch "You are ([A-Za-z]+)\s*\(") { exit 0 }
+    $DisplayName = $Matches[1]
+    # --- Extract response text: first content item of type "text" ---
+    $content = $data.tool_response.content
+    if (-not $content -or $content.Count -eq 0) { exit 0 }
+    $ResponseText = ($content | Where-Object { $_.type -eq "text" } | Select-Object -First 1).text
+    if (-not $ResponseText) { exit 0 }
+    # Strip leading icon + bold name header e.g. "📊 **Mary:**" or garbled "≡ƒôè **Mary:**"
+    # Trim first so leading newlines don't defeat the ^ anchor
+    $ResponseText = $ResponseText.Trim()
+    $ResponseText = $ResponseText -replace '^\S*\s*\*\*[^:]+:\*\*\s*', ''
+    $ResponseText = $ResponseText.Trim()
+    if (-not $ResponseText) { exit 0 }
+    # --- Resolve paths ---
+    $ScriptDir = Split-Path -Parent $MyInvocation.MyCommand.Path
+    $ProjectRoot = $env:CLAUDE_PROJECT_DIR
+    # --- Find bmad-speak.ps1 (prefer project-local, fall back to global) ---
+    $BmadSpeak = $null
+    if ($ProjectRoot) {
+        $local = Join-Path $ProjectRoot ".claude\hooks-windows\bmad-speak.ps1"
+        if (Test-Path $local) { $BmadSpeak = $local }
+    }
+    if (-not $BmadSpeak) {
+        $global = Join-Path $ScriptDir "bmad-speak.ps1"
+        if (Test-Path $global) { $BmadSpeak = $global }
+    }
+    if (-not $BmadSpeak) { exit 0 }
+    # --- Look up canonical agent ID from project manifest (read as UTF-8) ---
+    $AgentId = $DisplayName  # fallback when there is no manifest or no match
+    if ($ProjectRoot) {
+        $ManifestFile = Join-Path $ProjectRoot "_bmad\_config\agent-manifest.csv"
+        if (Test-Path $ManifestFile) {
+            $rows = Import-Csv $ManifestFile -Encoding UTF8
+            foreach ($row in $rows) {
+                if ($row.displayName -ieq $DisplayName) {
+                    $AgentId = $row.name
+                    break
+                }
+            }
+        }
+    }
+    # --- Apply verbosity truncation ---
+    # Project-level setting wins over the per-user one; default is "medium".
+    $Verbosity = "medium"
+    $verbosityPaths = @(
+        (Join-Path $env:USERPROFILE ".claude\tts-verbosity.txt")
+    )
+    if ($ProjectRoot) {
+        $verbosityPaths = @((Join-Path $ProjectRoot ".claude\tts-verbosity.txt")) + $verbosityPaths
+    }
+    foreach ($p in $verbosityPaths) {
+        if (Test-Path $p) {
+            $v = (Get-Content $p -Raw -ErrorAction SilentlyContinue).Trim()
+            if ($v) { $Verbosity = $v; break }
+        }
+    }
+    switch ($Verbosity) {
+        "low" {
+            $sentences = [regex]::Split($ResponseText, '(?<=[.!?])\s+')
+            # Text without sentence-ending punctuation comes back as one element, i.e. unchanged
+            if ($sentences.Count -gt 0 -and $sentences[0]) { $ResponseText = $sentences[0] }
+        }
+        "medium" {
+            $sentences = [regex]::Split($ResponseText, '(?<=[.!?])\s+')
+            # Text without sentence-ending punctuation comes back as one element, i.e. unchanged
+            $truncated = ($sentences | Select-Object -First 2) -join " "
+            if ($truncated) { $ResponseText = $truncated }
+        }
+        # "high" (or any other value) = full text
+    }
+    # --- Pre-synthesize WAV before acquiring mutex so synthesis overlaps with previous agent's playback ---
+    # NOTE(review): bmad-speak.ps1 prepends the agent pretext to the dialogue, but the
+    # audio synthesized here contains only $ResponseText — confirm whether the pretext
+    # is meant to be spoken in party mode.
+    $PreSynthWav = $null
+    $presynthCandidate = $null
+    try {
+        # Resolve agent voice from voice map (project-local first, then per-user)
+        $VoiceMapLocal  = if ($ProjectRoot) { Join-Path $ProjectRoot ".agentvibes\bmad-voice-map.json" } else { $null }
+        $VoiceMapGlobal = Join-Path $env:USERPROFILE ".agentvibes\bmad-voice-map.json"
+        $VoiceMapFile   = $null
+        if ($VoiceMapLocal -and (Test-Path $VoiceMapLocal)) {
+            $VoiceMapFile = $VoiceMapLocal
+        } elseif (Test-Path $VoiceMapGlobal) {
+            $VoiceMapFile = $VoiceMapGlobal
+        }
+        $AgentVoiceName = $null
+        $SpeakerName    = $null
+        if ($VoiceMapFile) {
+            $vm = Get-Content $VoiceMapFile -Raw | ConvertFrom-Json
+            # Local names avoid clobbering the stdin payload ($raw) and the
+            # automatic $PROFILE variable.
+            $agentProfile = $vm.agents.$AgentId
+            if ($agentProfile -and $agentProfile.voice) {
+                $voiceSpec = $agentProfile.voice
+                if ($voiceSpec -match '::') {
+                    # "model::SpeakerName" — multi-speaker syntax
+                    $parts = $voiceSpec -split '::'
+                    $AgentVoiceName = $parts[0]
+                    if ($parts.Length -ge 2) { $SpeakerName = $parts[1] }
+                } else {
+                    $AgentVoiceName = $voiceSpec
+                }
+            }
+        }
+        # Locate piper
+        $PiperExe = "$env:LOCALAPPDATA\Programs\Piper\piper.exe"
+        if (-not (Test-Path $PiperExe)) {
+            $found = Get-Command piper.exe -ErrorAction SilentlyContinue
+            if ($found) { $PiperExe = $found.Source }
+        }
+        if (Test-Path $PiperExe) {
+            $VoicesDir = "$env:USERPROFILE\.claude\piper-voices"
+            # Fall back to first available voice if agent voice not found
+            if (-not $AgentVoiceName) {
+                $first = Get-ChildItem $VoicesDir -Filter "*.onnx" -ErrorAction SilentlyContinue | Select-Object -First 1
+                if ($first) { $AgentVoiceName = $first.BaseName }
+            }
+            # The voice name becomes part of a file path, so restrict its characters
+            if ($AgentVoiceName -and ($AgentVoiceName -match '^[a-zA-Z0-9_\-\.]+$')) {
+                $VoiceModel = Join-Path $VoicesDir "$AgentVoiceName.onnx"
+                if (Test-Path $VoiceModel) {
+                    $AudioDir = "$env:USERPROFILE\.claude\audio"
+                    if (-not (Test-Path $AudioDir)) { New-Item -ItemType Directory -Path $AudioDir -Force | Out-Null }
+                    $presynthCandidate = Join-Path $AudioDir "tts-presynth-$([System.IO.Path]::GetRandomFileName() -replace '\..*').wav"
+                    $piperArgs = @("--model", $VoiceModel, "--output-file", $presynthCandidate)
+                    $SpeakerId = Resolve-PiperSpeakerIndex $SpeakerName $AgentVoiceName $VoicesDir $ScriptDir
+                    if ($SpeakerId -and ($SpeakerId -match '^\d+$')) { $piperArgs += @("--speaker", $SpeakerId) }
+                    $ResponseText | & $PiperExe @piperArgs 2>$null
+                    if ((Test-Path $presynthCandidate) -and (Get-Item $presynthCandidate).Length -gt 0) {
+                        $PreSynthWav = $presynthCandidate
+                    } else {
+                        # Do not leave an empty tts-*.wav behind in the audio directory
+                        Remove-Item $presynthCandidate -Force -ErrorAction SilentlyContinue
+                    }
+                }
+            }
+        }
+    } catch {
+        # degrade gracefully — will synthesize inside mutex instead
+        $PreSynthWav = $null
+        if ($presynthCandidate -and (Test-Path $presynthCandidate)) {
+            Remove-Item $presynthCandidate -Force -ErrorAction SilentlyContinue
+        }
+    }
+    # --- Speak with queue serialization (named mutex, cross-process) ---
+    $mutex = $null
+    try {
+        $mutex = New-Object System.Threading.Mutex($false, "AgentVibesPartyModeTTSQueue")
+        $acquired = $false
+        try {
+            # WaitOne throws AbandonedMutexException if prior process crashed while holding it.
+            # That exception means we DID acquire the mutex — treat it as success.
+            $acquired = $mutex.WaitOne(60000)
+        } catch [System.Threading.AbandonedMutexException] {
+            $acquired = $true  # abandoned = we now own it
+        }
+        if ($acquired) {
+            try {
+                # Pass pre-synthesized WAV path so play-tts.ps1 skips synthesis (reduces gap between agents)
+                if ($PreSynthWav) { $env:AGENTVIBES_PRESYNTHESIZED_WAV = $PreSynthWav }
+                # Pass positional args directly after -File (spaces handled by quoting via array)
+                & powershell -NoProfile -ExecutionPolicy Bypass -File $BmadSpeak $AgentId $ResponseText
+            } finally {
+                $env:AGENTVIBES_PRESYNTHESIZED_WAV = ""
+                $mutex.ReleaseMutex()
+            }
+        } else {
+            # Timed out — log to stderr so it's visible in hook error output
+            [Console]::Error.WriteLine("[AgentVibes] Party mode TTS queue timeout for agent: $AgentId")
+        }
+    } finally {
+        if ($mutex) { $mutex.Close() }
+        # Remove the pre-synthesized WAV on every path, including queue timeout,
+        # so a stale tts-presynth-*.wav is never left in the audio directory.
+        if ($PreSynthWav -and (Test-Path $PreSynthWav)) {
+            Remove-Item $PreSynthWav -Force -ErrorAction SilentlyContinue
+        }
+    }
+} catch {
+    # Silently exit — never block Claude
+    exit 0
+}

package/.claude/hooks-windows/bmad-speak.ps1 CHANGED Viewed

@@ -50,6 +50,7 @@ $VoiceMapGlobal = Join-Path $env:USERPROFILE ".agentvibes\bmad-voice-map.json"
 $VoiceMapFile   = if (Test-Path $VoiceMapLocal) { $VoiceMapLocal } else { $VoiceMapGlobal }
 $AgentVoice     = ""
+$AgentPretext   = ""
 $AgentPersonality = ""
 $AgentBgEnabled = $false
 $AgentBgTrack   = ""
@@ -72,24 +73,35 @@ if (Test-Path $_BgVolFile) {
     $AgentBgVolume = "0.20"
 }
-if (Test-Path $VoiceMapFile) {
-    try {
-        $VoiceMap = Get-Content $VoiceMapFile -Raw | ConvertFrom-Json
+# Resolve agent ID and display name/title from manifest (needed for default pretext)
+$AgentDisplayName = ""
+$AgentTitle       = ""
-        # Resolve agent ID: match canonical ID or display name prefix
+if (Test-Path $ManifestFile) {
+    try {
         $ManifestRows = Import-Csv $ManifestFile -Encoding UTF8
         foreach ($row in $ManifestRows) {
             $id      = ($row.PSObject.Properties | Select-Object -First 1).Value -replace '^"|"$', ''
             $display = ($row.PSObject.Properties | Select-Object -Skip 1 -First 1).Value -replace '^"|"$', ''
+            $title   = ($row.PSObject.Properties | Select-Object -Skip 2 -First 1).Value -replace '^"|"$', ''
             if ($id -ieq $AgentNameOrId -or $display -like "$AgentNameOrId*") {
-                $AgentId = $id
+                $AgentId          = $id
+                $AgentDisplayName = $display
+                $AgentTitle       = $title
                 break
             }
         }
+    } catch { }
+}
+if (Test-Path $VoiceMapFile) {
+    try {
+        $VoiceMap = Get-Content $VoiceMapFile -Raw | ConvertFrom-Json
         if ($AgentId -and $VoiceMap.agents.$AgentId) {
             $Profile = $VoiceMap.agents.$AgentId
             if ($Profile.voice)       { $AgentVoice       = $Profile.voice }
+            if ($Profile.pretext)     { $AgentPretext     = $Profile.pretext }
             if ($Profile.personality) { $AgentPersonality = $Profile.personality }
             if ($Profile.backgroundMusic) {
                 $AgentBgEnabled = [bool]$Profile.backgroundMusic.enabled
@@ -105,6 +117,16 @@ if (Test-Path $VoiceMapFile) {
     }
 }
+# Fall back to default pretext if none stored: "DisplayName, Title here."
+# Matches AgentVoiceStore.getDefaultPretext() in agent-voice-store.js
+if (-not $AgentPretext -and $AgentDisplayName) {
+    if ($AgentTitle) {
+        $AgentPretext = "$AgentDisplayName, $AgentTitle here."
+    } else {
+        $AgentPretext = "$AgentDisplayName here."
+    }
+}
 # ---------------------------------------------------------------------------
 # Locate play-tts.ps1 — prefer project-local, fall back to global
 $PlayTtsLocal  = Join-Path $ProjectRoot ".claude\hooks-windows\play-tts.ps1"
@@ -163,11 +185,14 @@ if ($AgentBgEnabled -and $AgentBgTrack) {
 }
 try {
+    # Prepend pretext if configured (e.g. "As your UX designer")
+    $SpeakText = if ($AgentPretext) { "$AgentPretext. $Dialogue" } else { $Dialogue }
     # Speak with agent's voice (or global voice if none configured)
     if ($AgentVoice) {
-        & powershell -NoProfile -ExecutionPolicy Bypass -File $PlayTtsScript $Dialogue $AgentVoice
+        & powershell -NoProfile -ExecutionPolicy Bypass -File $PlayTtsScript $SpeakText $AgentVoice
     } else {
-        & powershell -NoProfile -ExecutionPolicy Bypass -File $PlayTtsScript $Dialogue
+        & powershell -NoProfile -ExecutionPolicy Bypass -File $PlayTtsScript $SpeakText
     }
 } finally {
     # Restore personality

package/.claude/hooks-windows/play-tts-piper.ps1 CHANGED Viewed

@@ -70,15 +70,52 @@ elseif (Test-Path $VoiceFile) {
     $VoiceName = (Get-Content $VoiceFile -Raw).Trim()
 }
-# Strip display name suffix (e.g. "en_US-libritts-high::Bella-9" -> "en_US-libritts-high")
-# and extract speaker ID if present (works for both override and file)
+# Strip display name suffix (e.g. "en_US-libritts-high::Holly-7" -> "en_US-libritts-high")
+# and resolve the real Piper speaker index.
+# IMPORTANT: The trailing number in a speaker name (e.g. "Holly-7") is a disambiguation
+# suffix, NOT the speaker index. Real index must be looked up from voice-assignments.json.
 if ($VoiceName -match '::') {
     $parts = $VoiceName -split '::'
     $VoiceName = $parts[0]
-    if ($parts.Length -ge 2 -and $parts[1] -match '-(\d+)$') {
-        $env:PIPER_SPEAKER = $Matches[1]
-    } else {
-        Remove-Item env:PIPER_SPEAKER -ErrorAction SilentlyContinue
+    $SpeakerName = if ($parts.Length -ge 2) { $parts[1] } else { "" }
+    Remove-Item env:PIPER_SPEAKER -ErrorAction SilentlyContinue
+    if ($SpeakerName) {
+        # Primary: look up in voice-assignments.json catalog (libritts_speakers keyed by speaker index)
+        # Derive project root from this script's location: .claude/hooks-windows/ -> project root
+        $PiperScriptRoot = Split-Path -Parent $MyInvocation.MyCommand.Path
+        $PiperProjectRoot = Split-Path -Parent (Split-Path -Parent $PiperScriptRoot)
+        $VoiceAssignmentsPath = Join-Path $PiperProjectRoot "voice-assignments.json"
+        # Fallback: global AgentVibes install if not found in project
+        if (-not (Test-Path $VoiceAssignmentsPath)) {
+            $VoiceAssignmentsPath = Join-Path $env:USERPROFILE "AgentVibes\voice-assignments.json"
+        }
+        $SpeakerResolved = $false
+        if (Test-Path $VoiceAssignmentsPath) {
+            try {
+                $vaData = Get-Content $VoiceAssignmentsPath -Raw | ConvertFrom-Json
+                foreach ($prop in $vaData.libritts_speakers.PSObject.Properties) {
+                    if ($prop.Value.voice_name -eq $SpeakerName) {
+                        $env:PIPER_SPEAKER = $prop.Name
+                        $SpeakerResolved = $true
+                        break
+                    }
+                }
+            } catch { }
+        }
+        # Fallback: check patched speaker_id_map in the .onnx.json
+        if (-not $SpeakerResolved) {
+            $OnnxJsonPath = "$VoicesDir\$VoiceName.onnx.json"
+            if (Test-Path $OnnxJsonPath) {
+                try {
+                    $onnxData = Get-Content $OnnxJsonPath -Raw | ConvertFrom-Json
+                    $speakerIdMap = $onnxData.speaker_id_map
+                    if ($speakerIdMap -and $speakerIdMap.PSObject.Properties[$SpeakerName]) {
+                        $env:PIPER_SPEAKER = [string]$speakerIdMap.PSObject.Properties[$SpeakerName].Value
+                    }
+                } catch { }
+            }
+        }
     }
 } else {
     # No multi-speaker syntax — clear any stale speaker env var

package/.claude/hooks-windows/play-tts.ps1 CHANGED Viewed

@@ -128,58 +128,85 @@ if ($BgEnabled -or $HasReverb) {
     }
 }
+# Check for pre-synthesized WAV (party mode optimization — synthesis done before mutex acquisition)
+$PreSynthWav = $env:AGENTVIBES_PRESYNTHESIZED_WAV
+$UsePreSynth = $PreSynthWav -and (Test-Path $PreSynthWav) -and
+    (Get-Item $PreSynthWav -ErrorAction SilentlyContinue).Length -gt 0
 # If background music or reverb enabled and ffmpeg available, tell provider to skip playback
 if (($BgEnabled -or $HasReverb) -and $HasFfmpeg) {
     $env:AGENTVIBES_NO_PLAY = "1"
 }
-# Call the provider script
+# Call the provider script (skip if using pre-synthesized audio)
 # When post-processing (reverb/music), capture output preserving InformationRecord colors.
 # Otherwise call directly so Write-Host colors pass through to the terminal.
 $NeedsPostProcess = ($BgEnabled -or $HasReverb) -and $HasFfmpeg
-try {
-    if ($NeedsPostProcess) {
-        if ($VoiceOverride) {
-            $providerOutput = & $ProviderScript $Text $VoiceOverride 6>&1 2>&1
-        } else {
-            $providerOutput = & $ProviderScript $Text 6>&1 2>&1
+if ($UsePreSynth) {
+    Write-Host "[SYNTH] Using pre-synthesized audio..." -ForegroundColor Cyan
+    # If no post-processing needed, play the pre-synth file directly and exit
+    if (-not $NeedsPostProcess) {
+        $player = $null
+        try {
+            $player = New-Object System.Media.SoundPlayer $PreSynthWav
+            $player.PlaySync()
+        } catch {
+            Write-Host "[WARNING] Pre-synth playback failed: $_" -ForegroundColor Yellow
+        } finally {
+            if ($player) { $player.Dispose() }
         }
-        # Re-emit preserving colors from InformationRecords (Write-Host output)
-        foreach ($item in $providerOutput) {
-            if ($item -is [System.Management.Automation.InformationRecord]) {
-                $msg = $item.MessageData
-                if ($msg -is [System.Management.Automation.HostInformationMessage]) {
-                    Write-Host $msg.Message -ForegroundColor $msg.ForegroundColor -NoNewline:$msg.NoNewLine
-                    if (-not $msg.NoNewLine) { Write-Host }
+        Remove-Item env:AGENTVIBES_NO_PLAY -ErrorAction SilentlyContinue
+        exit 0
+    }
+} else {
+    try {
+        if ($NeedsPostProcess) {
+            if ($VoiceOverride) {
+                $providerOutput = & $ProviderScript $Text $VoiceOverride 6>&1 2>&1
+            } else {
+                $providerOutput = & $ProviderScript $Text 6>&1 2>&1
+            }
+            # Re-emit preserving colors from InformationRecords (Write-Host output)
+            foreach ($item in $providerOutput) {
+                if ($item -is [System.Management.Automation.InformationRecord]) {
+                    $msg = $item.MessageData
+                    if ($msg -is [System.Management.Automation.HostInformationMessage]) {
+                        Write-Host $msg.Message -ForegroundColor $msg.ForegroundColor -NoNewline:$msg.NoNewLine
+                        if (-not $msg.NoNewLine) { Write-Host }
+                    } else {
+                        Write-Host "$item"
+                    }
                 } else {
                     Write-Host "$item"
                 }
-            } else {
-                Write-Host "$item"
             }
-        }
-    } else {
-        if ($VoiceOverride) {
-            & $ProviderScript $Text $VoiceOverride
         } else {
-            & $ProviderScript $Text
+            if ($VoiceOverride) {
+                & $ProviderScript $Text $VoiceOverride
+            } else {
+                & $ProviderScript $Text
+            }
         }
     }
-}
-catch {
-    Write-Host "[ERROR] TTS Error: $_" -ForegroundColor Red
-    Remove-Item env:AGENTVIBES_NO_PLAY -ErrorAction SilentlyContinue
-    exit 1
+    catch {
+        Write-Host "[ERROR] TTS Error: $_" -ForegroundColor Red
+        Remove-Item env:AGENTVIBES_NO_PLAY -ErrorAction SilentlyContinue
+        exit 1
+    }
 }
 # Apply reverb and/or mix with background music
 if (($BgEnabled -or $HasReverb) -and $HasFfmpeg) {
     Remove-Item env:AGENTVIBES_NO_PLAY -ErrorAction SilentlyContinue
-    # Find the most recent TTS wav file
+    # Find the WAV to post-process: use pre-synthesized file if available, else most recent
     $AudioDir = "$ClaudeDir\audio"
-    $RecentWav = Get-ChildItem -Path $AudioDir -Filter "tts-*.wav" -ErrorAction SilentlyContinue |
-        Sort-Object LastWriteTime -Descending | Select-Object -First 1
+    $RecentWav = if ($UsePreSynth) {
+        Get-Item $PreSynthWav -ErrorAction SilentlyContinue
+    } else {
+        Get-ChildItem -Path $AudioDir -Filter "tts-*.wav" -ErrorAction SilentlyContinue |
+            Sort-Object LastWriteTime -Descending | Select-Object -First 1
+    }
     if ($RecentWav -and $RecentWav.Length -gt 0) {
         $voicePath = $RecentWav.FullName
@@ -282,7 +309,7 @@ if (($BgEnabled -or $HasReverb) -and $HasFfmpeg) {
                     $fadeOutStart = $totalDuration - 2
                     # Filter: music fades in 0.5s, voice delayed 2s, music fades out last 2s
-                    $filter = "[0:a]volume=${BgVolume},afade=t=in:d=0.5,afade=t=out:st=${fadeOutStart}:d=2[bg];[1:a]adelay=2000|2000,apad=pad_dur=2[voice];[bg][voice]amix=inputs=2:duration=longest:dropout_transition=2[out]"
+                    $filter = "[0:a]volume=${BgVolume},afade=t=in:d=0.5,afade=t=out:st=${fadeOutStart}:d=2[bg];[1:a]adelay=1000|1000,volume=1.5,apad=pad_dur=2[voice];[bg][voice]amix=inputs=2:duration=longest:dropout_transition=2:normalize=0[out]"
                     # Run ffmpeg - use Start-Process to avoid stderr issues with $ErrorActionPreference
                     $ffmpegArgs = "-y -stream_loop -1 -i `"$BgTrackPath`" -i `"$voicePath`" -filter_complex `"$filter`" -map `"[out]`" -t $totalDuration `"$MixedFile`""