PyPI - npcsh - Versions diffs - 1.1.21__py3-none-any.whl → 1.1.23__py3-none-any.whl - Mend

npcsh 1.1.21py3-none-any.whl → 1.1.23py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (188) hide show

npcsh/npc_team/jinxs/modes/yap.jinx CHANGED Viewed

@@ -1,44 +1,40 @@
 jinx_name: yap
-description: Voice chat mode - speech-to-text input, text-to-speech output
+description: Voice chat TUI - speech-to-text input, text-to-speech output
+interactive: true
 inputs:
   - model: null
   - provider: null
   - tts_model: kokoro
   - voice: af_heart
   - files: null
+  - show_setup: false
 steps:
-  - name: yap_repl
+  - name: yap_tui
     engine: python
     code: |
-      import os
-      import sys
-      import time
-      import tempfile
-      import threading
-      import queue
+      import os, sys, tty, termios, time, tempfile, threading, queue
+      import select as _sel
       from termcolor import colored
-      # Audio imports with graceful fallback
+      # Audio imports
       try:
           import torch
           import pyaudio
           import wave
           import numpy as np
           from faster_whisper import WhisperModel
-          from gtts import gTTS
           from npcpy.data.audio import (
               FORMAT, CHANNELS, RATE, CHUNK,
               transcribe_recording, convert_mp3_to_wav
           )
+          from npcpy.gen.audio_gen import text_to_speech, get_available_engines, get_available_voices
           AUDIO_AVAILABLE = True
-      except ImportError as e:
+      except ImportError:
           AUDIO_AVAILABLE = False
-          print(colored(f"Audio dependencies not available: {e}", "yellow"))
-          print("Install with: pip install npcsh[audio]")
       from npcpy.llm_funcs import get_llm_response
-      from npcpy.npc_sysenv import get_system_message, render_markdown
+      from npcpy.npc_sysenv import get_system_message, render_markdown, get_locally_available_models
       from npcpy.data.load import load_file_contents
       from npcpy.data.text import rag_search
@@ -46,10 +42,10 @@ steps:
       team = context.get('team')
       messages = context.get('messages', [])
       files = context.get('files')
-      tts_model = context.get('tts_model', 'kokoro')
-      voice = context.get('voice', 'af_heart')
+      tts_model_name = context.get('tts_model', 'kokoro')
+      voice_name = context.get('voice') or None
+      show_setup = context.get('show_setup', False)
-      # Resolve npc if it's a string (npc name) rather than NPC object
       if isinstance(npc, str) and team:
           npc = team.get(npc) if hasattr(team, 'get') else None
       elif isinstance(npc, str):
@@ -57,53 +53,303 @@ steps:
       model = context.get('model') or (npc.model if npc and hasattr(npc, 'model') else None)
       provider = context.get('provider') or (npc.provider if npc and hasattr(npc, 'provider') else None)
+      npc_name = npc.name if npc else "yap"
-      print("""
-      ██╗   ██╗ █████╗ ██████╗
-      ╚██╗ ██╔╝██╔══██╗██╔══██╗
-       ╚████╔╝ ███████║██████╔╝
-        ╚██╔╝  ██╔══██║██╔═══╝
-         ██║   ██║  ██║██║
-         ╚═╝   ╚═╝  ╚═╝╚═╝
+      # ================================================================
+      #  Non-interactive fallback
+      # ================================================================
+      if not sys.stdin.isatty():
+          context['output'] = "Yap requires an interactive terminal."
+          context['messages'] = messages
+          exit()
-      Voice Chat Mode
-      """)
+      # ================================================================
+      #  Gather available options for setup/modal
+      # ================================================================
+      _all_engines = []
+      _engine_voices = {}
+      try:
+          _engines_info = get_available_engines()
+          for ename, einfo in _engines_info.items():
+              _all_engines.append(ename)
+              try:
+                  _engine_voices[ename] = [v['id'] if isinstance(v, dict) else str(v) for v in get_available_voices(ename)]
+              except Exception:
+                  _engine_voices[ename] = []
+      except Exception:
+          _all_engines = ['kokoro', 'qwen3', 'elevenlabs', 'openai', 'gemini', 'gtts']
+          _engine_voices = {e: [] for e in _all_engines}
-      npc_name = npc.name if npc else "yap"
-      print(f"Entering yap mode (NPC: {npc_name}). Type '/yq' to exit.")
+      if not _all_engines:
+          _all_engines = ['kokoro']
-      if not AUDIO_AVAILABLE:
-          print(colored("Audio not available. Falling back to text mode.", "yellow"))
+      _all_models = []
+      _all_providers = []
+      try:
+          _local = get_locally_available_models(os.getcwd())
+          _seen_models = set()
+          _seen_providers = set()
+          for entry in _local:
+              m = entry.get('model', '') if isinstance(entry, dict) else str(entry)
+              p = entry.get('provider', '') if isinstance(entry, dict) else ''
+              if m and m not in _seen_models:
+                  _all_models.append(m)
+                  _seen_models.add(m)
+              if p and p not in _seen_providers:
+                  _all_providers.append(p)
+                  _seen_providers.add(p)
+      except Exception:
+          pass
-      # Load files for RAG context
-      loaded_chunks = {}
-      if files:
-          if isinstance(files, str):
-              files = [f.strip() for f in files.split(',')]
-          for file_path in files:
-              file_path = os.path.expanduser(file_path)
-              if os.path.exists(file_path):
-                  try:
-                      chunks = load_file_contents(file_path)
-                      loaded_chunks[file_path] = chunks
-                      print(colored(f"Loaded: {file_path}", "green"))
-                  except Exception as e:
-                      print(colored(f"Error loading {file_path}: {e}", "red"))
+      if not _all_models:
+          _all_models = [model or 'gemma3:4b']
+      if not _all_providers:
+          _all_providers = [provider or 'ollama']
-      # System message for concise voice responses
-      sys_msg = get_system_message(npc) if npc else "You are a helpful assistant."
-      sys_msg += "\n\nProvide brief responses of 1-2 sentences unless asked for more detail. Keep responses clear and conversational for voice."
+      # Ensure current selections are in the lists
+      if tts_model_name not in _all_engines:
+          _all_engines.insert(0, tts_model_name)
+      if model and model not in _all_models:
+          _all_models.insert(0, model)
+      if provider and provider not in _all_providers:
+          _all_providers.insert(0, provider)
-      if not messages or messages[0].get("role") != "system":
-          messages.insert(0, {"role": "system", "content": sys_msg})
+      def _voices_for_engine(eng):
+          v = _engine_voices.get(eng, [])
+          if not v:
+              defaults = {'kokoro': ['af_heart'], 'qwen3': ['ryan'], 'elevenlabs': ['rachel'],
+                          'openai': ['alloy'], 'gemini': ['en-US-Standard-A'], 'gtts': ['en']}
+              v = defaults.get(eng, ['default'])
+          return v
+      # ================================================================
+      #  Setup screen
+      # ================================================================
+      def run_setup():
+          nonlocal tts_model_name, voice_name, model, provider
+          TURQ = '\033[38;2;64;224;208m'
+          PURPLE = '\033[38;2;180;130;255m'
+          ORANGE = '\033[38;2;255;165;0m'
+          GREEN = '\033[32m'
+          DIM = '\033[90m'
+          BOLD = '\033[1m'
+          REV = '\033[7m'
+          RST = '\033[0m'
+          def _sz():
+              try:
+                  s = os.get_terminal_size()
+                  return s.columns, s.lines
+              except:
+                  return 80, 24
+          # Setup state
+          fields = ['model', 'provider', 'engine', 'voice']
+          field_labels = {'model': 'LLM Model', 'provider': 'LLM Provider',
+                          'engine': 'TTS Engine', 'voice': 'Voice'}
+          model_idx = _all_models.index(model) if model in _all_models else 0
+          provider_idx = _all_providers.index(provider) if provider in _all_providers else 0
+          engine_idx = _all_engines.index(tts_model_name) if tts_model_name in _all_engines else 0
+          cur_voices = _voices_for_engine(_all_engines[engine_idx])
+          voice_idx = 0
+          if voice_name and voice_name in cur_voices:
+              voice_idx = cur_voices.index(voice_name)
+          field_options = {
+              'model': (_all_models, model_idx),
+              'provider': (_all_providers, provider_idx),
+              'engine': (_all_engines, engine_idx),
+              'voice': (cur_voices, voice_idx),
+          }
+          sel = 0  # 0-3 = fields, 4 = save default, 5 = dont show again
+          save_default = True
+          dont_show = False
+          total_rows = 6  # 4 fields + 2 checkboxes
+          def _get_val(f):
+              opts, idx = field_options[f]
+              return opts[idx] if opts else '?'
+          def _render_setup():
+              w, h = _sz()
+              box_w = min(50, w - 4)
+              box_h = 18
+              sx = max(1, (w - box_w) // 2)
+              sy = max(1, (h - box_h) // 2)
-      # Audio state
+              buf = ['\033[2J\033[H']
+              # Box border
+              buf.append(f'\033[{sy};{sx}H{PURPLE}{"─" * box_w}{RST}')
+              title = " YAP Voice Chat Setup "
+              tp = sx + (box_w - len(title)) // 2
+              buf.append(f'\033[{sy};{tp}H{BOLD}{PURPLE}{title}{RST}')
+              y = sy + 2
+              for i, f in enumerate(fields):
+                  opts, idx = field_options[f]
+                  val = opts[idx] if opts else '?'
+                  label = field_labels[f]
+                  lpad = sx + 2
+                  if i == sel:
+                      arrow_l = f'{TURQ}\u25c4{RST}'
+                      arrow_r = f'{TURQ}\u25ba{RST}'
+                      buf.append(f'\033[{y};{lpad}H{REV} {label}: {RST} {arrow_l} {BOLD}{val}{RST} {arrow_r}')
+                  else:
+                      buf.append(f'\033[{y};{lpad}H  {DIM}{label}:{RST} {val}')
+                  y += 2
+              # Separator
+              buf.append(f'\033[{y};{sx + 2}H{DIM}{"─" * (box_w - 4)}{RST}')
+              y += 1
+              # Checkboxes
+              ck_save = f'{GREEN}[x]{RST}' if save_default else '[ ]'
+              ck_dont = f'{GREEN}[x]{RST}' if dont_show else '[ ]'
+              if sel == 4:
+                  buf.append(f'\033[{y};{sx + 2}H{REV} {ck_save} Save as default {RST}')
+              else:
+                  buf.append(f'\033[{y};{sx + 2}H  {ck_save} Save as default')
+              y += 1
+              if sel == 5:
+                  buf.append(f'\033[{y};{sx + 2}H{REV} {ck_dont} Don\'t show again {RST}')
+              else:
+                  buf.append(f'\033[{y};{sx + 2}H  {ck_dont} Don\'t show again')
+              y += 2
+              # Hints
+              buf.append(f'\033[{y};{sx + 2}H{DIM}\u2191/\u2193:Navigate  \u2190/\u2192:Change  Space:Toggle  Enter:Start  Ctrl+Q:Quit{RST}')
+              y += 1
+              buf.append(f'\033[{y};{sx}H{PURPLE}{"─" * box_w}{RST}')
+              sys.stdout.write(''.join(buf))
+              sys.stdout.flush()
+          fd = sys.stdin.fileno()
+          old = termios.tcgetattr(fd)
+          try:
+              tty.setcbreak(fd)
+              sys.stdout.write('\033[?25l')
+              running = True
+              while running:
+                  _render_setup()
+                  if _sel.select([fd], [], [], 0.1)[0]:
+                      c = os.read(fd, 1).decode('latin-1')
+                      if c == '\x11' or c == '\x03':  # Ctrl+Q / Ctrl+C
+                          termios.tcsetattr(fd, termios.TCSADRAIN, old)
+                          sys.stdout.write('\033[?25h\033[2J\033[H')
+                          sys.stdout.flush()
+                          context['output'] = "Setup cancelled."
+                          context['messages'] = messages
+                          exit()
+                      elif c == '\x1b':  # Escape sequence
+                          if _sel.select([fd], [], [], 0.05)[0]:
+                              c2 = os.read(fd, 1).decode('latin-1')
+                              if c2 == '[':
+                                  c3 = os.read(fd, 1).decode('latin-1')
+                                  if c3 == 'A':  # Up
+                                      sel = max(0, sel - 1)
+                                  elif c3 == 'B':  # Down
+                                      sel = min(total_rows - 1, sel + 1)
+                                  elif c3 == 'D':  # Left
+                                      if sel < 4:
+                                          f = fields[sel]
+                                          opts, idx = field_options[f]
+                                          if opts:
+                                              new_idx = (idx - 1) % len(opts)
+                                              field_options[f] = (opts, new_idx)
+                                              if f == 'engine':
+                                                  nv = _voices_for_engine(opts[new_idx])
+                                                  field_options['voice'] = (nv, 0)
+                                  elif c3 == 'C':  # Right
+                                      if sel < 4:
+                                          f = fields[sel]
+                                          opts, idx = field_options[f]
+                                          if opts:
+                                              new_idx = (idx + 1) % len(opts)
+                                              field_options[f] = (opts, new_idx)
+                                              if f == 'engine':
+                                                  nv = _voices_for_engine(opts[new_idx])
+                                                  field_options['voice'] = (nv, 0)
+                      elif c == 'k':
+                          sel = max(0, sel - 1)
+                      elif c == 'j':
+                          sel = min(total_rows - 1, sel + 1)
+                      elif c == 'h':
+                          if sel < 4:
+                              f = fields[sel]
+                              opts, idx = field_options[f]
+                              if opts:
+                                  new_idx = (idx - 1) % len(opts)
+                                  field_options[f] = (opts, new_idx)
+                                  if f == 'engine':
+                                      nv = _voices_for_engine(opts[new_idx])
+                                      field_options['voice'] = (nv, 0)
+                      elif c == 'l':
+                          if sel < 4:
+                              f = fields[sel]
+                              opts, idx = field_options[f]
+                              if opts:
+                                  new_idx = (idx + 1) % len(opts)
+                                  field_options[f] = (opts, new_idx)
+                                  if f == 'engine':
+                                      nv = _voices_for_engine(opts[new_idx])
+                                      field_options['voice'] = (nv, 0)
+                      elif c == ' ':
+                          if sel == 4:
+                              save_default = not save_default
+                          elif sel == 5:
+                              dont_show = not dont_show
+                      elif c in ('\r', '\n'):
+                          running = False
+          finally:
+              termios.tcsetattr(fd, termios.TCSADRAIN, old)
+              sys.stdout.write('\033[?25h\033[2J\033[H')
+              sys.stdout.flush()
+          # Apply selections
+          model = _get_val('model')
+          provider = _get_val('provider')
+          tts_model_name = _get_val('engine')
+          voice_name = _get_val('voice')
+          # Persist if requested
+          if save_default or dont_show:
+              from npcsh.config import set_npcsh_config_value
+              if save_default:
+                  set_npcsh_config_value("NPCSH_TTS_ENGINE", tts_model_name)
+                  set_npcsh_config_value("NPCSH_TTS_VOICE", voice_name)
+                  set_npcsh_config_value("NPCSH_CHAT_MODEL", model)
+                  set_npcsh_config_value("NPCSH_CHAT_PROVIDER", provider)
+              if dont_show:
+                  set_npcsh_config_value("NPCSH_YAP_SETUP_DONE", "1")
+      if show_setup:
+          run_setup()
+      # Set default voice if still None
+      if not voice_name:
+          defaults = {'kokoro': 'af_heart', 'qwen3': 'ryan', 'elevenlabs': 'rachel',
+                      'openai': 'alloy', 'gemini': 'en-US-Standard-A', 'gtts': 'en'}
+          voice_name = defaults.get(tts_model_name, 'default')
+      # ================================================================
+      #  Audio models
+      # ================================================================
       vad_model = None
       whisper_model = None
       if AUDIO_AVAILABLE:
           try:
-              # Load VAD model for voice activity detection
               vad_model, _ = torch.hub.load(
                   repo_or_dir="snakers4/silero-vad",
                   model="silero_vad",
@@ -112,164 +358,833 @@ steps:
                   verbose=False
               )
               vad_model.to('cpu')
-              print(colored("VAD model loaded.", "green"))
-              # Load Whisper for STT
+          except Exception:
+              pass
+          try:
               whisper_model = WhisperModel("base", device="cpu", compute_type="int8")
-              print(colored("Whisper model loaded.", "green"))
-          except Exception as e:
-              print(colored(f"Error loading audio models: {e}", "red"))
+          except Exception:
               AUDIO_AVAILABLE = False
-      def speak_text(text, tts_model='kokoro', voice='af_heart'):
-          """Convert text to speech and play it"""
-          if not AUDIO_AVAILABLE:
-              return
+      # ================================================================
+      #  File loading for RAG
+      # ================================================================
+      loaded_chunks = {}
+      if files:
+          if isinstance(files, str):
+              files = [f.strip() for f in files.split(',')]
+          for fp in files:
+              fp = os.path.expanduser(fp)
+              if os.path.exists(fp):
+                  try:
+                      loaded_chunks[fp] = load_file_contents(fp)
+                  except Exception:
+                      pass
+      # System message
+      sys_msg = get_system_message(npc) if npc else "You are a helpful assistant."
+      sys_msg += "\n\nProvide brief responses of 1-2 sentences unless asked for more detail. Keep responses clear and conversational for voice."
+      if not messages or messages[0].get("role") != "system":
+          messages.insert(0, {"role": "system", "content": sys_msg})
+      # ================================================================
+      #  State
+      # ================================================================
+      class UI:
+          tab = 0           # 0=chat, 1=settings
+          TAB_NAMES = ['Chat', 'Settings']
+          # chat
+          chat_log = []     # [(role, text)]
+          chat_scroll = -1
+          input_buf = ""
+          thinking = False
+          spinner_frame = 0
+          recording = False
+          rec_seconds = 0.0
+          transcribing = False
+          speaking = False
+          # VAD listening
+          listening = AUDIO_AVAILABLE  # auto-listen by default
+          listen_stop = False          # signal to stop listener thread
+          # settings
+          set_sel = 0
+          tts_enabled = AUDIO_AVAILABLE
+          auto_speak = True
+          vad_threshold = 0.4     # speech probability threshold
+          silence_timeout = 1.5   # seconds of silence before cut
+          min_speech = 0.3        # minimum speech duration to process
+          editing = False
+          edit_buf = ""
+          edit_key = ""
+          # Modal state
+          modal_open = False
+          modal_sel = 0
+          modal_engine_idx = 0
+          modal_voice_idx = 0
+          modal_model_idx = 0
+          modal_provider_idx = 0
+          modal_save = False
+      ui = UI()
+      # Initialize modal indices to current selections
+      if tts_model_name in _all_engines:
+          ui.modal_engine_idx = _all_engines.index(tts_model_name)
+      if model and model in _all_models:
+          ui.modal_model_idx = _all_models.index(model)
+      if provider and provider in _all_providers:
+          ui.modal_provider_idx = _all_providers.index(provider)
+      cur_v = _voices_for_engine(tts_model_name)
+      if voice_name in cur_v:
+          ui.modal_voice_idx = cur_v.index(voice_name)
+      # ================================================================
+      #  Helpers
+      # ================================================================
+      def sz():
+          try:
+              s = os.get_terminal_size()
+              return s.columns, s.lines
+          except:
+              return 80, 24
+      TURQ = '\033[38;2;64;224;208m'
+      PURPLE = '\033[38;2;180;130;255m'
+      ORANGE = '\033[38;2;255;165;0m'
+      GREEN = '\033[32m'
+      DIM = '\033[90m'
+      BOLD = '\033[1m'
+      REV = '\033[7m'
+      RST = '\033[0m'
+      RED = '\033[31m'
+      SPINNERS = ['\u280b', '\u2819', '\u2839', '\u2838', '\u283c', '\u2834', '\u2826', '\u2827', '\u2807', '\u280f']
+      def wrap_text(text, width):
+          lines = []
+          for line in text.split('\n'):
+              while len(line) > width:
+                  lines.append(line[:width])
+                  line = line[width:]
+              lines.append(line)
+          return lines
+      # ================================================================
+      #  Audio functions
+      # ================================================================
+      def transcribe_audio(audio_path):
+          if not whisper_model or not audio_path:
+              return ""
           try:
-              # Use gTTS as fallback
-              tts = gTTS(text=text, lang='en')
-              with tempfile.NamedTemporaryFile(suffix='.mp3', delete=False) as f:
-                  tts.save(f.name)
-                  wav_path = convert_mp3_to_wav(f.name)
+              segments, _ = whisper_model.transcribe(audio_path, beam_size=5)
+              text = " ".join([seg.text for seg in segments]).strip()
+              try: os.remove(audio_path)
+              except: pass
+              return text
+          except Exception as e:
+              ui.chat_log.append(('error', f'Transcribe error: {e}'))
+              return ""
-              # Play audio
+      def speak_text(text):
+          if not AUDIO_AVAILABLE or not ui.tts_enabled:
+              return
+          try:
+              ui.speaking = True
               import subprocess
+              audio_bytes = text_to_speech(text, engine=tts_model_name, voice=voice_name)
+              # Determine file format from engine
+              if tts_model_name in ('elevenlabs', 'gtts'):
+                  suffix = '.mp3'
+              else:
+                  suffix = '.wav'
+              tmp = tempfile.NamedTemporaryFile(suffix=suffix, delete=False)
+              tmp_path = tmp.name
+              tmp.write(audio_bytes)
+              tmp.close()
+              # If mp3, convert to wav for playback
+              play_path = tmp_path
+              if suffix == '.mp3':
+                  wav_path = tmp_path.replace('.mp3', '.wav')
+                  convert_mp3_to_wav(tmp_path, wav_path)
+                  play_path = wav_path
               if sys.platform == 'darwin':
-                  subprocess.run(['afplay', wav_path], check=True)
+                  subprocess.run(['afplay', play_path], check=True, timeout=60)
               elif sys.platform == 'linux':
-                  subprocess.run(['aplay', wav_path], check=True)
-              else:
-                  # Windows
-                  import winsound
-                  winsound.PlaySound(wav_path, winsound.SND_FILENAME)
+                  subprocess.run(['aplay', play_path], check=True, timeout=60,
+                                 stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL)
-              for _p in [f.name, wav_path]:
-                  try:
-                      os.remove(_p)
-                  except:
-                      pass
+              for _p in set([tmp_path, play_path]):
+                  try: os.remove(_p)
+                  except: pass
           except Exception as e:
-              print(colored(f"TTS error: {e}", "red"))
+              ui.chat_log.append(('error', f'TTS error: {e}'))
+          finally:
+              ui.speaking = False
-      def record_audio(duration=5):
-          """Record audio from microphone"""
-          if not AUDIO_AVAILABLE:
-              return None
+      def save_frames_to_wav(frames, sample_width):
+          f = tempfile.NamedTemporaryFile(suffix='.wav', delete=False)
+          path = f.name
+          f.close()
+          wf = wave.open(path, 'wb')
+          wf.setnchannels(CHANNELS)
+          wf.setsampwidth(sample_width)
+          wf.setframerate(RATE)
+          wf.writeframes(b''.join(frames))
+          wf.close()
+          return path
+      # ================================================================
+      #  VAD continuous listener
+      # ================================================================
+      def vad_listener_loop():
+          """Background thread: continuously monitors mic, detects speech via
+          VAD, records until silence, then transcribes and sends."""
           try:
               p = pyaudio.PyAudio()
-              stream = p.open(format=FORMAT, channels=CHANNELS, rate=RATE, input=True, frames_per_buffer=CHUNK)
+              sw = p.get_sample_size(FORMAT)
+              stream = p.open(format=FORMAT, channels=CHANNELS, rate=RATE,
+                              input=True, frames_per_buffer=CHUNK)
+          except Exception as e:
+              ui.chat_log.append(('error', f'Mic open failed: {e}'))
+              ui.listening = False
+              return
+          chunk_dur = CHUNK / RATE  # duration of one chunk in seconds
+          while not ui.listen_stop:
+              # Skip if busy
+              if ui.thinking or ui.speaking or ui.transcribing:
+                  time.sleep(0.1)
+                  continue
+              if not ui.listening:
+                  time.sleep(0.1)
+                  continue
+              # Read a chunk and run VAD
+              try:
+                  data = stream.read(CHUNK, exception_on_overflow=False)
+              except Exception:
+                  time.sleep(0.05)
+                  continue
-              print(colored("Recording...", "cyan"), end='', flush=True)
-              frames = []
-              for _ in range(0, int(RATE / CHUNK * duration)):
-                  data = stream.read(CHUNK)
-                  frames.append(data)
-              print(colored(" Done.", "cyan"))
+              audio_np = np.frombuffer(data, dtype=np.int16).astype(np.float32) / 32768.0
+              if len(audio_np) != CHUNK:
+                  continue
+              try:
+                  tensor = torch.from_numpy(audio_np)
+                  prob = vad_model(tensor, RATE).item()
+              except Exception:
+                  continue
+              if prob < ui.vad_threshold:
+                  continue
+              # Speech detected — start collecting frames
+              ui.recording = True
+              ui.rec_seconds = 0.0
+              ui.chat_scroll = -1
+              speech_frames = [data]
+              speech_dur = chunk_dur
+              silence_dur = 0.0
+              while not ui.listen_stop:
+                  try:
+                      data = stream.read(CHUNK, exception_on_overflow=False)
+                  except Exception:
+                      break
+                  speech_frames.append(data)
+                  speech_dur += chunk_dur
+                  ui.rec_seconds = speech_dur
+                  audio_np = np.frombuffer(data, dtype=np.int16).astype(np.float32) / 32768.0
+                  try:
+                      tensor = torch.from_numpy(audio_np)
+                      prob = vad_model(tensor, RATE).item()
+                  except Exception:
+                      prob = 0.0
+                  if prob < ui.vad_threshold:
+                      silence_dur += chunk_dur
+                  else:
+                      silence_dur = 0.0
+                  if silence_dur >= ui.silence_timeout:
+                      break
+                  # Safety: max 60 seconds
+                  if speech_dur > 60.0:
+                      break
+              ui.recording = False
+              # Only process if enough speech
+              if speech_dur - silence_dur < ui.min_speech:
+                  continue
+              # Transcribe
+              ui.transcribing = True
+              audio_path = save_frames_to_wav(speech_frames, sw)
+              text = transcribe_audio(audio_path)
+              ui.transcribing = False
+              if text and text.strip():
+                  ui.chat_log.append(('info', f'Heard: "{text}"'))
+                  ui.chat_scroll = -1
+                  send_message(text)
+          # Cleanup
+          try:
               stream.stop_stream()
               stream.close()
               p.terminate()
+          except Exception:
+              pass
-              # Save to temp file
-              with tempfile.NamedTemporaryFile(suffix='.wav', delete=False) as f:
-                  wf = wave.open(f.name, 'wb')
-                  wf.setnchannels(CHANNELS)
-                  wf.setsampwidth(p.get_sample_size(FORMAT))
-                  wf.setframerate(RATE)
-                  wf.writeframes(b''.join(frames))
-                  wf.close()
-                  return f.name
-          except Exception as e:
-              print(colored(f"Recording error: {e}", "red"))
-              return None
+      # ================================================================
+      #  Chat send
+      # ================================================================
+      def send_message(text):
+          ui.chat_log.append(('user', text))
+          ui.thinking = True
+          ui.chat_scroll = -1
-      def transcribe_audio(audio_path):
-          """Transcribe audio to text using Whisper"""
-          if not whisper_model or not audio_path:
-              return ""
-          try:
-              segments, _ = whisper_model.transcribe(audio_path, beam_size=5)
-              text = " ".join([seg.text for seg in segments])
+          def worker():
               try:
-                  os.remove(audio_path)
-              except:
-                  pass
-              return text.strip()
-          except Exception as e:
-              print(colored(f"Transcription error: {e}", "red"))
-              return ""
+                  current_prompt = text
+                  if loaded_chunks:
+                      ctx_content = ""
+                      for fn, chunks in loaded_chunks.items():
+                          full = "\n".join(chunks)
+                          ret = rag_search(text, full, similarity_threshold=0.3)
+                          if ret:
+                              ctx_content += f"\n{ret}\n"
+                      if ctx_content:
+                          current_prompt += f"\n\nContext:{ctx_content}"
-      # REPL loop
-      while True:
-          try:
-              # Voice input or text input
-              if AUDIO_AVAILABLE:
-                  prompt_str = f"{npc_name}:yap> [Press Enter to speak, or type] "
+                  resp = get_llm_response(
+                      current_prompt, model=model, provider=provider,
+                      messages=messages, stream=False, npc=npc
+                  )
+                  messages[:] = resp.get('messages', messages)
+                  response_text = str(resp.get('response', ''))
+                  if response_text:
+                      ui.chat_log.append(('assistant', response_text))
+                      if ui.auto_speak and ui.tts_enabled:
+                          speak_text(response_text)
+              except Exception as e:
+                  ui.chat_log.append(('error', str(e)))
+              ui.thinking = False
+          threading.Thread(target=worker, daemon=True).start()
+      # ================================================================
+      #  Rendering
+      # ================================================================
+      def render():
+          w, h = sz()
+          buf = ['\033[H']
+          # Tab bar
+          tabs = ''
+          for i, name in enumerate(ui.TAB_NAMES):
+              if i == ui.tab:
+                  tabs += f' {REV}{BOLD} {name} {RST} '
               else:
-                  prompt_str = f"{npc_name}:yap> "
-              user_input = input(prompt_str).strip()
-              if user_input.lower() == "/yq":
-                  print("Exiting yap mode.")
-                  break
-              # Empty input = record audio
-              if not user_input and AUDIO_AVAILABLE:
-                  audio_path = record_audio(5)
-                  if audio_path:
-                      user_input = transcribe_audio(audio_path)
-                      if user_input:
-                          print(colored(f"You said: {user_input}", "cyan"))
-                      else:
-                          print(colored("Could not transcribe audio.", "yellow"))
-                          continue
+                  tabs += f' {DIM} {name} {RST} '
+          mic = ''
+          if ui.recording:
+              mic = f'{RED}\u25cf REC {ui.rec_seconds:.1f}s{RST}'
+          elif ui.transcribing:
+              mic = f'{ORANGE}\u25cf transcribing...{RST}'
+          elif ui.speaking:
+              mic = f'{GREEN}\u25cf speaking...{RST}'
+          elif ui.thinking:
+              sp = SPINNERS[ui.spinner_frame % len(SPINNERS)]
+              mic = f'{ORANGE}{sp} thinking...{RST}'
+          elif ui.listening:
+              mic = f'{TURQ}\u25cf listening{RST}'
+          audio_st = '\U0001f3a4' if ui.listening else ('\U0001f507' if not AUDIO_AVAILABLE else '\u23f8')
+          right = f'{npc_name} | {audio_st} | {model or "?"}@{provider or "?"}'
+          pad = w - 12 - len(right) - 20
+          header = f'{PURPLE}YAP{RST} {tabs}{" " * max(0, pad)}{mic}  {DIM}{right}{RST}'
+          buf.append(f'\033[1;1H{REV} {header[:w-2].ljust(w-2)} {RST}')
+          if ui.tab == 0:
+              render_chat(buf, w, h)
+          elif ui.tab == 1:
+              render_settings(buf, w, h)
+          # Draw modal on top if open
+          if ui.modal_open:
+              render_modal(buf, w, h)
+          sys.stdout.write(''.join(buf))
+          sys.stdout.flush()
+      def render_chat(buf, w, h):
+          input_h = 3
+          chat_h = h - 2 - input_h
+          all_lines = []
+          _asst_pw = len(npc_name) + 2  # "name: "
+          _cont_pw = _asst_pw  # continuation indent matches
+          for role, text in ui.chat_log:
+              if role == 'user':
+                  tw = w - 6
+                  wrapped = wrap_text(text, tw)
+                  for i, l in enumerate(wrapped):
+                      prefix = f'{BOLD}you:{RST} ' if i == 0 else '     '
+                      all_lines.append(f'{prefix}{l}')
+              elif role == 'assistant':
+                  tw = w - _asst_pw - 1
+                  wrapped = wrap_text(text, tw)
+                  pad = ' ' * _asst_pw
+                  for i, l in enumerate(wrapped):
+                      prefix = f'{PURPLE}{BOLD}{npc_name}:{RST} ' if i == 0 else pad
+                      all_lines.append(f'{prefix}{l}')
+              elif role == 'info':
+                  tw = w - 5
+                  wrapped = wrap_text(text, tw)
+                  for i, l in enumerate(wrapped):
+                      prefix = f'  {TURQ}\u2139 ' if i == 0 else '    '
+                      all_lines.append(f'{prefix}{l}{RST}' if i == 0 else f'    {l}')
+              elif role == 'error':
+                  tw = w - 5
+                  wrapped = wrap_text(text, tw)
+                  for i, l in enumerate(wrapped):
+                      prefix = f'  {RED}\u2717 ' if i == 0 else '    '
+                      all_lines.append(f'{prefix}{l}{RST}' if i == 0 else f'    {l}')
+          if ui.recording:
+              secs = ui.rec_seconds
+              all_lines.append(f'  {RED}\U0001f399 Recording... {secs:.1f}s{RST}')
+          elif ui.transcribing:
+              sp = SPINNERS[ui.spinner_frame % len(SPINNERS)]
+              all_lines.append(f'  {ORANGE}{sp} Transcribing...{RST}')
+          elif ui.thinking:
+              sp = SPINNERS[ui.spinner_frame % len(SPINNERS)]
+              all_lines.append(f'  {ORANGE}{sp} thinking...{RST}')
+          elif ui.speaking:
+              all_lines.append(f'  {GREEN}\U0001f50a Speaking...{RST}')
+          # Scrolling
+          if ui.chat_scroll == -1:
+              scroll = max(0, len(all_lines) - chat_h)
+          else:
+              scroll = ui.chat_scroll
+          for i in range(chat_h):
+              y = 2 + i
+              li = scroll + i
+              buf.append(f'\033[{y};1H\033[K')
+              if li < len(all_lines):
+                  buf.append(all_lines[li])
+          # Input area
+          div_y = 2 + chat_h
+          buf.append(f'\033[{div_y};1H\033[K{DIM}{"\u2500" * w}{RST}')
+          input_y = div_y + 1
+          visible = ui.input_buf[-(w-4):] if len(ui.input_buf) > w - 4 else ui.input_buf
+          buf.append(f'\033[{input_y};1H\033[K {BOLD}>{RST} {visible}\033[?25h')
+          # Status bar
+          if AUDIO_AVAILABLE:
+              ltog = 'Ctrl+L:Pause' if ui.listening else 'Ctrl+L:Listen'
+              hints = f'Enter:Send  {ltog}  Ctrl+S:Settings  Tab:Settings  Ctrl+Q:Quit'
+          else:
+              hints = 'Enter:Send  Ctrl+S:Settings  Tab:Settings  Ctrl+Q:Quit'
+          buf.append(f'\033[{h};1H\033[K{REV} {hints[:w-2].ljust(w-2)} {RST}')
+      def render_settings(buf, w, h):
+          settings = [
+              ('tts_enabled', 'TTS Enabled', 'On' if ui.tts_enabled else 'Off'),
+              ('auto_speak', 'Auto-Speak', 'On' if ui.auto_speak else 'Off'),
+              ('listening', 'Auto-Listen', 'On' if ui.listening else 'Off'),
+              ('silence_timeout', 'Silence Timeout', f'{ui.silence_timeout}s'),
+              ('vad_threshold', 'VAD Sensitivity', f'{ui.vad_threshold:.1f}'),
+          ]
+          buf.append(f'\033[3;3H{BOLD}Voice Settings{RST}')
+          buf.append(f'\033[4;3H{DIM}{"\u2500" * (w - 6)}{RST}')
+          y = 6
+          for i, (key, label, val) in enumerate(settings):
+              if ui.editing and ui.edit_key == key:
+                  buf.append(f'\033[{y};3H{ORANGE}{label}:{RST} {REV} {ui.edit_buf}_ {RST}')
+              elif i == ui.set_sel:
+                  buf.append(f'\033[{y};3H{REV} {label}: {val} {RST}')
+              else:
+                  buf.append(f'\033[{y};3H {BOLD}{label}:{RST} {val}')
+              y += 2
+          y += 1
+          buf.append(f'\033[{y};3H{DIM}TTS Engine: {tts_model_name}  Voice: {voice_name or "default"}{RST}')
+          y += 1
+          buf.append(f'\033[{y};3H{DIM}LLM: {model or "?"}@{provider or "?"}{RST}')
+          y += 1
+          buf.append(f'\033[{y};3H{DIM}Audio: {"Available" if AUDIO_AVAILABLE else "Not available"}{RST}')
+          y += 1
+          if loaded_chunks:
+              buf.append(f'\033[{y};3H{DIM}Files loaded: {len(loaded_chunks)}{RST}')
+          y += 1
+          buf.append(f'\033[{y};3H{DIM}Whisper: {"Loaded" if whisper_model else "Not loaded"}{RST}')
+          for cy in range(y + 1, h - 1):
+              buf.append(f'\033[{cy};1H\033[K')
+          if ui.editing:
+              buf.append(f'\033[{h};1H\033[K{REV} Enter:Save  Esc:Cancel {RST}')
+          else:
+              buf.append(f'\033[{h};1H\033[K{REV} j/k:Navigate  Space:Toggle  e:Edit  Ctrl+S:Quick Switch  Tab:Chat  Ctrl+Q:Quit {RST}')
+      # ================================================================
+      #  Modal rendering and handling
+      # ================================================================
+      def render_modal(buf, w, h):
+          box_w = min(48, w - 4)
+          box_h = 16
+          sx = max(1, (w - box_w) // 2)
+          sy = max(1, (h - box_h) // 2)
+          # Clear box area
+          for y in range(sy, sy + box_h):
+              buf.append(f'\033[{y};{sx}H{" " * box_w}')
+          # Border
+          buf.append(f'\033[{sy};{sx}H{PURPLE}\u250c{"\u2500" * (box_w - 2)}\u2510{RST}')
+          for y in range(sy + 1, sy + box_h - 1):
+              buf.append(f'\033[{y};{sx}H{PURPLE}\u2502{RST}{" " * (box_w - 2)}{PURPLE}\u2502{RST}')
+          buf.append(f'\033[{sy + box_h - 1};{sx}H{PURPLE}\u2514{"\u2500" * (box_w - 2)}\u2518{RST}')
+          # Title
+          title = " Quick Settings "
+          tp = sx + (box_w - len(title)) // 2
+          buf.append(f'\033[{sy};{tp}H{BOLD}{PURPLE}{title}{RST}')
+          lpad = sx + 3
+          y = sy + 2
+          modal_fields = [
+              ('LLM Model', _all_models, ui.modal_model_idx),
+              ('Provider', _all_providers, ui.modal_provider_idx),
+              ('TTS Engine', _all_engines, ui.modal_engine_idx),
+              ('Voice', _voices_for_engine(_all_engines[ui.modal_engine_idx]), ui.modal_voice_idx),
+          ]
+          for i, (label, opts, idx) in enumerate(modal_fields):
+              val = opts[idx] if idx < len(opts) else '?'
+              if i == ui.modal_sel:
+                  al = f'{TURQ}\u25c4{RST}'
+                  ar = f'{TURQ}\u25ba{RST}'
+                  buf.append(f'\033[{y};{lpad}H{REV} {label}: {RST} {al} {BOLD}{val}{RST} {ar}')
+              else:
+                  buf.append(f'\033[{y};{lpad}H  {DIM}{label}:{RST} {val}')
+              y += 2
+          # Save checkbox
+          ck = f'{GREEN}[x]{RST}' if ui.modal_save else '[ ]'
+          if ui.modal_sel == 4:
+              buf.append(f'\033[{y};{lpad}H{REV} {ck} Save as default {RST}')
+          else:
+              buf.append(f'\033[{y};{lpad}H  {ck} Save as default')
+          y += 2
+          # Hints
+          buf.append(f'\033[{y};{lpad}H{DIM}\u2191\u2193:Nav \u2190\u2192:Change Spc:Toggle Enter:Apply Esc:Cancel{RST}')
+      def open_modal():
+          ui.modal_open = True
+          ui.modal_sel = 0
+          ui.modal_save = False
+          # Sync indices to current values
+          if tts_model_name in _all_engines:
+              ui.modal_engine_idx = _all_engines.index(tts_model_name)
+          if model and model in _all_models:
+              ui.modal_model_idx = _all_models.index(model)
+          if provider and provider in _all_providers:
+              ui.modal_provider_idx = _all_providers.index(provider)
+          cur_v = _voices_for_engine(_all_engines[ui.modal_engine_idx])
+          if voice_name in cur_v:
+              ui.modal_voice_idx = cur_v.index(voice_name)
+          else:
+              ui.modal_voice_idx = 0
+      def apply_modal():
+          nonlocal tts_model_name, voice_name, model, provider
+          model = _all_models[ui.modal_model_idx] if ui.modal_model_idx < len(_all_models) else model
+          provider = _all_providers[ui.modal_provider_idx] if ui.modal_provider_idx < len(_all_providers) else provider
+          tts_model_name = _all_engines[ui.modal_engine_idx] if ui.modal_engine_idx < len(_all_engines) else tts_model_name
+          cur_v = _voices_for_engine(tts_model_name)
+          voice_name = cur_v[ui.modal_voice_idx] if ui.modal_voice_idx < len(cur_v) else voice_name
+          ui.chat_log.append(('info', f'Settings: {model}@{provider}, TTS: {tts_model_name}/{voice_name}'))
+          if ui.modal_save:
+              from npcsh.config import set_npcsh_config_value
+              set_npcsh_config_value("NPCSH_TTS_ENGINE", tts_model_name)
+              set_npcsh_config_value("NPCSH_TTS_VOICE", voice_name)
+              set_npcsh_config_value("NPCSH_CHAT_MODEL", model)
+              set_npcsh_config_value("NPCSH_CHAT_PROVIDER", provider)
+              ui.chat_log.append(('info', 'Saved as defaults.'))
+          ui.modal_open = False
+      def handle_modal_key(c, fd):
+          if c == '\x1b':  # Esc
+              if _sel.select([fd], [], [], 0.05)[0]:
+                  c2 = os.read(fd, 1).decode('latin-1')
+                  if c2 == '[':
+                      c3 = os.read(fd, 1).decode('latin-1')
+                      if c3 == 'A':  # Up
+                          ui.modal_sel = max(0, ui.modal_sel - 1)
+                      elif c3 == 'B':  # Down
+                          ui.modal_sel = min(4, ui.modal_sel + 1)
+                      elif c3 == 'D':  # Left
+                          _modal_cycle(-1)
+                      elif c3 == 'C':  # Right
+                          _modal_cycle(1)
+                      return True
+              # bare Esc = close
+              ui.modal_open = False
+              return True
+          if c == 'k':
+              ui.modal_sel = max(0, ui.modal_sel - 1)
+          elif c == 'j':
+              ui.modal_sel = min(4, ui.modal_sel + 1)
+          elif c == 'h':
+              _modal_cycle(-1)
+          elif c == 'l':
+              _modal_cycle(1)
+          elif c == ' ':
+              if ui.modal_sel == 4:
+                  ui.modal_save = not ui.modal_save
+          elif c in ('\r', '\n'):
+              apply_modal()
+          elif c == '\x11':  # Ctrl+Q in modal just closes it
+              ui.modal_open = False
+          return True
+      def _modal_cycle(direction):
+          if ui.modal_sel == 0:
+              ui.modal_model_idx = (ui.modal_model_idx + direction) % len(_all_models)
+          elif ui.modal_sel == 1:
+              ui.modal_provider_idx = (ui.modal_provider_idx + direction) % len(_all_providers)
+          elif ui.modal_sel == 2:
+              ui.modal_engine_idx = (ui.modal_engine_idx + direction) % len(_all_engines)
+              # Reset voice index when engine changes
+              ui.modal_voice_idx = 0
+          elif ui.modal_sel == 3:
+              cur_v = _voices_for_engine(_all_engines[ui.modal_engine_idx])
+              if cur_v:
+                  ui.modal_voice_idx = (ui.modal_voice_idx + direction) % len(cur_v)
+      # ================================================================
+      #  Input handling
+      # ================================================================
+      def handle_key(c, fd):
+          # Modal intercepts all keys
+          if ui.modal_open:
+              return handle_modal_key(c, fd)
+          if c == '\t':
+              if not ui.editing:
+                  ui.tab = (ui.tab + 1) % 2
+              return True
+          if c == '\x11':  # Ctrl+Q
+              return False
+          if c == '\x03':  # Ctrl+C
+              return True
+          if c == '\x13':  # Ctrl+S = open settings modal
+              open_modal()
+              return True
+          # Escape sequences
+          if c == '\x1b':
+              if _sel.select([fd], [], [], 0.05)[0]:
+                  c2 = os.read(fd, 1).decode('latin-1')
+                  if c2 == '[':
+                      c3 = os.read(fd, 1).decode('latin-1')
+                      if c3 == 'A':  # Up
+                          if ui.tab == 0: _chat_scroll_up()
+                          elif ui.tab == 1 and not ui.editing and ui.set_sel > 0: ui.set_sel -= 1
+                      elif c3 == 'B':  # Down
+                          if ui.tab == 0: _chat_scroll_down()
+                          elif ui.tab == 1 and not ui.editing and ui.set_sel < 4: ui.set_sel += 1
+                      elif c3 == '5':  # PgUp
+                          os.read(fd, 1)
+                          if ui.tab == 0: _chat_page_up()
+                      elif c3 == '6':  # PgDn
+                          os.read(fd, 1)
+                          if ui.tab == 0: _chat_page_down()
+                  elif c2 == 'O':
+                      c3 = os.read(fd, 1).decode('latin-1')
+                      if c3 == 'P': ui.tab = 0  # F1
+                      elif c3 == 'Q': ui.tab = 1  # F2
                   else:
-                      continue
+                      # bare Esc
+                      if ui.tab == 1 and ui.editing:
+                          ui.editing = False
+                          ui.edit_buf = ""
+              else:
+                  if ui.tab == 1 and ui.editing:
+                      ui.editing = False
+                      ui.edit_buf = ""
+              return True
-              if not user_input:
-                  continue
+          if ui.tab == 0:
+              return handle_chat(c, fd)
+          elif ui.tab == 1:
+              return handle_settings(c, fd)
+          return True
-              # Add RAG context if files loaded
-              current_prompt = user_input
-              if loaded_chunks:
-                  context_content = ""
-                  for filename, chunks in loaded_chunks.items():
-                      full_text = "\n".join(chunks)
-                      retrieved = rag_search(user_input, full_text, similarity_threshold=0.3)
-                      if retrieved:
-                          context_content += f"\n{retrieved}\n"
-                  if context_content:
-                      current_prompt += f"\n\nContext:{context_content}"
-              # Get response
-              resp = get_llm_response(
-                  current_prompt,
-                  model=model,
-                  provider=provider,
-                  messages=messages,
-                  stream=False,  # Don't stream for voice
-                  npc=npc
-              )
+      def _chat_scroll_up():
+          _, h = sz()
+          chat_h = h - 5
+          if ui.chat_scroll == -1:
+              ui.chat_scroll = max(0, len(ui.chat_log) * 2 - chat_h - 1)
+          ui.chat_scroll = max(0, ui.chat_scroll - 1)
-              messages = resp.get('messages', messages)
-              response_text = str(resp.get('response', ''))
+      def _chat_scroll_down():
+          ui.chat_scroll = -1 if ui.chat_scroll == -1 else ui.chat_scroll + 1
-              # Display and speak response
-              print(colored(f"{npc_name}: ", "green") + response_text)
+      def _chat_page_up():
+          _, h = sz()
+          chat_h = h - 5
+          if ui.chat_scroll == -1:
+              ui.chat_scroll = max(0, len(ui.chat_log) * 2 - chat_h - chat_h)
+          else:
+              ui.chat_scroll = max(0, ui.chat_scroll - chat_h)
+      def _chat_page_down():
+          ui.chat_scroll = -1
+      def handle_chat(c, fd):
+          # Ctrl+L = toggle listening
+          if c == '\x0c':  # Ctrl+L
               if AUDIO_AVAILABLE:
-                  speak_text(response_text, tts_model, voice)
-          except KeyboardInterrupt:
-              print("\nUse '/yq' to exit or continue.")
-              continue
-          except EOFError:
-              print("\nExiting yap mode.")
-              break
+                  ui.listening = not ui.listening
+                  st = 'on' if ui.listening else 'off'
+                  ui.chat_log.append(('info', f'Listening {st}.'))
+              return True
+          if ui.recording or ui.transcribing:
+              return True
+          if ui.thinking:
+              return True
+          if c in ('\r', '\n'):
+              text = ui.input_buf.strip()
+              ui.input_buf = ""
+              if text:
+                  send_message(text)
+              return True
+          if c == '\x7f' or c == '\x08':
+              ui.input_buf = ui.input_buf[:-1]
+              return True
+          if c >= ' ' and c <= '~':
+              ui.input_buf += c
+              ui.chat_scroll = -1
+              return True
+          return True
+      def handle_settings(c, fd):
+          SETTINGS_KEYS = ['tts_enabled', 'auto_speak', 'listening', 'silence_timeout', 'vad_threshold']
+          if ui.editing:
+              if c in ('\r', '\n'):
+                  val = ui.edit_buf.strip()
+                  if ui.edit_key == 'silence_timeout':
+                      try: ui.silence_timeout = max(0.3, min(10.0, float(val)))
+                      except: pass
+                  elif ui.edit_key == 'vad_threshold':
+                      try: ui.vad_threshold = max(0.1, min(0.9, float(val)))
+                      except: pass
+                  ui.editing = False
+                  ui.edit_buf = ""
+              elif c == '\x7f' or c == '\x08':
+                  ui.edit_buf = ui.edit_buf[:-1]
+              elif c >= ' ' and c <= '~':
+                  ui.edit_buf += c
+              return True
+          if c == 'j' and ui.set_sel < len(SETTINGS_KEYS) - 1:
+              ui.set_sel += 1
+          elif c == 'k' and ui.set_sel > 0:
+              ui.set_sel -= 1
+          elif c == ' ':
+              key = SETTINGS_KEYS[ui.set_sel]
+              if key == 'tts_enabled':
+                  ui.tts_enabled = not ui.tts_enabled
+              elif key == 'auto_speak':
+                  ui.auto_speak = not ui.auto_speak
+              elif key == 'listening':
+                  ui.listening = not ui.listening
+                  st = 'on' if ui.listening else 'off'
+                  ui.chat_log.append(('info', f'Listening {st}.'))
+          elif c == 'e':
+              key = SETTINGS_KEYS[ui.set_sel]
+              if key in ('silence_timeout', 'vad_threshold'):
+                  ui.editing = True
+                  ui.edit_key = key
+                  ui.edit_buf = str(ui.silence_timeout if key == 'silence_timeout' else ui.vad_threshold)
+          return True
+      # ================================================================
+      #  Welcome
+      # ================================================================
+      ui.chat_log.append(('info', f'YAP voice chat. NPC: {npc_name}.'))
+      ui.chat_log.append(('info', f'TTS: {tts_model_name}/{voice_name}  LLM: {model or "?"}@{provider or "?"}'))
+      if AUDIO_AVAILABLE:
+          ui.chat_log.append(('info', 'Listening for speech. Just start talking, or type text.'))
+          ui.chat_log.append(('info', 'Ctrl+L to pause/resume listening. Ctrl+S to change settings.'))
+      else:
+          ui.chat_log.append(('info', 'Audio not available. Text mode only. Ctrl+S to change settings.'))
+      if loaded_chunks:
+          ui.chat_log.append(('info', f'{len(loaded_chunks)} files loaded for context.'))
+      # Start VAD listener thread
+      _listener_thread = None
+      if AUDIO_AVAILABLE and vad_model is not None:
+          _listener_thread = threading.Thread(target=vad_listener_loop, daemon=True)
+          _listener_thread.start()
+      # ================================================================
+      #  Main loop
+      # ================================================================
+      fd = sys.stdin.fileno()
+      old_settings = termios.tcgetattr(fd)
+      try:
+          tty.setcbreak(fd)
+          sys.stdout.write('\033[?25l\033[2J')
+          running = True
+          while running:
+              render()
+              if ui.thinking or ui.recording or ui.transcribing or ui.speaking or ui.listening:
+                  ui.spinner_frame += 1
+              if _sel.select([fd], [], [], 0.15)[0]:
+                  c = os.read(fd, 1).decode('latin-1')
+                  running = handle_key(c, fd)
+      finally:
+          ui.listen_stop = True
+          termios.tcsetattr(fd, termios.TCSADRAIN, old_settings)
+          sys.stdout.write('\033[?25h\033[2J\033[H')
+          sys.stdout.flush()
       context['output'] = "Exited yap mode."
       context['messages'] = messages

npcsh 1.1.21__py3-none-any.whl → 1.1.23__py3-none-any.whl

npcsh 1.1.21py3-none-any.whl → 1.1.23py3-none-any.whl