npm - @innvisor/conny-ai - Versions diffs - 9.8.2 → 9.8.5 - Mend

@innvisor/conny-ai 9.8.2 → 9.8.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9)

package/CHANGELOG.md +12 -0
package/conny_app.py +5 -3
package/conny_cli.py +3 -0
package/conny_studio.py +53 -11
package/npm/conny.js +2 -2
package/package.json +1 -1
package/src/conny/channels/cli.py +3 -0
package/src/conny/demo/handler.py +27 -97
package/src/interfaces/web/demo_handler.py +24 -101

package/CHANGELOG.md CHANGED Viewed

@@ -1,5 +1,17 @@
 # Changelog
+## 9.8.4 - 2026-06-02
+- made bare `conny` route to the modern onboarding/chat surface instead of the legacy help screen
+- kept `conny init` untouched while preserving the same banner and branding in the post-onboarding chat UI
+- aligned the legacy Python CLI fallback so direct `conny_cli.py` launches follow the same start behavior
+## 9.8.3 - 2026-06-02
+- made `conny` open the real chat interface after onboarding instead of the setup flow
+- kept `conny init` unchanged and preserved its banner/design exactly
+- added slash-command chat shortcuts with a Codex-style launcher header
 ## 9.8.2 - 2026-06-02
 - persisted the language selected in `conny init` so the rest of the CLI loads it automatically

package/conny_app.py CHANGED Viewed

@@ -282,10 +282,12 @@ def _sh(*a):
 def main():
     signal.signal(signal.SIGINT, lambda *_: sys.exit(0))
-    if first_run() and not (len(sys.argv)>1 and sys.argv[1] in ("help","--help","-h","-v","--version")):
-        onboard()
     if len(sys.argv) <= 1:
-        cmd_new()
+        if first_run():
+            onboard()
+            return
+        cmd_chat()
+        return
     else:
         route(sys.argv[1], " ".join(sys.argv[2:]))

package/conny_cli.py CHANGED Viewed

@@ -11845,6 +11845,9 @@ def main():
         if not workspace_is_configured() or not get_instances():
             cmd_init(args)
             return
+        modern_entrypoint = Path(os.environ.get("CONNY_DIR", os.path.dirname(os.path.abspath(__file__)))) / "conny_app.py"
+        subprocess.call([sys.executable, str(modern_entrypoint)])
+        return
     # Help
     if args.help or cmd in ("help", "--help", "-h", ""):

package/conny_studio.py CHANGED Viewed

@@ -1,20 +1,32 @@
 #!/usr/bin/env python3
-"""conny_studio.py — Interactive CLI session with live monitoring."""
+"""conny_studio.py — Interactive CLI chat with live monitoring."""
 import asyncio
 import json
 import os
 import sys
 import time
 import uuid
+import subprocess
 from pathlib import Path
 from datetime import datetime
 import httpx
+from rich.console import Console
 sys.path.insert(0, str(Path(__file__).parent))
+from conny_design import LOGO_FULL, SEP, ICON_BRAND
 from conny_uncertainty import UncertaintyDetector
 from conny_voice import ConnyVoice
+CONSOLE = Console()
+VERSION = "9.8.2"
+try:
+    package_path = Path(__file__).resolve().parent / "package.json"
+    if package_path.exists():
+        VERSION = json.loads(package_path.read_text(encoding="utf-8")).get("version", VERSION)
+except Exception:
+    pass
 STUDIO_DIR = Path.home() / ".conny" / "studio" / "memory"
 API_URL = "http://localhost:8001/test"
@@ -69,11 +81,16 @@ class ConnyStudio:
                 }, ensure_ascii=False) + "\n")
     async def handle_command(self, cmd: str) -> str:
+        if cmd in ("/help", "/menu", "/start"):
+            return (
+                "Comandos: /help /menu /clear /history /models /config /language "
+                "/export /reload-persona /fix-last"
+            )
         if cmd == "/clear":
             self.history = []
             self.chat_id = f"studio_{uuid.uuid4().hex[:8]}"
             return "Session cleared. New conversation started."
-        elif cmd == "/show-memory":
+        elif cmd in ("/history", "/show-memory"):
             if not self.history:
                 return "No turns in memory yet."
             lines = []
@@ -81,6 +98,14 @@ class ConnyStudio:
                 role = "YOU" if h["role"] == "user" else "MEL"
                 lines.append(f"  [{role}] {h['content'][:80]}")
             return "\n".join(lines)
+        elif cmd == "/models":
+            return self._run_cli_command("modelo")
+        elif cmd == "/config":
+            return self._run_cli_command("config")
+        elif cmd == "/language":
+            return self._run_cli_command("language")
+        elif cmd in ("/new", "/init"):
+            return self._run_cli_command("init")
         elif cmd == "/show-failures":
             if not self.failures_file.exists():
                 return "No failures detected this session."
@@ -101,13 +126,28 @@ class ConnyStudio:
             return "No previous turn to fix."
         return f"Unknown command: {cmd}"
+    def _run_cli_command(self, command: str) -> str:
+        cli = Path(__file__).resolve().parent / "conny_cli.py"
+        if not cli.exists():
+            return f"CLI no disponible para /{command}"
+        try:
+            print(f"\033[90m[system] launching: conny {command}\033[0m")
+            subprocess.run([sys.executable, str(cli), command], check=False)
+            return f"/{command} closed. Back in chat."
+        except Exception as exc:
+            return f"No pude abrir /{command}: {exc}"
     def print_header(self):
-        print("\033[1;36m╔══════════════════════════════════════════════╗\033[0m")
-        print("\033[1;36m║  CONNY STUDIO v1.0                         ║\033[0m")
-        print(f"\033[1;36m║  Instance: {self.instance_id:<33}║\033[0m")
-        print(f"\033[1;36m║  Session: {self.session_id:<34}║\033[0m")
-        print("\033[1;36m╚══════════════════════════════════════════════╝\033[0m")
-        print("\033[90mCommands: /clear /show-memory /show-failures /fix-last /reload-persona /export-session\033[0m\n")
+        print()
+        CONSOLE.print(LOGO_FULL)
+        CONSOLE.print(f"  {ICON_BRAND} v{VERSION}  ·  chat real")
+        CONSOLE.print(SEP)
+        print(f"  Instance: {self.instance_id}")
+        print(f"  Session:  {self.session_id}")
+        print("  Comandos: /help /menu /clear /history /models /config /language /export")
+        print("  Atajos: 1=models 2=config 3=language 4=help")
+        CONSOLE.print(SEP)
+        print()
     def print_scores(self, scores):
         conf = scores["confidence"]
@@ -122,14 +162,16 @@ class ConnyStudio:
         self.print_header()
         while True:
             try:
-                user_input = input("\033[1;32m[YOU]\033[0m ")
+                user_input = input("\033[1;32m[YOU]\033[0m ").strip()
             except (EOFError, KeyboardInterrupt):
                 print("\n\033[90mSession ended.\033[0m")
                 break
-            if not user_input.strip():
+            if not user_input:
                 continue
+            if user_input in ("1", "2", "3", "4"):
+                user_input = { "1": "/models", "2": "/config", "3": "/language", "4": "/help" }[user_input]
             if user_input.startswith("/"):
-                result = await self.handle_command(user_input.strip())
+                result = await self.handle_command(user_input)
                 print(f"\033[1;33m[SYSTEM]\033[0m {result}")
                 continue
             try:

package/npm/conny.js CHANGED Viewed

@@ -485,7 +485,7 @@ function execConny(argv) {
 }
 const args = process.argv.slice(2);
-const isHelp = args.length === 0 || args.includes("-h") || args.includes("--help") || args.includes("help");
+const isHelp = args.includes("-h") || args.includes("--help") || args.includes("help");
 const isVersion = args.includes("-v") || args.includes("--version") || args.includes("version");
 const isBootstrapCheck = args.includes("--bootstrap-check");
 const isJson = args.includes("--json");
@@ -518,7 +518,7 @@ if (isHelp) {
   process.exit(0);
 }
-const launchArgs = args.length === 0 ? ["new"] : args;
+const launchArgs = args;
 if (!execConny(launchArgs)) {
   fail(`No pude iniciar Conny desde ${connyHome}`);

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@innvisor/conny-ai",
-  "version": "9.8.2",
+  "version": "9.8.5",
   "description": "Open-source CLI and runtime for building Conny AI receptionist agents on WhatsApp and Telegram.",
   "license": "MIT",
   "author": "Santiago Rubio",

package/src/conny/channels/cli.py CHANGED Viewed

@@ -11785,6 +11785,9 @@ def main():
         if not workspace_is_configured() or not get_instances():
             cmd_init(args)
             return
+        modern_entrypoint = Path(os.environ.get("CONNY_DIR", os.path.dirname(os.path.abspath(__file__)))) / "conny_app.py"
+        subprocess.call([sys.executable, str(modern_entrypoint)])
+        return
     # Help
     if args.help or cmd in ("help", "--help", "-h", ""):

package/src/conny/demo/handler.py CHANGED Viewed

@@ -261,17 +261,8 @@ async def _handle_demo_message(self, chat_id: str, text: str,
             )
         _save("assistant", r)
         bubbles = self._split_bubbles(r, chat_id=chat_id, archetype=_demo_archetype)
-        if should_normalize_first_turn and len(bubbles) == 1:
-            _text_norm = _normalize_conv_text(text or "")
-            _greeting_tokens = (
-                "hola", "buenas", "buenas tardes", "buenos dias", "buenos días",
-                "buenas noches", "hey", "holi", "hi", "hello",
-                "good morning", "good afternoon", "good evening",
-            )
-            if any(_text_norm == token or _text_norm.startswith(token + " ") for token in _greeting_tokens):
-                lowered_bubble = _normalize_conv_text(bubbles[0] or "")
-                if not any(token in lowered_bubble for token in ("cuentame", "cuéntame", "revisar", "ayudo", "ayudar")):
-                    bubbles.append(_lang_text("cuéntame qué te gustaría revisar", "what would you like to check?"))
+        # The LLM owns the follow-up. Do not append generic CTA bubbles here:
+        # that made good model answers sound like fallback.
         tone = self._demo_sessions.get(btone_key, "GENERAL")
         if tone in ("SALUD PREMIUM", "PREMIUM"):
             bubbles = [b[0].upper() + b[1:] if b else b for b in bubbles]
@@ -665,6 +656,7 @@ async def _handle_demo_message(self, chat_id: str, text: str,
             ),
         ]
         had_output = False
+        last_candidate = None
         for prompt_now, temp_now, max_now, tier_now, limit_now in attempts:
             # No lanzar repair si ya pasó demasiado tiempo desde que llegó el mensaje
             if time.time() - _chain_start > _CHAIN_TIMEOUT_S:
@@ -679,9 +671,12 @@ async def _handle_demo_message(self, chat_id: str, text: str,
             )
             if candidate and candidate.strip():
                 had_output = True
+                last_candidate = candidate
                 if not validator(candidate):
                     return candidate, True
-        return None, had_output
+        if had_output and last_candidate:
+            return last_candidate, True
+        return None, False
     def _save(role, msg):
         if db:
@@ -723,20 +718,7 @@ async def _handle_demo_message(self, chat_id: str, text: str,
             )
         _save("assistant", r)
         bubbles = self._split_bubbles(r, chat_id=chat_id, archetype=_demo_archetype)
-        # FIX BUG 4: Si es el primer turno, el usuario saludó, y la respuesta tiene
-        # solo 1 burbuja sin pregunta de seguimiento → agregar burbuja de apertura.
-        # Esta lógica existía en la primera definición de _send (línea 13772) pero
-        # se perdió cuando se redefinió _send aquí en la misma función.
-        if should_normalize_first_turn and len(bubbles) == 1:
-            _text_norm = _normalize_conv_text(text or "")
-            _greeting_tokens = (
-                "hola", "buenas", "buenas tardes", "buenos dias", "buenos días",
-                "buenas noches", "hey", "holi",
-            )
-            if any(_text_norm == token or _text_norm.startswith(token + " ") for token in _greeting_tokens):
-                lowered_bubble = _normalize_conv_text(bubbles[0] or "")
-                if not any(token in lowered_bubble for token in ("cuentame", "cuéntame", "revisar", "ayudo", "ayudar")):
-                    bubbles.append("cuéntame qué te gustaría revisar")
+        # The LLM owns the follow-up. Do not append generic CTA bubbles here.
         # Para premium/salud premium: restaurar mayúscula inicial
         tone = self._demo_sessions.get(btone_key, "GENERAL")
         if tone in ("SALUD PREMIUM", "PREMIUM"):
@@ -1089,6 +1071,7 @@ async def _handle_demo_message(self, chat_id: str, text: str,
             ),
         ]
         had_output = False
+        last_candidate = None
         for prompt_now, temp_now, max_now, tier_now in attempts:
             candidate = await _llm(
                 prompt_now,
@@ -1099,9 +1082,12 @@ async def _handle_demo_message(self, chat_id: str, text: str,
             )
             if candidate and candidate.strip():
                 had_output = True
+                last_candidate = candidate
                 if not validator(candidate):
                     return candidate, True
-        return None, had_output
+        if had_output and last_candidate:
+            return last_candidate, True
+        return None, False
     def _demo_owner_last_resort(
         user_text: str,
@@ -1806,63 +1792,7 @@ Máximo 1 oración por burbuja. Natural y seguro."""
             max_t=220,
         )
         if not r:
-            if found:
-                r = _lang_text(
-                    f"ya tengo {nombre} ||| ya me ubiqué con cómo tendría que sonar esto ||| Escríbeme como si fueras un cliente y te respondo",
-                    f"I’ve got {nombre} now ||| I already know how this chat should sound ||| text me like a real client and I’ll reply in context",
-                    f"já tenho {nombre} ||| já entendi como esse chat precisa soar ||| me escreve como um cliente real e eu respondo em contexto",
-                )
-            else:
-                # v12: no info → opciones naturales, sin exponer estado interno
-                if _owner_is_english():
-                    _no_info_opts = [
-                        f"got it, {nombre} ||| tell me what the business does and I’ll shape the demo around that",
-                        f"okay, {nombre} ||| I’m not finding solid public info yet, so tell me what you offer and I’ll ground it from there",
-                        f"I’ve got the name now ||| give me a quick picture of the business and I’ll keep going",
-                    ]
-                elif _owner_is_portuguese():
-                    _no_info_opts = [
-                        f"perfeito, {nombre} ||| me conta com o que o negócio trabalha e eu monto a demo nisso",
-                        f"ok, {nombre} ||| ainda não achei informação pública forte, então me conta o que vocês oferecem e eu ajusto a demo",
-                        f"já tenho o nome ||| me dá um resumo rápido do negócio e eu sigo daqui",
-                    ]
-                else:
-                    _no_info_opts = [
-                        f"ya anoté {nombre} ||| cuéntame a qué se dedican y te muestro cómo respondería",
-                        f"listo, {nombre} ||| no los encuentro en Google todavía — cuéntame qué hacen y arrancamos",
-                        f"ya los tengo ||| igual puedo hacer la demo — escríbeme un poco de qué trata el negocio",
-                    ]
-                r = _r.choice(_no_info_opts)
-        # ── Burbuja extra: confirmación del link ─────────────────────────
-        # Solo si encontramos info real (no cuando usamos el fallback de Google search)
-        import urllib.parse as _up
-        is_fallback_url = biz_url.startswith("https://www.google.com/search") or biz_url.startswith("https://www.google.com/maps/search")
-        if biz_url and found and not is_fallback_url:
-            # Natural: manda el link con texto corto, sin pregunta directa
-            if _owner_is_english():
-                _link_intros = [
-                    "I found this for you",
-                    "this looks like your business",
-                    "I found you here",
-                    "this is what I found for the business",
-                ]
-            elif _owner_is_portuguese():
-                _link_intros = [
-                    "achei isso de vocês",
-                    "encontrei vocês por aqui",
-                    "isso parece ser de vocês",
-                    "foi isso que eu achei do negócio",
-                ]
-            else:
-                _link_intros = [
-                    "mira, encontré esto de ustedes",
-                    "los encontré por acá",
-                    "esto es de ustedes",
-                    "vi esto de su negocio",
-                ]
-            r = r.rstrip() + f" ||| {_r.choice(_link_intros)} ||| {biz_url}"
+            return _send("⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         return _send(r)
     # ── Confirmación positiva del link: "sí ese es / correcto / sí" ───────────
@@ -2155,7 +2085,7 @@ Natural, sin punto al final, sin ¿¡, en minúscula.""",
                     f"perfecto, ya leí el documento de {business_name}"
                     f" ||| ya sé de qué se tratan — probemos, Escríbeme algo como cliente"
                 )
-                return _send(r or fallback)
+                return _send(r if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
             else:
                 # Doc llegó pero no pudimos extraer texto (imagen, binario raro)
                 return _send(
@@ -2244,7 +2174,7 @@ Natural, sin punto al final, sin ¿¡, en minúscula.""",
                 f"listo, ya entendí bien lo que hace {business_name} ||| "
                 f"arrancamos? Escríbeme algo como cliente a ver qué pasa"
             )
-            return _send(r or fallback)
+            return _send(r if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         elif not _has_what:
             # Falta: qué hacen
@@ -2255,7 +2185,7 @@ Todavía no sabes exactamente qué servicios o productos ofrecen.
 Haz UNA pregunta natural para entenderlo. Muy corta. Sin punto al final. En minúscula. Sin ¿ ni ¡.""",
                 "preguntando qué hacen", max_t=80
             )
-            return _send(r or "y a qué se dedican exactamente")
+            return _send(r if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         elif not _has_where:
             # Falta: dónde están
@@ -2267,7 +2197,7 @@ Haz UNA pregunta natural para saberlo. Muy corta. Sin punto al final. En minúsc
 Ejemplo: "y dónde están ubicados?" o "en qué ciudad o barrio están" """,
                 "preguntando ubicación", max_t=80
             )
-            return _send(r or "¿y dónde están ubicados?")
+            return _send(r if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         else:
             # Seguir aprendiendo con una pregunta más
@@ -2278,7 +2208,7 @@ Haz UNA pregunta más para entender mejor al negocio (horario, qué los diferenc
 Muy corta. Sin punto al final. En minúscula. Sin ¿ ni ¡.""",
                 "pregunta adicional", max_t=80
             )
-            return _send(r or "¿y cuál es su horario de atención?")
+            return _send(r if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
     # ── INTERCEPTOR: preguntas meta (soy bot? eres real? eres IA?) ─────────
     # Deben responderse ANTES del flujo normal — sin buscar en web ni confundirse
@@ -2427,6 +2357,7 @@ IDENTIDAD Y CREADOR — REGLA DURA
 """
         customer_history = sim_history[-8:]
         customer_had_output = False
+        last_candidate = None
         customer_reply = None
         original_history = history
         history = customer_history
@@ -2574,7 +2505,7 @@ Maneja en 2 burbujas (|||). REGLAS ESTRICTAS:
 Ejemplo del tono que quiero:
   "sí, hay de todo en el mercado ||| qué presupuesto tienes más o menos, para ver qué te muestro" """, "maneja la objeción")
-            return _send((r or f"sí, hay de todo en el mercado ||| qué presupuesto tienes más o menos, para ver qué te muestro") + _next_trick())
+            return _send((r + _next_trick()) if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         if detected_cmd == "/cita":
             r = await _llm(f"""Eres Conny, asesora de {business_name}. Un cliente acaba de decir que quiere ir o comprar.
@@ -2590,7 +2521,7 @@ Flujo sugerido:
 Sin punto al final. Sin ¿¡. Máximo 1-2 oraciones por burbuja.
 Ejemplo del tono: "qué producto te interesa llevar ||| esta semana puedo el miércoles o el viernes — cuál te queda" """,
                 "quiero comprar / quiero ir", max_t=350)
-            return _send((r or f"qué te interesa llevar ||| esta semana tengo el miércoles o el viernes, cuál te queda mejor") + _next_trick())
+            return _send((r + _next_trick()) if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         if detected_cmd == "/stats":
             return _send(f"el 78% de los clientes no vuelven si no les responden en menos de 5 minutos ||| una cita perdida en {business_name} vale entre $80k y $500k según el servicio ||| Conny responde en menos de 3 segundos, 24/7, sin días libres ni mal humor" + _next_trick())
@@ -2601,7 +2532,7 @@ Ejemplo del tono: "qué producto te interesa llevar ||| esta semana puedo el mi
         if detected_cmd == "/cierre":
             r = await _llm(f"""Eres Conny de {business_name}. Un cliente lleva 3 mensajes dudando.
 Haz el cierre en 2 burbujas (|||). Directo, con urgencia real. Sin presión forzada. Sin punto al final.""", "no sé, lo pienso")
-            return _send((r or f"claro, sin afán ||| igual te separo un espacio esta semana — si decides que no, lo cancelas. te queda bien el jueves") + _next_trick())
+            return _send((r + _next_trick()) if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         if detected_cmd == "/list":
             lista = (
@@ -2673,7 +2604,7 @@ Haz el cierre en 2 burbujas (|||). Directo, con urgencia real. Sin presión forz
             r = await _llm(f"""El usuario ha dicho: "{hist_text[:300]}"
 Extrae datos mencionados (nombre, interés, servicio). Demuestra en 2 burbujas (|||) que los recuerdas.
 Si no hay datos: "todavía no me has dado tu nombre — pero cuando lo hagas, lo recuerdo para siempre". Sin punto al final.""", "qué recuerdas")
-            return _send(r or "todo lo que me dices lo guardo ||| nombre, servicio de interés, objeciones — todo queda")
+            return _send(r if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         if detected_cmd == "/2am":
             return _send(f"son las 2 de la madrugada y estoy aquí ||| tu recepcionista está durmiendo — yo no. nunca" + _next_trick())
@@ -2681,12 +2612,12 @@ Si no hay datos: "todavía no me has dado tu nombre — pero cuando lo hagas, lo
         if detected_cmd == "/competencia":
             r = await _llm(f"""Eres Conny de {business_name}. Un cliente dice: "ya fui a otra parte y no me gustó."
 Responde en 2 burbujas (|||). Sin atacar a la competencia. Natural. Sin punto al final.""", "ya fui a otro lado")
-            return _send((r or f"ay qué pena ||| qué fue lo que no te gustó — acá antes de tocar nada hacemos valoración para asegurarnos del resultado") + _next_trick())
+            return _send((r + _next_trick()) if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         if detected_cmd == "/precio":
             r = await _llm(f"""Eres Conny de {business_name}. Un cliente dice: "está muy caro."
 Maneja en 2 burbujas (|||). Enfócate en valor. Cierra hacia valoración con día concreto. Sin punto al final.""", "está muy caro")
-            return _send((r or f"sí, vale lo que vale ||| los resultados duran, en la valoración gratis te dicen el número exacto. cuándo puedes") + _next_trick())
+            return _send((r + _next_trick()) if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         if detected_cmd == "/menu_bot":
             # Modo bot — IVR con emojis, ideal para negocios que prefieren menú estructurado
@@ -3055,7 +2986,7 @@ OBJECIONES
         recent_limit=8,
     )
     if not r:
-        r = _demo_customer_last_resort(text)
+        r = "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente."
     # Solo revelar truco si la respuesta tiene contenido real (>60 chars)
     # y no termina en pregunta (no interrumpir el flujo de la conversación)
     if _should_reveal_trick and r and len(r.replace("|||","").strip()) > 60:
@@ -3107,4 +3038,3 @@ OBJECIONES
     return _send(r)

package/src/interfaces/web/demo_handler.py CHANGED Viewed

@@ -447,17 +447,8 @@ async def handle_demo_message(
             )
         _save("assistant", r)
         bubbles = self._split_bubbles(r, chat_id=chat_id, archetype=_demo_archetype)
-        if should_normalize_first_turn and len(bubbles) == 1:
-            _text_norm = _normalize_conv_text(text or "")
-            _greeting_tokens = (
-                "hola", "buenas", "buenas tardes", "buenos dias", "buenos días",
-                "buenas noches", "hey", "holi", "hi", "hello",
-                "good morning", "good afternoon", "good evening",
-            )
-            if any(_text_norm == token or _text_norm.startswith(token + " ") for token in _greeting_tokens):
-                lowered_bubble = _normalize_conv_text(bubbles[0] or "")
-                if not any(token in lowered_bubble for token in ("cuentame", "cuéntame", "revisar", "ayudo", "ayudar")):
-                    bubbles.append(_lang_text("cuéntame qué te gustaría revisar", "what would you like to check?"))
+        # The LLM owns the follow-up. Do not append generic CTA bubbles here:
+        # that made good model answers sound like fallback.
         tone = self._demo_sessions.get(btone_key, "GENERAL")
         if tone in ("SALUD PREMIUM", "PREMIUM"):
             bubbles = [b[0].upper() + b[1:] if b else b for b in bubbles]
@@ -978,11 +969,10 @@ async def handle_demo_message(
                 last_candidate = candidate
                 if not validator(candidate):
                     return candidate, True
-        if had_output and last_candidate and not looks_fragmented_reply(last_candidate):
-            candidate_norm = _normalize_conv_text(last_candidate)
-            if len(candidate_norm.split()) >= 5 and not validator(last_candidate):
-                return last_candidate, True
-        return None, had_output
+        # BUG FIX ARCHITECTURE: si el modelo generó algo, así no pase validaciones, se devuelve. NO FALLBACK.
+        if had_output and last_candidate:
+            return last_candidate, True
+        return None, False
     def _save(role, msg):
         if db:
@@ -1024,20 +1014,7 @@ async def handle_demo_message(
             )
         _save("assistant", r)
         bubbles = self._split_bubbles(r, chat_id=chat_id, archetype=_demo_archetype)
-        # FIX BUG 4: Si es el primer turno, el usuario saludó, y la respuesta tiene
-        # solo 1 burbuja sin pregunta de seguimiento → agregar burbuja de apertura.
-        # Esta lógica existía en la primera definición de _send (línea 13772) pero
-        # se perdió cuando se redefinió _send aquí en la misma función.
-        if should_normalize_first_turn and len(bubbles) == 1:
-            _text_norm = _normalize_conv_text(text or "")
-            _greeting_tokens = (
-                "hola", "buenas", "buenas tardes", "buenos dias", "buenos días",
-                "buenas noches", "hey", "holi",
-            )
-            if any(_text_norm == token or _text_norm.startswith(token + " ") for token in _greeting_tokens):
-                lowered_bubble = _normalize_conv_text(bubbles[0] or "")
-                if not any(token in lowered_bubble for token in ("cuentame", "cuéntame", "revisar", "ayudo", "ayudar")):
-                    bubbles.append("cuéntame qué te gustaría revisar")
+        # The LLM owns the follow-up. Do not append generic CTA bubbles here.
         # Para premium/salud premium: restaurar mayúscula inicial
         tone = self._demo_sessions.get(btone_key, "GENERAL")
         if tone in ("SALUD PREMIUM", "PREMIUM"):
@@ -1336,10 +1313,12 @@ async def handle_demo_message(
             )
             if candidate and candidate.strip():
                 had_output = True
+                last_candidate = candidate
                 if not validator(candidate):
                     return candidate, True
-        return None, had_output
+        if had_output and last_candidate:
+            return last_candidate, True
+        return None, False
     def _demo_owner_last_resort(
         user_text: str,
@@ -2181,63 +2160,7 @@ Máximo 1 oración por burbuja. Natural y seguro."""
             max_t=220,
         )
         if not r:
-            if found:
-                r = _lang_text(
-                    f"ya tengo {nombre} ||| ya me ubiqué con cómo tendría que sonar esto ||| Escríbeme como si fueras un cliente y te respondo",
-                    f"I’ve got {nombre} now ||| I already know how this chat should sound ||| text me like a real client and I’ll reply in context",
-                    f"já tenho {nombre} ||| já entendi como esse chat precisa soar ||| me escreve como um cliente real e eu respondo em contexto",
-                )
-            else:
-                # v12: no info → opciones naturales, sin exponer estado interno
-                if _owner_is_english():
-                    _no_info_opts = [
-                        f"got it, {nombre} ||| tell me what the business does and I’ll shape the demo around that",
-                        f"okay, {nombre} ||| I’m not finding solid public info yet, so tell me what you offer and I’ll ground it from there",
-                        f"I’ve got the name now ||| give me a quick picture of the business and I’ll keep going",
-                    ]
-                elif _owner_is_portuguese():
-                    _no_info_opts = [
-                        f"perfeito, {nombre} ||| me conta com o que o negócio trabalha e eu monto a demo nisso",
-                        f"ok, {nombre} ||| ainda não achei informação pública forte, então me conta o que vocês oferecem e eu ajusto a demo",
-                        f"já tenho o nome ||| me dá um resumo rápido do negócio e eu sigo daqui",
-                    ]
-                else:
-                    _no_info_opts = [
-                        f"ya anoté {nombre} ||| cuéntame a qué se dedican y te muestro cómo respondería",
-                        f"listo, {nombre} ||| no los encuentro en Google todavía — cuéntame qué hacen y arrancamos",
-                        f"ya los tengo ||| igual puedo hacer la demo — escríbeme un poco de qué trata el negocio",
-                    ]
-                r = _r.choice(_no_info_opts)
-        # ── Burbuja extra: confirmación del link ─────────────────────────
-        # Solo si encontramos info real (no cuando usamos el fallback de Google search)
-        import urllib.parse as _up
-        is_fallback_url = biz_url.startswith("https://www.google.com/search") or biz_url.startswith("https://www.google.com/maps/search")
-        if biz_url and found and not is_fallback_url:
-            # Natural: manda el link con texto corto, sin pregunta directa
-            if _owner_is_english():
-                _link_intros = [
-                    "I found this for you",
-                    "this looks like your business",
-                    "I found you here",
-                    "this is what I found for the business",
-                ]
-            elif _owner_is_portuguese():
-                _link_intros = [
-                    "achei isso de vocês",
-                    "encontrei vocês por aqui",
-                    "isso parece ser de vocês",
-                    "foi isso que eu achei do negócio",
-                ]
-            else:
-                _link_intros = [
-                    "mira, encontré esto de ustedes",
-                    "los encontré por acá",
-                    "esto es de ustedes",
-                    "vi esto de su negocio",
-                ]
-            r = r.rstrip() + f" ||| {_r.choice(_link_intros)} ||| {biz_url}"
+            return _send("⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         return _send(r)
     # ── Confirmación positiva del link: "sí ese es / correcto / sí" ───────────
@@ -2553,7 +2476,7 @@ Natural, sin punto al final, sin ¿¡, en minúscula.""",
                     f"perfecto, ya leí el documento de {business_name}"
                     f" ||| ya sé de qué se tratan — probemos, Escríbeme algo como cliente"
                 )
-                return _send(r or fallback)
+                return _send(r if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
             else:
                 # Doc llegó pero no pudimos extraer texto (imagen, binario raro)
                 return _send(
@@ -2714,7 +2637,7 @@ Natural, sin punto al final, sin ¿¡, en minúscula.""",
                 f"listo, ya entendí bien lo que hace {business_name} ||| "
                 f"arrancamos? Escríbeme algo como cliente a ver qué pasa"
             )
-            return _send(r or fallback)
+            return _send(r if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         elif not _has_what:
             # Falta: qué hacen
@@ -2725,7 +2648,7 @@ Todavía no sabes exactamente qué servicios o productos ofrecen.
 Haz UNA pregunta natural para entenderlo. Muy corta. Sin punto al final. En minúscula. Sin ¿ ni ¡.""",
                 "preguntando qué hacen", max_t=80
             )
-            return _send(r or "y a qué se dedican exactamente")
+            return _send(r if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         elif not _has_where:
             # Falta: dónde están
@@ -2737,7 +2660,7 @@ Haz UNA pregunta natural para saberlo. Muy corta. Sin punto al final. En minúsc
 Ejemplo: "y dónde están ubicados?" o "en qué ciudad o barrio están" """,
                 "preguntando ubicación", max_t=80
             )
-            return _send(r or "¿y dónde están ubicados?")
+            return _send(r if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         else:
             # Seguir aprendiendo con una pregunta más
@@ -2748,7 +2671,7 @@ Haz UNA pregunta más para entender mejor al negocio (horario, qué los diferenc
 Muy corta. Sin punto al final. En minúscula. Sin ¿ ni ¡.""",
                 "pregunta adicional", max_t=80
             )
-            return _send(r or "¿y cuál es su horario de atención?")
+            return _send(r if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
     # ── INTERCEPTOR: preguntas meta (soy bot? eres real? eres IA?) ─────────
     # Deben responderse ANTES del flujo normal — sin buscar en web ni confundirse
@@ -3047,7 +2970,7 @@ Maneja en 2 burbujas (|||). REGLAS ESTRICTAS:
 Ejemplo del tono que quiero:
   "sí, hay de todo en el mercado ||| qué presupuesto tienes más o menos, para ver qué te muestro" """, "maneja la objeción")
-            return _send((r or f"sí, hay de todo en el mercado ||| qué presupuesto tienes más o menos, para ver qué te muestro") + _next_trick())
+            return _send((r + _next_trick()) if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         if detected_cmd == "/cita":
             r = await _llm(f"""Eres Conny, asesora de {business_name}. Un cliente acaba de decir que quiere ir o comprar.
@@ -3063,7 +2986,7 @@ Flujo sugerido:
 Sin punto al final. Sin ¿¡. Máximo 1-2 oraciones por burbuja.
 Ejemplo del tono: "qué producto te interesa llevar ||| esta semana puedo el miércoles o el viernes — cuál te queda" """,
                 "quiero comprar / quiero ir", max_t=350)
-            return _send((r or f"qué te interesa llevar ||| esta semana tengo el miércoles o el viernes, cuál te queda mejor") + _next_trick())
+            return _send((r + _next_trick()) if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         if detected_cmd == "/stats":
             return _send(f"el 78% de los clientes no vuelven si no les responden en menos de 5 minutos ||| una cita perdida en {business_name} vale entre $80k y $500k según el servicio ||| Conny responde en menos de 3 segundos, 24/7, sin días libres ni mal humor" + _next_trick())
@@ -3074,7 +2997,7 @@ Ejemplo del tono: "qué producto te interesa llevar ||| esta semana puedo el mi
         if detected_cmd == "/cierre":
             r = await _llm(f"""Eres Conny de {business_name}. Un cliente lleva 3 mensajes dudando.
 Haz el cierre en 2 burbujas (|||). Directo, con urgencia real. Sin presión forzada. Sin punto al final.""", "no sé, lo pienso")
-            return _send((r or f"claro, sin afán ||| igual te separo un espacio esta semana — si decides que no, lo cancelas. te queda bien el jueves") + _next_trick())
+            return _send((r + _next_trick()) if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         if detected_cmd == "/list":
             lista = (
@@ -3146,7 +3069,7 @@ Haz el cierre en 2 burbujas (|||). Directo, con urgencia real. Sin presión forz
             r = await _llm(f"""El usuario ha dicho: "{hist_text[:300]}"
 Extrae datos mencionados (nombre, interés, servicio). Demuestra en 2 burbujas (|||) que los recuerdas.
 Si no hay datos: "todavía no me has dado tu nombre — pero cuando lo hagas, lo recuerdo para siempre". Sin punto al final.""", "qué recuerdas")
-            return _send(r or "todo lo que me dices lo guardo ||| nombre, servicio de interés, objeciones — todo queda")
+            return _send(r if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         if detected_cmd == "/2am":
             return _send(f"son las 2 de la madrugada y estoy aquí ||| tu recepcionista está durmiendo — yo no. nunca" + _next_trick())
@@ -3154,12 +3077,12 @@ Si no hay datos: "todavía no me has dado tu nombre — pero cuando lo hagas, lo
         if detected_cmd == "/competencia":
             r = await _llm(f"""Eres Conny de {business_name}. Un cliente dice: "ya fui a otra parte y no me gustó."
 Responde en 2 burbujas (|||). Sin atacar a la competencia. Natural. Sin punto al final.""", "ya fui a otro lado")
-            return _send((r or f"ay qué pena ||| qué fue lo que no te gustó — acá antes de tocar nada hacemos valoración para asegurarnos del resultado") + _next_trick())
+            return _send((r + _next_trick()) if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         if detected_cmd == "/precio":
             r = await _llm(f"""Eres Conny de {business_name}. Un cliente dice: "está muy caro."
 Maneja en 2 burbujas (|||). Enfócate en valor. Cierra hacia valoración con día concreto. Sin punto al final.""", "está muy caro")
-            return _send((r or f"sí, vale lo que vale ||| los resultados duran, en la valoración gratis te dicen el número exacto. cuándo puedes") + _next_trick())
+            return _send((r + _next_trick()) if r else "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente.")
         if detected_cmd == "/menu_bot":
             # Modo bot — IVR con emojis, ideal para negocios que prefieren menú estructurado
@@ -3528,7 +3451,7 @@ OBJECIONES
         recent_limit=8,
     )
     if not r:
-        r = _demo_customer_last_resort(text)
+        r = "⚠️ Fallo del modelo LLM. No obtuve respuesta. Por favor, envía tu mensaje nuevamente."
     # Solo revelar truco si la respuesta tiene contenido real (>60 chars)
     # y no termina en pregunta (no interrumpir el flujo de la conversación)
     if _should_reveal_trick and r and len(r.replace("|||","").strip()) > 60: