PyPI - amd-gaia - Versions diffs - 0.15.0__py3-none-any.whl → 0.15.1__py3-none-any.whl - Mend

amd-gaia: 0.15.0 (py3-none-any.whl) → 0.15.1 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (181)

{amd_gaia-0.15.0.dist-info → amd_gaia-0.15.1.dist-info}/METADATA +223 -223
amd_gaia-0.15.1.dist-info/RECORD +178 -0
{amd_gaia-0.15.0.dist-info → amd_gaia-0.15.1.dist-info}/entry_points.txt +1 -0
{amd_gaia-0.15.0.dist-info → amd_gaia-0.15.1.dist-info}/licenses/LICENSE.md +20 -20
gaia/__init__.py +29 -29
gaia/agents/__init__.py +19 -19
gaia/agents/base/__init__.py +9 -9
gaia/agents/base/agent.py +2177 -2177
gaia/agents/base/api_agent.py +120 -120
gaia/agents/base/console.py +1841 -1841
gaia/agents/base/errors.py +237 -237
gaia/agents/base/mcp_agent.py +86 -86
gaia/agents/base/tools.py +83 -83
gaia/agents/blender/agent.py +556 -556
gaia/agents/blender/agent_simple.py +133 -135
gaia/agents/blender/app.py +211 -211
gaia/agents/blender/app_simple.py +41 -41
gaia/agents/blender/core/__init__.py +16 -16
gaia/agents/blender/core/materials.py +506 -506
gaia/agents/blender/core/objects.py +316 -316
gaia/agents/blender/core/rendering.py +225 -225
gaia/agents/blender/core/scene.py +220 -220
gaia/agents/blender/core/view.py +146 -146
gaia/agents/chat/__init__.py +9 -9
gaia/agents/chat/agent.py +835 -835
gaia/agents/chat/app.py +1058 -1058
gaia/agents/chat/session.py +508 -508
gaia/agents/chat/tools/__init__.py +15 -15
gaia/agents/chat/tools/file_tools.py +96 -96
gaia/agents/chat/tools/rag_tools.py +1729 -1729
gaia/agents/chat/tools/shell_tools.py +436 -436
gaia/agents/code/__init__.py +7 -7
gaia/agents/code/agent.py +549 -549
gaia/agents/code/cli.py +377 -0
gaia/agents/code/models.py +135 -135
gaia/agents/code/orchestration/__init__.py +24 -24
gaia/agents/code/orchestration/checklist_executor.py +1763 -1763
gaia/agents/code/orchestration/checklist_generator.py +713 -713
gaia/agents/code/orchestration/factories/__init__.py +9 -9
gaia/agents/code/orchestration/factories/base.py +63 -63
gaia/agents/code/orchestration/factories/nextjs_factory.py +118 -118
gaia/agents/code/orchestration/factories/python_factory.py +106 -106
gaia/agents/code/orchestration/orchestrator.py +841 -841
gaia/agents/code/orchestration/project_analyzer.py +391 -391
gaia/agents/code/orchestration/steps/__init__.py +67 -67
gaia/agents/code/orchestration/steps/base.py +188 -188
gaia/agents/code/orchestration/steps/error_handler.py +314 -314
gaia/agents/code/orchestration/steps/nextjs.py +828 -828
gaia/agents/code/orchestration/steps/python.py +307 -307
gaia/agents/code/orchestration/template_catalog.py +469 -469
gaia/agents/code/orchestration/workflows/__init__.py +14 -14
gaia/agents/code/orchestration/workflows/base.py +80 -80
gaia/agents/code/orchestration/workflows/nextjs.py +186 -186
gaia/agents/code/orchestration/workflows/python.py +94 -94
gaia/agents/code/prompts/__init__.py +11 -11
gaia/agents/code/prompts/base_prompt.py +77 -77
gaia/agents/code/prompts/code_patterns.py +2036 -2036
gaia/agents/code/prompts/nextjs_prompt.py +40 -40
gaia/agents/code/prompts/python_prompt.py +109 -109
gaia/agents/code/schema_inference.py +365 -365
gaia/agents/code/system_prompt.py +41 -41
gaia/agents/code/tools/__init__.py +42 -42
gaia/agents/code/tools/cli_tools.py +1138 -1138
gaia/agents/code/tools/code_formatting.py +319 -319
gaia/agents/code/tools/code_tools.py +769 -769
gaia/agents/code/tools/error_fixing.py +1347 -1347
gaia/agents/code/tools/external_tools.py +180 -180
gaia/agents/code/tools/file_io.py +845 -845
gaia/agents/code/tools/prisma_tools.py +190 -190
gaia/agents/code/tools/project_management.py +1016 -1016
gaia/agents/code/tools/testing.py +321 -321
gaia/agents/code/tools/typescript_tools.py +122 -122
gaia/agents/code/tools/validation_parsing.py +461 -461
gaia/agents/code/tools/validation_tools.py +806 -806
gaia/agents/code/tools/web_dev_tools.py +1758 -1758
gaia/agents/code/validators/__init__.py +16 -16
gaia/agents/code/validators/antipattern_checker.py +241 -241
gaia/agents/code/validators/ast_analyzer.py +197 -197
gaia/agents/code/validators/requirements_validator.py +145 -145
gaia/agents/code/validators/syntax_validator.py +171 -171
gaia/agents/docker/__init__.py +7 -7
gaia/agents/docker/agent.py +642 -642
gaia/agents/emr/__init__.py +8 -8
gaia/agents/emr/agent.py +1506 -1506
gaia/agents/emr/cli.py +1322 -1322
gaia/agents/emr/constants.py +475 -475
gaia/agents/emr/dashboard/__init__.py +4 -4
gaia/agents/emr/dashboard/server.py +1974 -1974
gaia/agents/jira/__init__.py +11 -11
gaia/agents/jira/agent.py +894 -894
gaia/agents/jira/jql_templates.py +299 -299
gaia/agents/routing/__init__.py +7 -7
gaia/agents/routing/agent.py +567 -570
gaia/agents/routing/system_prompt.py +75 -75
gaia/agents/summarize/__init__.py +11 -0
gaia/agents/summarize/agent.py +885 -0
gaia/agents/summarize/prompts.py +129 -0
gaia/api/__init__.py +23 -23
gaia/api/agent_registry.py +238 -238
gaia/api/app.py +305 -305
gaia/api/openai_server.py +575 -575
gaia/api/schemas.py +186 -186
gaia/api/sse_handler.py +373 -373
gaia/apps/__init__.py +4 -4
gaia/apps/llm/__init__.py +6 -6
gaia/apps/llm/app.py +173 -169
gaia/apps/summarize/app.py +116 -633
gaia/apps/summarize/html_viewer.py +133 -133
gaia/apps/summarize/pdf_formatter.py +284 -284
gaia/audio/__init__.py +2 -2
gaia/audio/audio_client.py +439 -439
gaia/audio/audio_recorder.py +269 -269
gaia/audio/kokoro_tts.py +599 -599
gaia/audio/whisper_asr.py +432 -432
gaia/chat/__init__.py +16 -16
gaia/chat/app.py +430 -430
gaia/chat/prompts.py +522 -522
gaia/chat/sdk.py +1228 -1225
gaia/cli.py +5481 -5632
gaia/database/__init__.py +10 -10
gaia/database/agent.py +176 -176
gaia/database/mixin.py +290 -290
gaia/database/testing.py +64 -64
gaia/eval/batch_experiment.py +2332 -2332
gaia/eval/claude.py +542 -542
gaia/eval/config.py +37 -37
gaia/eval/email_generator.py +512 -512
gaia/eval/eval.py +3179 -3179
gaia/eval/groundtruth.py +1130 -1130
gaia/eval/transcript_generator.py +582 -582
gaia/eval/webapp/README.md +167 -167
gaia/eval/webapp/package-lock.json +875 -875
gaia/eval/webapp/package.json +20 -20
gaia/eval/webapp/public/app.js +3402 -3402
gaia/eval/webapp/public/index.html +87 -87
gaia/eval/webapp/public/styles.css +3661 -3661
gaia/eval/webapp/server.js +415 -415
gaia/eval/webapp/test-setup.js +72 -72
gaia/llm/__init__.py +9 -2
gaia/llm/base_client.py +60 -0
gaia/llm/exceptions.py +12 -0
gaia/llm/factory.py +70 -0
gaia/llm/lemonade_client.py +3236 -3221
gaia/llm/lemonade_manager.py +294 -294
gaia/llm/providers/__init__.py +9 -0
gaia/llm/providers/claude.py +108 -0
gaia/llm/providers/lemonade.py +120 -0
gaia/llm/providers/openai_provider.py +79 -0
gaia/llm/vlm_client.py +382 -382
gaia/logger.py +189 -189
gaia/mcp/agent_mcp_server.py +245 -245
gaia/mcp/blender_mcp_client.py +138 -138
gaia/mcp/blender_mcp_server.py +648 -648
gaia/mcp/context7_cache.py +332 -332
gaia/mcp/external_services.py +518 -518
gaia/mcp/mcp_bridge.py +811 -550
gaia/mcp/servers/__init__.py +6 -6
gaia/mcp/servers/docker_mcp.py +83 -83
gaia/perf_analysis.py +361 -0
gaia/rag/__init__.py +10 -10
gaia/rag/app.py +293 -293
gaia/rag/demo.py +304 -304
gaia/rag/pdf_utils.py +235 -235
gaia/rag/sdk.py +2194 -2194
gaia/security.py +163 -163
gaia/talk/app.py +289 -289
gaia/talk/sdk.py +538 -538
gaia/testing/__init__.py +87 -87
gaia/testing/assertions.py +330 -330
gaia/testing/fixtures.py +333 -333
gaia/testing/mocks.py +493 -493
gaia/util.py +46 -46
gaia/utils/__init__.py +33 -33
gaia/utils/file_watcher.py +675 -675
gaia/utils/parsing.py +223 -223
gaia/version.py +100 -100
amd_gaia-0.15.0.dist-info/RECORD +0 -168
gaia/agents/code/app.py +0 -266
gaia/llm/llm_client.py +0 -723
{amd_gaia-0.15.0.dist-info → amd_gaia-0.15.1.dist-info}/WHEEL +0 -0
{amd_gaia-0.15.0.dist-info → amd_gaia-0.15.1.dist-info}/top_level.txt +0 -0

gaia/agents/emr/cli.py CHANGED

@@ -1,1322 +1,1322 @@
-# Copyright(C) 2025-2026 Advanced Micro Devices, Inc. All rights reserved.
-# SPDX-License-Identifier: MIT
-"""CLI for Medical Intake Agent."""
-import argparse
-import logging
-import sys
-from pathlib import Path
-from rich.console import Console
-from rich.panel import Panel
-from rich.table import Table
-from gaia.agents.emr.agent import MedicalIntakeAgent
-logger = logging.getLogger(__name__)
-console = Console()
-def _print_header(watch_dir: str, db_path: str):
-    """Print a styled header for the CLI."""
-    console.print()
-    console.print(
-        Panel.fit(
-            "[bold cyan]Medical Intake Agent[/bold cyan]\n"
-            "[dim]Automatic Patient Form Processing[/dim]",
-            border_style="cyan",
-        )
-    )
-    # Status table
-    table = Table(show_header=False, box=None, padding=(0, 2))
-    table.add_column(style="dim")
-    table.add_column()
-    table.add_row("📁 Watch folder:", watch_dir)
-    table.add_row("💾 Database:", db_path)
-    console.print(table)
-    console.print()
-    # Commands help
-    console.print("[dim]Commands:[/dim]")
-    console.print("  [cyan]stats[/cyan]      Show processing statistics")
-    console.print("  [cyan]quit[/cyan]       Stop and exit")
-    console.print("  [dim]Or type questions about patients[/dim]")
-    console.print()
-def _print_prompt():
-    """Print the input prompt with visual separators."""
-    console.print("─" * 80, style="dim")
-    console.print("> ", end="", style="bold green")
-    sys.stdout.flush()  # Ensure prompt is displayed before input() blocks
-def cmd_watch(args):
-    """Start watching directory for intake forms."""
-    _print_header(args.watch_dir, args.db)
-    console.print("[dim]Starting agent...[/dim]")
-    agent = MedicalIntakeAgent(
-        watch_dir=args.watch_dir,
-        db_path=args.db,
-        vlm_model=args.vlm_model,
-    )
-    console.print("[green]✓ Ready![/green] Drop intake forms to process them.\n")
-    sys.stdout.flush()  # Ensure Ready message appears before prompt
-    try:
-        while True:
-            try:
-                _print_prompt()
-                user_input = input().strip()
-            except EOFError:
-                break
-            if not user_input:
-                continue
-            if user_input.lower() in ("quit", "exit", "q"):
-                break
-            console.print("─" * 80, style="dim")
-            if user_input.lower() == "stats":
-                cmd_stats_inline(agent)
-            else:
-                # Process the query
-                agent.process_query(user_input)
-            print()
-    except KeyboardInterrupt:
-        print()
-    finally:
-        console.print("[dim]Stopping agent...[/dim]")
-        agent.stop()
-        console.print("[green]✓ Stopped[/green]")
-def cmd_stats_inline(agent):
-    """Show stats inline during watch mode."""
-    try:
-        stats = agent.get_stats()
-        _print_stats_table(stats)
-    except Exception as e:
-        console.print(f"[red]Error getting stats: {e}[/red]")
-def cmd_process(args):
-    """Process a single intake form file."""
-    if not Path(args.file).exists():
-        console.print(f"[red]Error: File not found: {args.file}[/red]")
-        return 1
-    console.print(f"[dim]Processing: {args.file}[/dim]")
-    agent = MedicalIntakeAgent(
-        watch_dir=args.watch_dir,
-        db_path=args.db,
-        vlm_model=args.vlm_model,
-        auto_start_watching=False,
-    )
-    try:
-        # pylint: disable=protected-access
-        patient_data = agent._process_intake_form(args.file)
-        if patient_data:
-            # Agent already prints success and patient details
-            return 0
-        else:
-            console.print(f"[red]Failed to process: {args.file}[/red]")
-            return 1
-    finally:
-        agent.stop()
-def cmd_query(args):
-    """Query patient database."""
-    agent = MedicalIntakeAgent(
-        watch_dir=args.watch_dir,
-        db_path=args.db,
-        auto_start_watching=False,
-    )
-    try:
-        agent.process_query(args.question)
-        return 0
-    finally:
-        agent.stop()
-def _print_stats_table(stats: dict):
-    """Print statistics using Rich formatting."""
-    console.print()
-    # Time savings highlight
-    time_table = Table(show_header=False, box=None, padding=(0, 1))
-    time_table.add_column(style="bold green")
-    time_table.add_column(style="green")
-    time_table.add_row(
-        f"⏱️  {stats['time_saved_minutes']} min saved",
-        f"({stats['time_saved_percent']} faster)",
-    )
-    console.print(Panel(time_table, title="Time Savings", border_style="green"))
-    # Main stats grid
-    grid = Table.grid(expand=True, padding=(0, 2))
-    grid.add_column()
-    grid.add_column()
-    # Patients table
-    patients = Table(show_header=False, box=None)
-    patients.add_column(style="dim")
-    patients.add_column(style="bold")
-    patients.add_row("Total", str(stats["total_patients"]))
-    patients.add_row("New", str(stats["new_patients"]))
-    patients.add_row("Returning", str(stats["returning_patients"]))
-    patients.add_row("Today", str(stats["processed_today"]))
-    # Processing table
-    processing = Table(show_header=False, box=None)
-    processing.add_column(style="dim")
-    processing.add_column(style="bold")
-    processing.add_row("Processed", str(stats["files_processed"]))
-    processing.add_row("Success", str(stats["extraction_success"]))
-    processing.add_row("Failed", str(stats["extraction_failed"]))
-    processing.add_row("Rate", stats["success_rate"])
-    grid.add_row(
-        Panel(patients, title="👥 Patients", border_style="cyan"),
-        Panel(processing, title="📋 Processing", border_style="cyan"),
-    )
-    console.print(grid)
-    # Alerts (if any)
-    if stats.get("unacknowledged_alerts", 0) > 0:
-        console.print(
-            f"[bold red]🚨 {stats['unacknowledged_alerts']} unacknowledged alert(s)[/bold red]"
-        )
-    console.print()
-def cmd_stats(args):
-    """Show processing statistics."""
-    agent = MedicalIntakeAgent(
-        watch_dir=args.watch_dir,
-        db_path=args.db,
-        auto_start_watching=False,
-        silent_mode=True,
-    )
-    try:
-        stats = agent.get_stats()
-        _print_stats_table(stats)
-        return 0
-    finally:
-        agent.stop()
-def cmd_reset(args):
-    """Reset by deleting the database file."""
-    import os
-    from rich.prompt import Confirm
-    db_path = Path(args.db)
-    # Check if database exists
-    if not db_path.exists():
-        console.print("[dim]Database file does not exist. Nothing to reset.[/dim]")
-        return 0
-    # Get stats before deletion to show what will be deleted
-    total_patients = 0
-    agent = None
-    try:
-        agent = MedicalIntakeAgent(
-            watch_dir=args.watch_dir,
-            db_path=args.db,
-            auto_start_watching=False,
-            silent_mode=True,
-        )
-        stats = agent.get_stats()
-        total_patients = stats.get("total_patients", 0)
-    except Exception:
-        pass  # If we can't read stats, proceed anyway
-    finally:
-        if agent:
-            agent.stop()
-    # Confirmation prompt unless --force is used
-    if not args.force:
-        console.print()
-        console.print(
-            "[bold yellow]⚠️  WARNING:[/bold yellow] This will permanently delete:"
-        )
-        if total_patients > 0:
-            console.print(f"  • {total_patients} patient record(s)")
-            console.print("  • All associated alerts and intake sessions")
-        console.print(f"  • Database file: {db_path}")
-        console.print()
-        if not Confirm.ask("[bold red]Are you sure you want to continue?[/bold red]"):
-            console.print("[dim]Cancelled.[/dim]")
-            return 0
-    # Delete the database file
-    try:
-        os.remove(db_path)
-        console.print()
-        console.print("[bold green]✓ Database deleted successfully[/bold green]")
-        console.print(f"  Removed: {db_path}")
-        console.print()
-        console.print(
-            "[dim]A fresh database will be created when you next run the agent.[/dim]"
-        )
-        return 0
-    except Exception as e:
-        console.print(f"[red]Error deleting database: {e}[/red]")
-        return 1
-def cmd_init(args):
-    """Initialize EMR agent by downloading and loading required models."""
-    import time
-    from gaia.llm.lemonade_client import LemonadeClient
-    console.print()
-    console.print(
-        Panel.fit(
-            "[bold cyan]EMR Agent Setup[/bold cyan]\n"
-            "[dim]Downloading and loading required models[/dim]",
-            border_style="cyan",
-        )
-    )
-    console.print()
-    # Required models for EMR agent
-    vlm_model = args.vlm_model  # Default: Qwen3-VL-4B-Instruct-GGUF
-    llm_model = "Qwen3-Coder-30B-A3B-Instruct-GGUF"  # For chat/query processing
-    embed_model = "nomic-embed-text-v2-moe-GGUF"  # For similarity search
-    REQUIRED_CONTEXT_SIZE = 32768
-    # Step 1: Check Lemonade server and context size
-    console.print("[bold]Step 1:[/bold] Checking Lemonade server...")
-    try:
-        client = LemonadeClient(model=vlm_model)
-        health = client.health_check()
-        if health.get("status") == "ok":
-            console.print("  [green]✓[/green] Lemonade server is running")
-            # Check context size
-            context_size = health.get("context_size", 0)
-            if context_size >= REQUIRED_CONTEXT_SIZE:
-                console.print(
-                    f"  [green]✓[/green] Context size: [cyan]{context_size:,}[/cyan] tokens (recommended: {REQUIRED_CONTEXT_SIZE:,})"
-                )
-            elif context_size > 0:
-                console.print(
-                    f"  [yellow]⚠[/yellow] Context size: [yellow]{context_size:,}[/yellow] tokens"
-                )
-                console.print(
-                    f"    [yellow]Warning:[/yellow] Context size should be at least [cyan]{REQUIRED_CONTEXT_SIZE:,}[/cyan] for reliable form processing"
-                )
-                console.print(
-                    "    [dim]To fix: Right-click Lemonade tray → Settings → Context Size → 32768[/dim]"
-                )
-            else:
-                console.print(
-                    "  [dim]Context size: Not reported (will check after model load)[/dim]"
-                )
-        else:
-            console.print("  [red]✗[/red] Lemonade server not responding")
-            console.print()
-            console.print("[yellow]Please start Lemonade server first:[/yellow]")
-            console.print("  1. Open Lemonade from the system tray")
-            console.print("  2. Or run: [cyan]lemonade-server[/cyan]")
-            return 1
-    except Exception as e:
-        console.print(f"  [red]✗[/red] Cannot connect to Lemonade: {e}")
-        console.print()
-        console.print("[yellow]Please start Lemonade server first:[/yellow]")
-        console.print("  1. Open Lemonade from the system tray")
-        console.print("  2. Or run: [cyan]lemonade-server[/cyan]")
-        return 1
-    # Step 2: Check required models
-    console.print()
-    console.print("[bold]Step 2:[/bold] Checking required models...")
-    try:
-        models_response = client.list_models()
-        available_models = models_response.get("data", [])
-        downloaded_model_ids = [m.get("id", "") for m in available_models]
-        # Check each required model
-        required_models = [
-            ("VLM", vlm_model, "Form extraction"),
-            ("LLM", llm_model, "Chat/query processing"),
-            ("Embedding", embed_model, "Similarity search"),
-        ]
-        models_to_download = []
-        for model_type, model_name, _purpose in required_models:
-            is_downloaded = model_name in downloaded_model_ids
-            if is_downloaded:
-                console.print(
-                    f"  [green]✓[/green] {model_type}: [cyan]{model_name}[/cyan]"
-                )
-            else:
-                console.print(
-                    f"  [dim]○[/dim] {model_type}: [cyan]{model_name}[/cyan] [dim](not downloaded)[/dim]"
-                )
-                models_to_download.append((model_type, model_name))
-        if models_to_download:
-            console.print()
-            console.print(
-                f"  [yellow]⚠️  {len(models_to_download)} model(s) need to be downloaded[/yellow]"
-            )
-    except Exception as e:
-        console.print(f"  [red]✗[/red] Failed to check models: {e}")
-        return 1
-    # Step 3: Load all required models
-    console.print()
-    console.print("[bold]Step 3:[/bold] Loading required models...")
-    console.print("  [dim]Loading models into memory for fast inference...[/dim]")
-    console.print()
-    models_loaded = {}
-    # Load VLM model first (most important for form processing)
-    for model_type, model_name in [
-        ("VLM", vlm_model),
-        ("LLM", llm_model),
-        ("Embedding", embed_model),
-    ]:
-        console.print(f"  Loading {model_type}: [cyan]{model_name}[/cyan]...")
-        try:
-            start_time = time.time()
-            client.load_model(model_name, timeout=1800, auto_download=True)
-            elapsed = time.time() - start_time
-            models_loaded[model_type] = True
-            console.print(f"  [green]✓[/green] {model_type} loaded ({elapsed:.1f}s)")
-        except Exception as e:
-            error_msg = str(e)
-            models_loaded[model_type] = False
-            # Check for common errors
-            if "being used by another process" in error_msg:
-                console.print(
-                    f"  [yellow]![/yellow] {model_type}: File locked, try again later"
-                )
-            elif (
-                "not found" in error_msg.lower()
-                or "does not exist" in error_msg.lower()
-            ):
-                console.print(
-                    f"  [yellow]![/yellow] {model_type}: Model not available in registry"
-                )
-            else:
-                console.print(f"  [yellow]![/yellow] {model_type}: {error_msg[:50]}...")
-    # Check if critical models loaded
-    if not models_loaded.get("VLM"):
-        console.print()
-        console.print(
-            "[red]✗ VLM model failed to load - form processing will not work[/red]"
-        )
-        return 1
-    # Clear VLM context to ensure fresh memory allocation
-    console.print()
-    console.print("  [dim]Clearing VLM context for clean memory...[/dim]")
-    try:
-        client.unload_model()
-        client.load_model(vlm_model, timeout=300, auto_download=True)
-        console.print("  [green]✓[/green] VLM context cleared")
-    except Exception as e:
-        console.print(f"  [dim]Context clear skipped: {e}[/dim]")
-    # Step 4: Verify models and check context size
-    console.print()
-    console.print("[bold]Step 4:[/bold] Verifying models are ready...")
-    vlm_ready = False
-    llm_ready = False
-    embed_ready = False
-    final_context_size = 0
-    try:
-        # Check health for context size
-        health = client.health_check()
-        final_context_size = health.get("context_size", 0)
-        # Check each model
-        vlm_ready = client.check_model_loaded(vlm_model)
-        llm_ready = client.check_model_loaded(llm_model)
-        embed_ready = client.check_model_loaded(embed_model)
-        if vlm_ready:
-            console.print("  [green]✓[/green] VLM: Ready for form extraction")
-        else:
-            console.print("  [yellow]![/yellow] VLM: Will load on first use")
-        if llm_ready:
-            console.print("  [green]✓[/green] LLM: Ready for chat queries")
-        else:
-            console.print("  [dim]○[/dim] LLM: Will load on first use")
-        if embed_ready:
-            console.print("  [green]✓[/green] Embedding: Ready for search")
-        else:
-            console.print("  [dim]○[/dim] Embedding: Will load on first use")
-        # Report context size
-        if final_context_size >= REQUIRED_CONTEXT_SIZE:
-            console.print(
-                f"  [green]✓[/green] Context size: [cyan]{final_context_size:,}[/cyan] tokens"
-            )
-        elif final_context_size > 0:
-            console.print(
-                f"  [yellow]⚠[/yellow] Context size: [yellow]{final_context_size:,}[/yellow] tokens (need {REQUIRED_CONTEXT_SIZE:,})"
-            )
-    except Exception as e:
-        console.print(f"  [yellow]![/yellow] Could not verify: {e}")
-    # Step 5: Show all downloaded and loaded models
-    console.print()
-    console.print("[bold]Step 5:[/bold] Model inventory...")
-    try:
-        models_response = client.list_models()
-        all_models = models_response.get("data", [])
-        # Categorize models
-        vlm_models = []
-        llm_models = []
-        embed_models = []
-        for m in all_models:
-            model_id = m.get("id", "")
-            model_lower = model_id.lower()
-            if "vl" in model_lower or "vision" in model_lower or "vlm" in model_lower:
-                vlm_models.append(model_id)
-            elif (
-                "embed" in model_lower
-                or "bge" in model_lower
-                or "e5" in model_lower
-                or "nomic" in model_lower
-            ):
-                embed_models.append(model_id)
-            else:
-                llm_models.append(model_id)
-        # Show categorized models
-        if vlm_models:
-            console.print(
-                f"  [cyan]VLM Models:[/cyan] {', '.join(vlm_models[:3])}"
-                + (f" (+{len(vlm_models)-3} more)" if len(vlm_models) > 3 else "")
-            )
-        if llm_models:
-            console.print(
-                f"  [cyan]LLM Models:[/cyan] {', '.join(llm_models[:3])}"
-                + (f" (+{len(llm_models)-3} more)" if len(llm_models) > 3 else "")
-            )
-        if embed_models:
-            console.print(
-                f"  [cyan]Embedding Models:[/cyan] {', '.join(embed_models[:3])}"
-                + (f" (+{len(embed_models)-3} more)" if len(embed_models) > 3 else "")
-            )
-        console.print(f"  [dim]Total models available: {len(all_models)}[/dim]")
-    except Exception as e:
-        console.print(f"  [dim]Could not list models: {e}[/dim]")
-    # Success summary
-    console.print()
-    # Build model status lines
-    model_status_lines = []
-    # VLM status
-    if vlm_ready:
-        model_status_lines.append(
-            f"[green]✓[/green] VLM: [cyan]{vlm_model}[/cyan] - Ready"
-        )
-    else:
-        model_status_lines.append(
-            f"[yellow]![/yellow] VLM: [cyan]{vlm_model}[/cyan] - Will load on first use"
-        )
-    # LLM status
-    if llm_ready:
-        model_status_lines.append(
-            f"[green]✓[/green] LLM: [cyan]{llm_model}[/cyan] - Ready"
-        )
-    else:
-        model_status_lines.append(
-            f"[dim]○[/dim] LLM: [cyan]{llm_model}[/cyan] - Will load on first use"
-        )
-    # Embedding status
-    if embed_ready:
-        model_status_lines.append(
-            f"[green]✓[/green] Embedding: [cyan]{embed_model}[/cyan] - Ready"
-        )
-    else:
-        model_status_lines.append(
-            f"[dim]○[/dim] Embedding: [cyan]{embed_model}[/cyan] - Will load on first use"
-        )
-    # Context size status
-    if final_context_size >= REQUIRED_CONTEXT_SIZE:
-        model_status_lines.append(
-            f"[green]✓[/green] Context size: {final_context_size:,} tokens"
-        )
-    elif final_context_size > 0:
-        model_status_lines.append(
-            f"[yellow]⚠[/yellow] Context size: {final_context_size:,} tokens (need {REQUIRED_CONTEXT_SIZE:,})"
-        )
-    # Count ready models
-    ready_count = sum([vlm_ready, llm_ready, embed_ready])
-    console.print(
-        Panel.fit(
-            f"[bold green]✓ EMR Agent initialized ({ready_count}/3 models ready)[/bold green]\n\n"
-            + "\n".join(model_status_lines)
-            + "\n\n"
-            "[dim]You can now run:[/dim]\n"
-            "  [cyan]gaia-emr dashboard[/cyan]  - Start the web dashboard\n"
-            "  [cyan]gaia-emr watch[/cyan]      - Watch folder for intake forms\n"
-            "  [cyan]gaia-emr process <file>[/cyan] - Process a single file",
-            border_style="green",
-        )
-    )
-    console.print()
-    # Context size warning if needed
-    if 0 < final_context_size < REQUIRED_CONTEXT_SIZE:
-        console.print(
-            Panel.fit(
-                "[yellow]⚠️  Context Size Warning[/yellow]\n\n"
-                f"Current context size ({final_context_size:,}) may be too small for processing intake forms.\n"
-                "Large images can require 4,000-8,000+ tokens.\n\n"
-                "[bold]To fix:[/bold]\n"
-                "  1. Right-click Lemonade tray icon → Settings\n"
-                "  2. Set Context Size to [cyan]32768[/cyan]\n"
-                "  3. Click Apply and restart the model",
-                border_style="yellow",
-            )
-        )
-        console.print()
-    return 0
-def cmd_test(args):
-    """Test VLM extraction pipeline on a single file."""
-    import io
-    import json
-    import time
-    from PIL import Image
-    from gaia.llm.vlm_client import VLMClient
-    file_path = Path(args.file)
-    if not file_path.exists():
-        console.print(f"[red]Error: File not found: {file_path}[/red]")
-        return 1
-    console.print()
-    console.print(
-        Panel.fit(
-            "[bold cyan]EMR Agent - VLM Pipeline Test[/bold cyan]\n"
-            f"[dim]Testing extraction on: {file_path.name}[/dim]",
-            border_style="cyan",
-        )
-    )
-    console.print()
-    # Step 1: Read and analyze file
-    console.print("[bold]Step 1:[/bold] Reading file...")
-    try:
-        raw_bytes = file_path.read_bytes()
-        file_size_kb = len(raw_bytes) / 1024
-        console.print(f"  File size: {file_size_kb:.1f} KB")
-        # Get image dimensions
-        img = Image.open(io.BytesIO(raw_bytes))
-        orig_width, orig_height = img.size
-        console.print(f"  Dimensions: {orig_width}x{orig_height} pixels")
-        # Auto-rotate based on EXIF orientation
-        try:
-            from PIL import ExifTags
-            exif = img._getexif()  # pylint: disable=protected-access
-            if exif:
-                for tag, value in exif.items():
-                    if ExifTags.TAGS.get(tag) == "Orientation":
-                        if value == 3:
-                            img = img.rotate(180, expand=True)
-                            console.print("  [dim]Auto-rotated 180°[/dim]")
-                        elif value == 6:
-                            img = img.rotate(270, expand=True)
-                            console.print("  [dim]Auto-rotated 90° CW[/dim]")
-                        elif value == 8:
-                            img = img.rotate(90, expand=True)
-                            console.print("  [dim]Auto-rotated 90° CCW[/dim]")
-                        orig_width, orig_height = img.size
-                        break
-        except Exception:
-            pass  # No EXIF or rotation info
-    except Exception as e:
-        console.print(f"  [red]✗[/red] Failed to read file: {e}")
-        return 1
-    # Step 2: Optimize image (same as agent)
-    console.print()
-    console.print("[bold]Step 2:[/bold] Optimizing image...")
-    max_dimension = args.max_dimension
-    jpeg_quality = args.jpeg_quality
-    try:
-        if orig_width > max_dimension or orig_height > max_dimension:
-            scale = min(max_dimension / orig_width, max_dimension / orig_height)
-            new_width = int(orig_width * scale)
-            new_height = int(orig_height * scale)
-            img = img.resize((new_width, new_height), Image.Resampling.LANCZOS)
-            console.print(
-                f"  Resized: {orig_width}x{orig_height} → {new_width}x{new_height}"
-            )
-        else:
-            new_width, new_height = orig_width, orig_height
-            console.print(f"  No resize needed (under {max_dimension}px)")
-        # Convert to RGB and JPEG
-        if img.mode in ("RGBA", "P"):
-            img = img.convert("RGB")
-        output = io.BytesIO()
-        img.save(output, format="JPEG", quality=jpeg_quality, optimize=True)
-        image_bytes = output.getvalue()
-        opt_size_kb = len(image_bytes) / 1024
-        reduction = (1 - opt_size_kb / file_size_kb) * 100
-        console.print(
-            f"  Optimized: {file_size_kb:.0f}KB → {opt_size_kb:.0f}KB ({reduction:.0f}% smaller)"
-        )
-        # Estimate image tokens (rough: ~1 token per 14x14 pixel patch)
-        est_img_tokens = (new_width // 14) * (new_height // 14)
-        console.print(f"  Est. image tokens: ~{est_img_tokens:,}")
-    except Exception as e:
-        console.print(f"  [red]✗[/red] Failed to optimize: {e}")
-        return 1
-    # Step 3: Initialize VLM
-    console.print()
-    console.print("[bold]Step 3:[/bold] Initializing VLM...")
-    try:
-        vlm = VLMClient(vlm_model=args.vlm_model)
-        # Clear context if requested (unload and reload model)
-        if getattr(args, "clear_context", False):
-            console.print("  [dim]Clearing VLM context (unload + reload)...[/dim]")
-            try:
-                vlm.client.unload_model()
-                vlm.client.load_model(args.vlm_model, timeout=300, auto_download=True)
-                console.print("  [green]✓[/green] Context cleared")
-            except Exception as e:
-                console.print(f"  [yellow]⚠[/yellow] Could not clear context: {e}")
-        console.print(f"  [green]✓[/green] VLM ready: [cyan]{vlm.vlm_model}[/cyan]")
-    except Exception as e:
-        console.print(f"  [red]✗[/red] Failed to initialize VLM: {e}")
-        return 1
-    # Step 4: Extract data with auto-retry on memory errors
-    console.print()
-    console.print("[bold]Step 4:[/bold] Extracting patient data...")
-    extraction_prompt = """Extract ALL patient information from this medical intake form.
-Return a JSON object with these fields (use null for missing/unclear):
-{
-    "form_date": "YYYY-MM-DD (date form was filled, today's date)",
-    "first_name": "...",
-    "last_name": "...",
-    "date_of_birth": "YYYY-MM-DD",
-    "age": "patient's age if listed",
-    "gender": "Male/Female/Other",
-    "preferred_pronouns": "he/him, she/her, they/them if listed",
-    "ssn": "XXX-XX-XXXX (social security number)",
-    "marital_status": "Single/Married/Divorced/Widowed/Partnered",
-    "spouse_name": "spouse's name if listed",
-    "phone": "home phone number",
-    "mobile_phone": "cell/mobile phone number",
-    "work_phone": "work phone number",
-    "email": "...",
-    "address": "street address",
-    "city": "...",
-    "state": "...",
-    "zip_code": "...",
-    "preferred_language": "English/Spanish/etc if listed",
-    "race": "if listed",
-    "ethnicity": "if listed",
-    "contact_preference": "preferred contact method if listed",
-    "emergency_contact_name": "name of emergency contact person",
-    "emergency_contact_relationship": "relationship to patient (e.g. Mom, Spouse, Friend)",
-    "emergency_contact_phone": "emergency contact's phone number",
-    "referring_physician": "name of referring physician/doctor",
-    "referring_physician_phone": "phone number next to referring physician",
-    "primary_care_physician": "PCP name if different from referring",
-    "preferred_pharmacy": "pharmacy name if listed",
-    "employment_status": "Employed/Self Employed/Unemployed/Retired/Student/Disabled/Military",
-    "occupation": "job title if listed",
-    "employer": "employer/company name",
-    "employer_address": "employer address if listed",
-    "insurance_provider": "insurance company name",
-    "insurance_id": "policy number",
-    "insurance_group_number": "group number",
-    "insured_name": "name of insured person (may differ from patient)",
-    "insured_dob": "YYYY-MM-DD",
-    "insurance_phone": "insurance contact number",
-    "billing_address": "billing address if different from home",
-    "guarantor_name": "person responsible for payment if listed",
-    "reason_for_visit": "chief complaint or reason for visit",
-    "date_of_injury": "YYYY-MM-DD (date of injury or onset of symptoms)",
-    "pain_location": "where pain is located if listed",
-    "pain_onset": "when pain began (e.g. three months ago)",
-    "pain_cause": "what caused the pain/condition",
-    "pain_progression": "Improved/Worsened/Stayed the same",
-    "work_related_injury": "Yes/No",
-    "car_accident": "Yes/No",
-    "medical_conditions": "existing medical conditions",
-    "allergies": "known allergies",
-    "medications": "current medications",
-    "signature_date": "YYYY-MM-DD (date signed)"
-}
-IMPORTANT: Return ONLY the JSON object, no other text."""
-    # Retry loop with progressively smaller images on memory errors
-    max_retries = 3
-    current_img = img
-    current_bytes = image_bytes
-    current_width, current_height = new_width, new_height
-    current_size_kb = opt_size_kb
-    for attempt in range(max_retries):
-        est_img_tokens = (current_width // 14) * (current_height // 14)
-        console.print(
-            f"  Image: {current_width}x{current_height}, {current_size_kb:.0f}KB (~{est_img_tokens:,} tokens)"
-        )
-        if attempt == 0:
-            console.print("  [dim]This may take 30-60 seconds...[/dim]")
-        else:
-            console.print(
-                f"  [dim]Retry {attempt}/{max_retries-1} with smaller image...[/dim]"
-            )
-        try:
-            start_time = time.time()
-            raw_text = vlm.extract_from_image(
-                image_bytes=current_bytes,
-                prompt=extraction_prompt,
-            )
-            extraction_time = time.time() - start_time
-            # Check for memory-related errors
-            if (
-                "failed to process image" in raw_text
-                or "memory slot" in raw_text.lower()
-            ):
-                if attempt < max_retries - 1:
-                    console.print(
-                        "  [yellow]⚠[/yellow] Memory error, reducing image size..."
-                    )
-                    # Reduce image to 75% of current size
-                    scale = 0.75
-                    current_width = int(current_width * scale)
-                    current_height = int(current_height * scale)
-                    current_img = current_img.resize(
-                        (current_width, current_height), Image.Resampling.LANCZOS
-                    )
-                    output = io.BytesIO()
-                    current_img.save(
-                        output, format="JPEG", quality=jpeg_quality, optimize=True
-                    )
-                    current_bytes = output.getvalue()
-                    current_size_kb = len(current_bytes) / 1024
-                    continue
-                else:
-                    console.print(f"  [red]✗[/red] {raw_text}")
-                    console.print()
-                    console.print("[yellow]Suggestions:[/yellow]")
-                    console.print("  1. Try with smaller image: --max-dimension 640")
-                    console.print("  2. Restart Lemonade Server to clear memory")
-                    console.print("  3. Reload the VLM model in Lemonade")
-                    return 1
-            if raw_text.startswith("[VLM extraction failed:"):
-                console.print(f"  [red]✗[/red] {raw_text}")
-                return 1
-            # Success!
-            console.print(
-                f"  [green]✓[/green] Extraction complete ({len(raw_text)} chars, {extraction_time:.1f}s)"
-            )
-            # Estimate tokens/sec (output tokens only)
-            est_output_tokens = len(raw_text) / 4
-            tps = est_output_tokens / extraction_time if extraction_time > 0 else 0
-            console.print(
-                f"  Output: ~{est_output_tokens:.0f} tokens at ~{tps:.1f} TPS"
-            )
-            # Total throughput including prompt processing
-            total_tokens = (
-                est_img_tokens + 200 + est_output_tokens
-            )  # img + prompt + output
-            total_tps = total_tokens / extraction_time if extraction_time > 0 else 0
-            console.print(
-                f"  Total throughput: ~{total_tps:.0f} TPS (incl. {est_img_tokens:,} image tokens)"
-            )
-            # Update dimensions for final report
-            new_width, new_height = current_width, current_height
-            break
-        except Exception as e:
-            console.print(f"  [red]✗[/red] Extraction failed: {e}")
-            return 1
-    else:
-        # All retries exhausted
-        console.print("  [red]✗[/red] All retries failed")
-        return 1
-    # Step 5: Parse JSON
-    console.print()
-    console.print("[bold]Step 5:[/bold] Parsing JSON...")
-    try:
-        # Try direct parse
-        patient_data = json.loads(raw_text)
-        console.print("  [green]✓[/green] JSON parsed successfully")
-    except json.JSONDecodeError:
-        # Try to find JSON in text
-        try:
-            start = raw_text.find("{")
-            end = raw_text.rfind("}") + 1
-            if start >= 0 and end > start:
-                patient_data = json.loads(raw_text[start:end])
-                console.print("  [green]✓[/green] JSON extracted from response")
-            else:
-                console.print("  [red]✗[/red] No JSON found in response")
-                console.print()
-                console.print("[bold]Raw VLM Output:[/bold]")
-                console.print(raw_text[:500])
-                return 1
-        except json.JSONDecodeError as e:
-            console.print(f"  [red]✗[/red] JSON parse failed: {e}")
-            return 1
-    # Display results
-    console.print()
-    console.print(
-        Panel.fit(
-            "[bold green]✓ Extraction Successful[/bold green]",
-            border_style="green",
-        )
-    )
-    # Show extracted fields
-    console.print()
-    console.print("[bold]Extracted Fields:[/bold]")
-    fields_found = 0
-    for key, value in patient_data.items():
-        if value and value != "null":
-            fields_found += 1
-            console.print(f"  [cyan]{key}:[/cyan] {value}")
-    console.print()
-    console.print(f"[dim]Fields extracted: {fields_found}/53[/dim]")
-    console.print()
-    # Timing breakdown section
-    console.print("[bold]⏱️  TIMING BREAKDOWN[/bold]")
-    console.print("-" * 40)
-    console.print(f"   Model:              {args.vlm_model}")
-    console.print(f"   Image dimensions:   {new_width}x{new_height}")
-    console.print(f"   VLM extraction:     {extraction_time:.2f}s")
-    console.print(f"   Est. image tokens:  ~{est_img_tokens:,}")
-    console.print(f"   Est. output tokens: ~{int(est_output_tokens)}")
-    console.print(f"   Est. tokens/sec:    ~{tps:.1f} TPS")
-    console.print()
-    # Success summary
-    if patient_data.get("first_name") and patient_data.get("last_name"):
-        console.print(
-            f"   Patient: {patient_data.get('first_name', '')} {patient_data.get('last_name', '')}"
-        )
-        console.print("   [green]✓ Pipeline test PASSED[/green]")
-    else:
-        console.print("   [yellow]⚠ Missing required name fields[/yellow]")
-        console.print("   [red]✗ Pipeline test FAILED[/red]")
-    console.print()
-    return 0
def _launch_electron(url: str, delay: float = 1.5) -> bool:
    """
    Launch the Electron wrapper app to display the dashboard.

    Sleeps for ``delay`` seconds, looks for the Electron wrapper in the
    ``dashboard/electron`` folder next to this module, runs ``npm install``
    there when ``node_modules`` is missing, and then spawns
    ``npx electron .`` with the dashboard URL exported through the
    ``EMR_DASHBOARD_URL`` environment variable.

    Args:
        url: Dashboard URL handed to the Electron process.
        delay: Seconds to wait before attempting the launch.

    Returns:
        True if the Electron process was spawned, False if the wrapper's
        ``main.js`` or ``npx`` could not be found or any launch step failed.
    """
    import os
    import platform
    import shutil
    import subprocess
    import time

    time.sleep(delay)  # Wait for server to start

    # Find the Electron wrapper directory
    electron_dir = Path(__file__).parent / "dashboard" / "electron"
    main_js = electron_dir / "main.js"
    if not main_js.exists():
        logger.warning(f"Electron wrapper not found at {electron_dir}")
        return False

    # On Windows, use npm.cmd and npx.cmd
    is_windows = platform.system() == "Windows"
    npm_cmd = "npm.cmd" if is_windows else "npm"
    npx_cmd = "npx.cmd" if is_windows else "npx"

    # Check if npx/electron is available
    if not shutil.which(npx_cmd):
        logger.warning(f"{npx_cmd} not found in PATH, cannot launch Electron")
        return False

    try:
        # Check if node_modules exists, if not run npm install first
        node_modules = electron_dir / "node_modules"
        if not node_modules.exists():
            console.print("[dim]Installing Electron dependencies...[/dim]")
            subprocess.run(
                [npm_cmd, "install"],
                cwd=str(electron_dir),
                capture_output=True,
                check=True,
                shell=is_windows,  # Use shell on Windows for .cmd files
            )

        # Launch Electron with the dashboard URL
        env = os.environ.copy()
        env["EMR_DASHBOARD_URL"] = url
        subprocess.Popen(
            [npx_cmd, "electron", "."],
            cwd=str(electron_dir),
            env=env,
            stdout=subprocess.DEVNULL,
            stderr=subprocess.DEVNULL,
            shell=is_windows,  # Use shell on Windows for .cmd files
        )
        return True
    except subprocess.CalledProcessError as e:
        # Only the checked `npm install` call can raise this. Its output was
        # captured rather than shown, so log stderr here; otherwise the
        # reason for the failed install would be lost.
        logger.warning(f"Failed to launch Electron: {e}")
        npm_stderr = (e.stderr or b"").decode(errors="replace").strip()
        if npm_stderr:
            logger.warning(f"npm install output: {npm_stderr}")
        return False
    except Exception as e:
        # Best-effort launch: the caller falls back to the browser on False.
        logger.warning(f"Failed to launch Electron: {e}")
        return False
def cmd_dashboard(args):
    """Start the web dashboard and, unless disabled, open a viewer for it.

    Reads ``args.port``, ``args.host``, ``args.watch_dir`` and ``args.db``.
    The optional ``args.no_open`` flag suppresses opening a viewer, and
    ``args.browser`` selects the web browser instead of the Electron app.
    The viewer is opened from a daemon thread so that the blocking
    ``run_dashboard`` call can start the server in the meantime.

    Returns:
        0 when ``run_dashboard`` returns or Ctrl+C is pressed, 1 when an
        ImportError is raised (reported as missing dashboard dependencies).
    """
    import threading
    import time
    import webbrowser

    def open_browser(url: str, delay: float = 1.5):
        """Open browser after a short delay to allow server to start."""
        time.sleep(delay)
        webbrowser.open(url)

    def open_electron_or_browser(url: str, use_browser: bool, delay: float = 1.5):
        """Open Electron app, falling back to browser if needed."""
        if use_browser:
            open_browser(url, delay)
        elif not _launch_electron(url, delay):
            console.print(
                "[yellow]Electron not available, opening in browser instead...[/yellow]"
            )
            # _launch_electron sleeps for `delay` before it does anything
            # else, so the wait has already happened; do not wait twice.
            open_browser(url, 0)

    try:
        from gaia.agents.emr.dashboard.server import run_dashboard

        console.print()
        console.print(
            Panel.fit(
                "[bold cyan]EMR Dashboard[/bold cyan]\n"
                "[dim]Real-time Patient Processing Monitor[/dim]",
                border_style="cyan",
            )
        )

        url = f"http://localhost:{args.port}"
        table = Table(show_header=False, box=None, padding=(0, 2))
        table.add_column(style="dim")
        table.add_column()
        table.add_row("📁 Watch folder:", args.watch_dir)
        table.add_row("💾 Database:", args.db)
        table.add_row("🌐 URL:", f"[bold cyan]{url}[/bold cyan]")
        console.print(table)
        console.print("\n[dim]Press Ctrl+C to stop[/dim]\n")

        # Auto-open unless --no-open flag is set
        if not getattr(args, "no_open", False):
            use_browser = getattr(args, "browser", False)
            if use_browser:
                console.print("[dim]Opening dashboard in browser...[/dim]\n")
            else:
                console.print("[dim]Opening dashboard in Electron app...[/dim]\n")
            open_thread = threading.Thread(
                target=open_electron_or_browser,
                args=(url, use_browser),
                daemon=True,
            )
            open_thread.start()

        run_dashboard(
            watch_dir=args.watch_dir,
            db_path=args.db,
            host=args.host,
            port=args.port,
        )
        # Explicit success code, consistent with the other return paths.
        return 0
    except ImportError:
        console.print("[red]Error: Dashboard dependencies not installed[/red]")
        console.print("Install with: [cyan]pip install 'amd-gaia[api]'[/cyan]")
        return 1
    except KeyboardInterrupt:
        console.print("\n[dim]Shutting down dashboard...[/dim]")
        return 0
-def _add_common_args(parser):
-    """Add common arguments to a parser."""
-    parser.add_argument(
-        "--watch-dir",
-        default="./intake_forms",
-        help="Directory to watch for intake forms (default: ./intake_forms)",
-    )
-    parser.add_argument(
-        "--db",
-        default="./data/patients.db",
-        help="Path to patient database (default: ./data/patients.db)",
-    )
-    parser.add_argument(
-        "--vlm-model",
-        default="Qwen3-VL-4B-Instruct-GGUF",
-        help="VLM model for extraction (default: Qwen3-VL-4B-Instruct-GGUF)",
-    )
-    parser.add_argument(
-        "--debug",
-        action="store_true",
-        help="Enable debug logging",
-    )
def main(argv=None):
    """Main CLI entry point.

    Builds the ``watch``, ``process``, ``query``, ``stats``, ``reset``,
    ``init``, ``test`` and ``dashboard`` subcommands, configures logging,
    and dispatches to the handler registered for the chosen subcommand.

    Args:
        argv: Optional list of argument strings to parse. When None (the
            default), argparse reads the process command line, so calling
            ``main()`` with no arguments behaves as before.

    Returns:
        0 after printing help when no subcommand is given; otherwise
        whatever the selected command handler returns.
    """
    parser = argparse.ArgumentParser(
        description="Medical Intake Agent CLI",
        formatter_class=argparse.RawDescriptionHelpFormatter,
    )
    subparsers = parser.add_subparsers(dest="command", help="Command to run")

    # Watch command
    parser_watch = subparsers.add_parser(
        "watch",
        help="Watch directory for new intake forms",
    )
    _add_common_args(parser_watch)
    parser_watch.set_defaults(func=cmd_watch)

    # Process command
    parser_process = subparsers.add_parser(
        "process",
        help="Process a single intake form",
    )
    _add_common_args(parser_process)
    parser_process.add_argument("file", help="Path to intake form file")
    parser_process.set_defaults(func=cmd_process)

    # Query command
    parser_query = subparsers.add_parser(
        "query",
        help="Query patient database",
    )
    _add_common_args(parser_query)
    parser_query.add_argument("question", help="Question to ask")
    parser_query.set_defaults(func=cmd_query)

    # Stats command
    parser_stats = subparsers.add_parser(
        "stats",
        help="Show processing statistics",
    )
    _add_common_args(parser_stats)
    parser_stats.set_defaults(func=cmd_stats)

    # Reset command
    parser_reset = subparsers.add_parser(
        "reset",
        help="Clear all patient data from the database",
    )
    _add_common_args(parser_reset)
    parser_reset.add_argument(
        "--force",
        "-f",
        action="store_true",
        help="Skip confirmation prompt",
    )
    parser_reset.set_defaults(func=cmd_reset)

    # Init command (takes only the model and debug options)
    parser_init = subparsers.add_parser(
        "init",
        help="Download and setup required VLM models",
    )
    parser_init.add_argument(
        "--vlm-model",
        default="Qwen3-VL-4B-Instruct-GGUF",
        help="VLM model to download (default: Qwen3-VL-4B-Instruct-GGUF)",
    )
    parser_init.add_argument(
        "--debug",
        action="store_true",
        help="Enable debug logging",
    )
    parser_init.set_defaults(func=cmd_init)

    # Test command
    parser_test = subparsers.add_parser(
        "test",
        help="Test VLM extraction pipeline on a single file",
    )
    parser_test.add_argument(
        "file",
        help="Path to intake form image (PNG, JPG, PDF)",
    )
    parser_test.add_argument(
        "--vlm-model",
        default="Qwen3-VL-4B-Instruct-GGUF",
        help="VLM model to use (default: Qwen3-VL-4B-Instruct-GGUF)",
    )
    parser_test.add_argument(
        "--max-dimension",
        type=int,
        default=1024,
        help="Max image dimension in pixels (default: 1024)",
    )
    parser_test.add_argument(
        "--jpeg-quality",
        type=int,
        default=85,
        help="JPEG compression quality (default: 85)",
    )
    parser_test.add_argument(
        "--clear-context",
        action="store_true",
        help="Clear VLM context before processing (fixes memory errors)",
    )
    parser_test.add_argument(
        "--debug",
        action="store_true",
        help="Enable debug logging",
    )
    parser_test.set_defaults(func=cmd_test)

    # Dashboard command
    parser_dashboard = subparsers.add_parser(
        "dashboard",
        help="Start web dashboard",
    )
    _add_common_args(parser_dashboard)
    parser_dashboard.add_argument(
        "--host",
        default="127.0.0.1",
        help="Dashboard host (default: 127.0.0.1)",
    )
    parser_dashboard.add_argument(
        "--port",
        type=int,
        default=8080,
        help="Dashboard port (default: 8080)",
    )
    parser_dashboard.add_argument(
        "--no-open",
        action="store_true",
        help="Don't automatically open dashboard",
    )
    parser_dashboard.add_argument(
        "--browser",
        action="store_true",
        help="Open in web browser instead of Electron app",
    )
    parser_dashboard.set_defaults(func=cmd_dashboard)

    # argv=None makes argparse fall back to the process command line.
    args = parser.parse_args(argv)

    # Without a subcommand there is no handler to run; show help instead.
    if not args.command:
        parser.print_help()
        return 0

    # Configure logging - WARNING by default, DEBUG with --debug flag
    if getattr(args, "debug", False):
        logging.basicConfig(
            level=logging.DEBUG,
            format="%(asctime)s | %(levelname)s | %(name)s | %(message)s",
            datefmt="%H:%M:%S",
        )
    else:
        # Keep gaia module loggers at WARNING for cleaner output
        logging.basicConfig(level=logging.WARNING)
        for logger_name in [
            "gaia",
            "gaia.llm",
            "gaia.database",
            "gaia.agents",
            "gaia.utils",
        ]:
            logging.getLogger(logger_name).setLevel(logging.WARNING)

    return args.func(args)


if __name__ == "__main__":
    sys.exit(main())
+# Copyright(C) 2025-2026 Advanced Micro Devices, Inc. All rights reserved.
+# SPDX-License-Identifier: MIT
+"""CLI for Medical Intake Agent."""
+import argparse
+import logging
+import sys
+from pathlib import Path
+from rich.console import Console
+from rich.panel import Panel
+from rich.table import Table
+from gaia.agents.emr.agent import MedicalIntakeAgent
+logger = logging.getLogger(__name__)
+console = Console()
def _print_header(watch_dir: str, db_path: str):
    """Render the CLI banner, the active paths, and the interactive commands.

    Args:
        watch_dir: Folder shown in the "Watch folder" row.
        db_path: Path shown in the "Database" row.
    """
    banner = Panel.fit(
        "[bold cyan]Medical Intake Agent[/bold cyan]\n"
        "[dim]Automatic Patient Form Processing[/dim]",
        border_style="cyan",
    )
    console.print()
    console.print(banner)

    # Borderless two-column table: dim label on the left, value on the right.
    status = Table(show_header=False, box=None, padding=(0, 2))
    status.add_column(style="dim")
    status.add_column()
    for label, location in (
        ("📁 Watch folder:", watch_dir),
        ("💾 Database:", db_path),
    ):
        status.add_row(label, location)
    console.print(status)
    console.print()

    # Short reminder of what can be typed at the prompt.
    for help_line in (
        "[dim]Commands:[/dim]",
        "  [cyan]stats[/cyan]      Show processing statistics",
        "  [cyan]quit[/cyan]       Stop and exit",
        "  [dim]Or type questions about patients[/dim]",
    ):
        console.print(help_line)
    console.print()
def _print_prompt():
    """Draw a dim separator line followed by a green ``> `` input marker."""
    separator = "─" * 80
    console.print(separator, style="dim")
    console.print("> ", style="bold green", end="")
    # Flush so the marker is visible before the caller blocks on input().
    sys.stdout.flush()
def cmd_watch(args):
    """Run the interactive watch session.

    Creates a ``MedicalIntakeAgent`` from ``args.watch_dir``, ``args.db`` and
    ``args.vlm_model``, then reads lines from stdin until ``quit``/``exit``/
    ``q``, end-of-input, or Ctrl+C. ``stats`` prints the statistics panel;
    any other non-empty line is passed to the agent as a query. The agent
    is always stopped on the way out.
    """
    _print_header(args.watch_dir, args.db)
    console.print("[dim]Starting agent...[/dim]")
    agent = MedicalIntakeAgent(
        watch_dir=args.watch_dir,
        db_path=args.db,
        vlm_model=args.vlm_model,
    )
    console.print("[green]✓ Ready![/green] Drop intake forms to process them.\n")
    sys.stdout.flush()  # Make sure the Ready line is shown before the prompt

    exit_words = ("quit", "exit", "q")
    try:
        while True:
            try:
                _print_prompt()
                line = input().strip()
            except EOFError:
                # stdin closed: leave the loop like an explicit quit.
                break

            if not line:
                continue

            command = line.lower()
            if command in exit_words:
                break

            console.print("─" * 80, style="dim")
            if command == "stats":
                cmd_stats_inline(agent)
            else:
                # Anything else is treated as a question for the agent.
                agent.process_query(line)
            print()
    except KeyboardInterrupt:
        print()
    finally:
        console.print("[dim]Stopping agent...[/dim]")
        agent.stop()
        console.print("[green]✓ Stopped[/green]")
def cmd_stats_inline(agent):
    """Print the agent's statistics during watch mode.

    Any exception raised while fetching or rendering the stats is reported
    on the console instead of being propagated.
    """
    try:
        _print_stats_table(agent.get_stats())
    except Exception as err:
        console.print(f"[red]Error getting stats: {err}[/red]")
def cmd_process(args):
    """Process the single intake form at ``args.file``.

    Returns:
        0 when the agent returns patient data, 1 when the file does not
        exist or the agent returns nothing for it.
    """
    form_path = Path(args.file)
    if not form_path.exists():
        console.print(f"[red]Error: File not found: {args.file}[/red]")
        return 1

    console.print(f"[dim]Processing: {args.file}[/dim]")
    agent = MedicalIntakeAgent(
        watch_dir=args.watch_dir,
        db_path=args.db,
        vlm_model=args.vlm_model,
        auto_start_watching=False,
    )
    try:
        # pylint: disable=protected-access
        extracted = agent._process_intake_form(args.file)
        if not extracted:
            console.print(f"[red]Failed to process: {args.file}[/red]")
            return 1
        # On success the agent has already printed the patient details.
        return 0
    finally:
        agent.stop()
def cmd_query(args):
    """Send ``args.question`` to the agent as a query and return 0.

    The agent is created with ``auto_start_watching=False`` and is stopped
    afterwards even if the query raises.
    """
    agent = MedicalIntakeAgent(
        watch_dir=args.watch_dir,
        db_path=args.db,
        auto_start_watching=False,
    )
    try:
        agent.process_query(args.question)
    finally:
        agent.stop()
    return 0
def _print_stats_table(stats: dict):
    """Render the statistics dictionary as Rich panels.

    Reads the keys ``time_saved_minutes``, ``time_saved_percent``,
    ``total_patients``, ``new_patients``, ``returning_patients``,
    ``processed_today``, ``files_processed``, ``extraction_success``,
    ``extraction_failed`` and ``success_rate`` from ``stats``; the optional
    ``unacknowledged_alerts`` key adds an alert line when it is above zero.
    """

    def _label_value_table(rows):
        """Build a headerless two-column table: dim label, bold value."""
        table = Table(show_header=False, box=None)
        table.add_column(style="dim")
        table.add_column(style="bold")
        for label, value in rows:
            table.add_row(label, value)
        return table

    console.print()

    # Headline panel with the time-savings figures.
    savings = Table(show_header=False, box=None, padding=(0, 1))
    savings.add_column(style="bold green")
    savings.add_column(style="green")
    savings.add_row(
        f"⏱️  {stats['time_saved_minutes']} min saved",
        f"({stats['time_saved_percent']} faster)",
    )
    console.print(Panel(savings, title="Time Savings", border_style="green"))

    # Patient counts on the left, processing counts on the right.
    patients = _label_value_table(
        [
            ("Total", str(stats["total_patients"])),
            ("New", str(stats["new_patients"])),
            ("Returning", str(stats["returning_patients"])),
            ("Today", str(stats["processed_today"])),
        ]
    )
    processing = _label_value_table(
        [
            ("Processed", str(stats["files_processed"])),
            ("Success", str(stats["extraction_success"])),
            ("Failed", str(stats["extraction_failed"])),
            ("Rate", stats["success_rate"]),
        ]
    )

    layout = Table.grid(expand=True, padding=(0, 2))
    layout.add_column()
    layout.add_column()
    layout.add_row(
        Panel(patients, title="👥 Patients", border_style="cyan"),
        Panel(processing, title="📋 Processing", border_style="cyan"),
    )
    console.print(layout)

    # Only mention alerts when some are still unacknowledged.
    pending_alerts = stats.get("unacknowledged_alerts", 0)
    if pending_alerts > 0:
        console.print(
            f"[bold red]🚨 {pending_alerts} unacknowledged alert(s)[/bold red]"
        )
    console.print()
def cmd_stats(args):
    """Print processing statistics for the configured database and return 0.

    The agent is created with ``auto_start_watching=False`` and
    ``silent_mode=True``, and is stopped afterwards even if fetching or
    rendering the stats raises.
    """
    agent = MedicalIntakeAgent(
        watch_dir=args.watch_dir,
        db_path=args.db,
        auto_start_watching=False,
        silent_mode=True,
    )
    try:
        _print_stats_table(agent.get_stats())
    finally:
        agent.stop()
    return 0
def cmd_reset(args):
    """Delete the patient database file, asking for confirmation first.

    The confirmation prompt is skipped when ``args.force`` is set.

    Returns:
        0 when the file does not exist, the user cancels, or the file is
        removed; 1 when removing the file raises.
    """
    import os

    from rich.prompt import Confirm

    db_path = Path(args.db)
    if not db_path.exists():
        console.print("[dim]Database file does not exist. Nothing to reset.[/dim]")
        return 0

    # Best-effort record count for the warning text; if the stats cannot be
    # read, the reset simply proceeds with a count of zero.
    total_patients = 0
    agent = None
    try:
        agent = MedicalIntakeAgent(
            watch_dir=args.watch_dir,
            db_path=args.db,
            auto_start_watching=False,
            silent_mode=True,
        )
        total_patients = agent.get_stats().get("total_patients", 0)
    except Exception:
        pass
    finally:
        if agent:
            agent.stop()

    if not args.force:
        console.print()
        console.print(
            "[bold yellow]⚠️  WARNING:[/bold yellow] This will permanently delete:"
        )
        bullets = []
        if total_patients > 0:
            bullets.append(f"  • {total_patients} patient record(s)")
            bullets.append("  • All associated alerts and intake sessions")
        bullets.append(f"  • Database file: {db_path}")
        for bullet in bullets:
            console.print(bullet)
        console.print()

        confirmed = Confirm.ask(
            "[bold red]Are you sure you want to continue?[/bold red]"
        )
        if not confirmed:
            console.print("[dim]Cancelled.[/dim]")
            return 0

    try:
        os.remove(db_path)
        console.print()
        console.print("[bold green]✓ Database deleted successfully[/bold green]")
        console.print(f"  Removed: {db_path}")
        console.print()
        console.print(
            "[dim]A fresh database will be created when you next run the agent.[/dim]"
        )
        return 0
    except Exception as err:
        console.print(f"[red]Error deleting database: {err}[/red]")
        return 1
+def cmd_init(args):
+    """Initialize EMR agent by downloading and loading required models."""
+    import time
+    from gaia.llm.lemonade_client import LemonadeClient
+    console.print()
+    console.print(
+        Panel.fit(
+            "[bold cyan]EMR Agent Setup[/bold cyan]\n"
+            "[dim]Downloading and loading required models[/dim]",
+            border_style="cyan",
+        )
+    )
+    console.print()
+    # Required models for EMR agent
+    vlm_model = args.vlm_model  # Default: Qwen3-VL-4B-Instruct-GGUF
+    llm_model = "Qwen3-Coder-30B-A3B-Instruct-GGUF"  # For chat/query processing
+    embed_model = "nomic-embed-text-v2-moe-GGUF"  # For similarity search
+    REQUIRED_CONTEXT_SIZE = 32768
+    # Step 1: Check Lemonade server and context size
+    console.print("[bold]Step 1:[/bold] Checking Lemonade server...")
+    try:
+        client = LemonadeClient(model=vlm_model)
+        health = client.health_check()
+        if health.get("status") == "ok":
+            console.print("  [green]✓[/green] Lemonade server is running")
+            # Check context size
+            context_size = health.get("context_size", 0)
+            if context_size >= REQUIRED_CONTEXT_SIZE:
+                console.print(
+                    f"  [green]✓[/green] Context size: [cyan]{context_size:,}[/cyan] tokens (recommended: {REQUIRED_CONTEXT_SIZE:,})"
+                )
+            elif context_size > 0:
+                console.print(
+                    f"  [yellow]⚠[/yellow] Context size: [yellow]{context_size:,}[/yellow] tokens"
+                )
+                console.print(
+                    f"    [yellow]Warning:[/yellow] Context size should be at least [cyan]{REQUIRED_CONTEXT_SIZE:,}[/cyan] for reliable form processing"
+                )
+                console.print(
+                    "    [dim]To fix: Right-click Lemonade tray → Settings → Context Size → 32768[/dim]"
+                )
+            else:
+                console.print(
+                    "  [dim]Context size: Not reported (will check after model load)[/dim]"
+                )
+        else:
+            console.print("  [red]✗[/red] Lemonade server not responding")
+            console.print()
+            console.print("[yellow]Please start Lemonade server first:[/yellow]")
+            console.print("  1. Open Lemonade from the system tray")
+            console.print("  2. Or run: [cyan]lemonade-server[/cyan]")
+            return 1
+    except Exception as e:
+        console.print(f"  [red]✗[/red] Cannot connect to Lemonade: {e}")
+        console.print()
+        console.print("[yellow]Please start Lemonade server first:[/yellow]")
+        console.print("  1. Open Lemonade from the system tray")
+        console.print("  2. Or run: [cyan]lemonade-server[/cyan]")
+        return 1
+    # Step 2: Check required models
+    console.print()
+    console.print("[bold]Step 2:[/bold] Checking required models...")
+    try:
+        models_response = client.list_models()
+        available_models = models_response.get("data", [])
+        downloaded_model_ids = [m.get("id", "") for m in available_models]
+        # Check each required model
+        required_models = [
+            ("VLM", vlm_model, "Form extraction"),
+            ("LLM", llm_model, "Chat/query processing"),
+            ("Embedding", embed_model, "Similarity search"),
+        ]
+        models_to_download = []
+        for model_type, model_name, _purpose in required_models:
+            is_downloaded = model_name in downloaded_model_ids
+            if is_downloaded:
+                console.print(
+                    f"  [green]✓[/green] {model_type}: [cyan]{model_name}[/cyan]"
+                )
+            else:
+                console.print(
+                    f"  [dim]○[/dim] {model_type}: [cyan]{model_name}[/cyan] [dim](not downloaded)[/dim]"
+                )
+                models_to_download.append((model_type, model_name))
+        if models_to_download:
+            console.print()
+            console.print(
+                f"  [yellow]⚠️  {len(models_to_download)} model(s) need to be downloaded[/yellow]"
+            )
+    except Exception as e:
+        console.print(f"  [red]✗[/red] Failed to check models: {e}")
+        return 1
+    # Step 3: Load all required models
+    console.print()
+    console.print("[bold]Step 3:[/bold] Loading required models...")
+    console.print("  [dim]Loading models into memory for fast inference...[/dim]")
+    console.print()
+    models_loaded = {}
+    # Load VLM model first (most important for form processing)
+    for model_type, model_name in [
+        ("VLM", vlm_model),
+        ("LLM", llm_model),
+        ("Embedding", embed_model),
+    ]:
+        console.print(f"  Loading {model_type}: [cyan]{model_name}[/cyan]...")
+        try:
+            start_time = time.time()
+            client.load_model(model_name, timeout=1800, auto_download=True)
+            elapsed = time.time() - start_time
+            models_loaded[model_type] = True
+            console.print(f"  [green]✓[/green] {model_type} loaded ({elapsed:.1f}s)")
+        except Exception as e:
+            error_msg = str(e)
+            models_loaded[model_type] = False
+            # Check for common errors
+            if "being used by another process" in error_msg:
+                console.print(
+                    f"  [yellow]![/yellow] {model_type}: File locked, try again later"
+                )
+            elif (
+                "not found" in error_msg.lower()
+                or "does not exist" in error_msg.lower()
+            ):
+                console.print(
+                    f"  [yellow]![/yellow] {model_type}: Model not available in registry"
+                )
+            else:
+                console.print(f"  [yellow]![/yellow] {model_type}: {error_msg[:50]}...")
+    # Check if critical models loaded
+    if not models_loaded.get("VLM"):
+        console.print()
+        console.print(
+            "[red]✗ VLM model failed to load - form processing will not work[/red]"
+        )
+        return 1
+    # Clear VLM context to ensure fresh memory allocation
+    console.print()
+    console.print("  [dim]Clearing VLM context for clean memory...[/dim]")
+    try:
+        client.unload_model()
+        client.load_model(vlm_model, timeout=300, auto_download=True)
+        console.print("  [green]✓[/green] VLM context cleared")
+    except Exception as e:
+        console.print(f"  [dim]Context clear skipped: {e}[/dim]")
+    # Step 4: Verify models and check context size
+    console.print()
+    console.print("[bold]Step 4:[/bold] Verifying models are ready...")
+    vlm_ready = False
+    llm_ready = False
+    embed_ready = False
+    final_context_size = 0
+    try:
+        # Check health for context size
+        health = client.health_check()
+        final_context_size = health.get("context_size", 0)
+        # Check each model
+        vlm_ready = client.check_model_loaded(vlm_model)
+        llm_ready = client.check_model_loaded(llm_model)
+        embed_ready = client.check_model_loaded(embed_model)
+        if vlm_ready:
+            console.print("  [green]✓[/green] VLM: Ready for form extraction")
+        else:
+            console.print("  [yellow]![/yellow] VLM: Will load on first use")
+        if llm_ready:
+            console.print("  [green]✓[/green] LLM: Ready for chat queries")
+        else:
+            console.print("  [dim]○[/dim] LLM: Will load on first use")
+        if embed_ready:
+            console.print("  [green]✓[/green] Embedding: Ready for search")
+        else:
+            console.print("  [dim]○[/dim] Embedding: Will load on first use")
+        # Report context size
+        if final_context_size >= REQUIRED_CONTEXT_SIZE:
+            console.print(
+                f"  [green]✓[/green] Context size: [cyan]{final_context_size:,}[/cyan] tokens"
+            )
+        elif final_context_size > 0:
+            console.print(
+                f"  [yellow]⚠[/yellow] Context size: [yellow]{final_context_size:,}[/yellow] tokens (need {REQUIRED_CONTEXT_SIZE:,})"
+            )
+    except Exception as e:
+        console.print(f"  [yellow]![/yellow] Could not verify: {e}")
+    # Step 5: Show all downloaded and loaded models
+    console.print()
+    console.print("[bold]Step 5:[/bold] Model inventory...")
+    try:
+        models_response = client.list_models()
+        all_models = models_response.get("data", [])
+        # Categorize models
+        vlm_models = []
+        llm_models = []
+        embed_models = []
+        for m in all_models:
+            model_id = m.get("id", "")
+            model_lower = model_id.lower()
+            if "vl" in model_lower or "vision" in model_lower or "vlm" in model_lower:
+                vlm_models.append(model_id)
+            elif (
+                "embed" in model_lower
+                or "bge" in model_lower
+                or "e5" in model_lower
+                or "nomic" in model_lower
+            ):
+                embed_models.append(model_id)
+            else:
+                llm_models.append(model_id)
+        # Show categorized models
+        if vlm_models:
+            console.print(
+                f"  [cyan]VLM Models:[/cyan] {', '.join(vlm_models[:3])}"
+                + (f" (+{len(vlm_models)-3} more)" if len(vlm_models) > 3 else "")
+            )
+        if llm_models:
+            console.print(
+                f"  [cyan]LLM Models:[/cyan] {', '.join(llm_models[:3])}"
+                + (f" (+{len(llm_models)-3} more)" if len(llm_models) > 3 else "")
+            )
+        if embed_models:
+            console.print(
+                f"  [cyan]Embedding Models:[/cyan] {', '.join(embed_models[:3])}"
+                + (f" (+{len(embed_models)-3} more)" if len(embed_models) > 3 else "")
+            )
+        console.print(f"  [dim]Total models available: {len(all_models)}[/dim]")
+    except Exception as e:
+        console.print(f"  [dim]Could not list models: {e}[/dim]")
+    # Success summary
+    console.print()
+    # Build model status lines
+    model_status_lines = []
+    # VLM status
+    if vlm_ready:
+        model_status_lines.append(
+            f"[green]✓[/green] VLM: [cyan]{vlm_model}[/cyan] - Ready"
+        )
+    else:
+        model_status_lines.append(
+            f"[yellow]![/yellow] VLM: [cyan]{vlm_model}[/cyan] - Will load on first use"
+        )
+    # LLM status
+    if llm_ready:
+        model_status_lines.append(
+            f"[green]✓[/green] LLM: [cyan]{llm_model}[/cyan] - Ready"
+        )
+    else:
+        model_status_lines.append(
+            f"[dim]○[/dim] LLM: [cyan]{llm_model}[/cyan] - Will load on first use"
+        )
+    # Embedding status
+    if embed_ready:
+        model_status_lines.append(
+            f"[green]✓[/green] Embedding: [cyan]{embed_model}[/cyan] - Ready"
+        )
+    else:
+        model_status_lines.append(
+            f"[dim]○[/dim] Embedding: [cyan]{embed_model}[/cyan] - Will load on first use"
+        )
+    # Context size status
+    if final_context_size >= REQUIRED_CONTEXT_SIZE:
+        model_status_lines.append(
+            f"[green]✓[/green] Context size: {final_context_size:,} tokens"
+        )
+    elif final_context_size > 0:
+        model_status_lines.append(
+            f"[yellow]⚠[/yellow] Context size: {final_context_size:,} tokens (need {REQUIRED_CONTEXT_SIZE:,})"
+        )
+    # Count ready models
+    ready_count = sum([vlm_ready, llm_ready, embed_ready])
+    console.print(
+        Panel.fit(
+            f"[bold green]✓ EMR Agent initialized ({ready_count}/3 models ready)[/bold green]\n\n"
+            + "\n".join(model_status_lines)
+            + "\n\n"
+            "[dim]You can now run:[/dim]\n"
+            "  [cyan]gaia-emr dashboard[/cyan]  - Start the web dashboard\n"
+            "  [cyan]gaia-emr watch[/cyan]      - Watch folder for intake forms\n"
+            "  [cyan]gaia-emr process <file>[/cyan] - Process a single file",
+            border_style="green",
+        )
+    )
+    console.print()
+    # Context size warning if needed
+    if 0 < final_context_size < REQUIRED_CONTEXT_SIZE:
+        console.print(
+            Panel.fit(
+                "[yellow]⚠️  Context Size Warning[/yellow]\n\n"
+                f"Current context size ({final_context_size:,}) may be too small for processing intake forms.\n"
+                "Large images can require 4,000-8,000+ tokens.\n\n"
+                "[bold]To fix:[/bold]\n"
+                "  1. Right-click Lemonade tray icon → Settings\n"
+                "  2. Set Context Size to [cyan]32768[/cyan]\n"
+                "  3. Click Apply and restart the model",
+                border_style="yellow",
+            )
+        )
+        console.print()
+    return 0
+def cmd_test(args):
+    """Test VLM extraction pipeline on a single file."""
+    import io
+    import json
+    import time
+    from PIL import Image
+    from gaia.llm.vlm_client import VLMClient
+    file_path = Path(args.file)
+    if not file_path.exists():
+        console.print(f"[red]Error: File not found: {file_path}[/red]")
+        return 1
+    console.print()
+    console.print(
+        Panel.fit(
+            "[bold cyan]EMR Agent - VLM Pipeline Test[/bold cyan]\n"
+            f"[dim]Testing extraction on: {file_path.name}[/dim]",
+            border_style="cyan",
+        )
+    )
+    console.print()
+    # Step 1: Read and analyze file
+    console.print("[bold]Step 1:[/bold] Reading file...")
+    try:
+        raw_bytes = file_path.read_bytes()
+        file_size_kb = len(raw_bytes) / 1024
+        console.print(f"  File size: {file_size_kb:.1f} KB")
+        # Get image dimensions
+        img = Image.open(io.BytesIO(raw_bytes))
+        orig_width, orig_height = img.size
+        console.print(f"  Dimensions: {orig_width}x{orig_height} pixels")
+        # Auto-rotate based on EXIF orientation
+        try:
+            from PIL import ExifTags
+            exif = img._getexif()  # pylint: disable=protected-access
+            if exif:
+                for tag, value in exif.items():
+                    if ExifTags.TAGS.get(tag) == "Orientation":
+                        if value == 3:
+                            img = img.rotate(180, expand=True)
+                            console.print("  [dim]Auto-rotated 180°[/dim]")
+                        elif value == 6:
+                            img = img.rotate(270, expand=True)
+                            console.print("  [dim]Auto-rotated 90° CW[/dim]")
+                        elif value == 8:
+                            img = img.rotate(90, expand=True)
+                            console.print("  [dim]Auto-rotated 90° CCW[/dim]")
+                        orig_width, orig_height = img.size
+                        break
+        except Exception:
+            pass  # No EXIF or rotation info
+    except Exception as e:
+        console.print(f"  [red]✗[/red] Failed to read file: {e}")
+        return 1
+    # Step 2: Optimize image (same as agent)
+    console.print()
+    console.print("[bold]Step 2:[/bold] Optimizing image...")
+    max_dimension = args.max_dimension
+    jpeg_quality = args.jpeg_quality
+    try:
+        if orig_width > max_dimension or orig_height > max_dimension:
+            scale = min(max_dimension / orig_width, max_dimension / orig_height)
+            new_width = int(orig_width * scale)
+            new_height = int(orig_height * scale)
+            img = img.resize((new_width, new_height), Image.Resampling.LANCZOS)
+            console.print(
+                f"  Resized: {orig_width}x{orig_height} → {new_width}x{new_height}"
+            )
+        else:
+            new_width, new_height = orig_width, orig_height
+            console.print(f"  No resize needed (under {max_dimension}px)")
+        # Convert to RGB and JPEG
+        if img.mode in ("RGBA", "P"):
+            img = img.convert("RGB")
+        output = io.BytesIO()
+        img.save(output, format="JPEG", quality=jpeg_quality, optimize=True)
+        image_bytes = output.getvalue()
+        opt_size_kb = len(image_bytes) / 1024
+        reduction = (1 - opt_size_kb / file_size_kb) * 100
+        console.print(
+            f"  Optimized: {file_size_kb:.0f}KB → {opt_size_kb:.0f}KB ({reduction:.0f}% smaller)"
+        )
+        # Estimate image tokens (rough: ~1 token per 14x14 pixel patch)
+        est_img_tokens = (new_width // 14) * (new_height // 14)
+        console.print(f"  Est. image tokens: ~{est_img_tokens:,}")
+    except Exception as e:
+        console.print(f"  [red]✗[/red] Failed to optimize: {e}")
+        return 1
+    # Step 3: Initialize VLM
+    console.print()
+    console.print("[bold]Step 3:[/bold] Initializing VLM...")
+    try:
+        vlm = VLMClient(vlm_model=args.vlm_model)
+        # Clear context if requested (unload and reload model)
+        if getattr(args, "clear_context", False):
+            console.print("  [dim]Clearing VLM context (unload + reload)...[/dim]")
+            try:
+                vlm.client.unload_model()
+                vlm.client.load_model(args.vlm_model, timeout=300, auto_download=True)
+                console.print("  [green]✓[/green] Context cleared")
+            except Exception as e:
+                console.print(f"  [yellow]⚠[/yellow] Could not clear context: {e}")
+        console.print(f"  [green]✓[/green] VLM ready: [cyan]{vlm.vlm_model}[/cyan]")
+    except Exception as e:
+        console.print(f"  [red]✗[/red] Failed to initialize VLM: {e}")
+        return 1
+    # Step 4: Extract data with auto-retry on memory errors
+    console.print()
+    console.print("[bold]Step 4:[/bold] Extracting patient data...")
+    extraction_prompt = """Extract ALL patient information from this medical intake form.
+Return a JSON object with these fields (use null for missing/unclear):
+{
+    "form_date": "YYYY-MM-DD (date form was filled, today's date)",
+    "first_name": "...",
+    "last_name": "...",
+    "date_of_birth": "YYYY-MM-DD",
+    "age": "patient's age if listed",
+    "gender": "Male/Female/Other",
+    "preferred_pronouns": "he/him, she/her, they/them if listed",
+    "ssn": "XXX-XX-XXXX (social security number)",
+    "marital_status": "Single/Married/Divorced/Widowed/Partnered",
+    "spouse_name": "spouse's name if listed",
+    "phone": "home phone number",
+    "mobile_phone": "cell/mobile phone number",
+    "work_phone": "work phone number",
+    "email": "...",
+    "address": "street address",
+    "city": "...",
+    "state": "...",
+    "zip_code": "...",
+    "preferred_language": "English/Spanish/etc if listed",
+    "race": "if listed",
+    "ethnicity": "if listed",
+    "contact_preference": "preferred contact method if listed",
+    "emergency_contact_name": "name of emergency contact person",
+    "emergency_contact_relationship": "relationship to patient (e.g. Mom, Spouse, Friend)",
+    "emergency_contact_phone": "emergency contact's phone number",
+    "referring_physician": "name of referring physician/doctor",
+    "referring_physician_phone": "phone number next to referring physician",
+    "primary_care_physician": "PCP name if different from referring",
+    "preferred_pharmacy": "pharmacy name if listed",
+    "employment_status": "Employed/Self Employed/Unemployed/Retired/Student/Disabled/Military",
+    "occupation": "job title if listed",
+    "employer": "employer/company name",
+    "employer_address": "employer address if listed",
+    "insurance_provider": "insurance company name",
+    "insurance_id": "policy number",
+    "insurance_group_number": "group number",
+    "insured_name": "name of insured person (may differ from patient)",
+    "insured_dob": "YYYY-MM-DD",
+    "insurance_phone": "insurance contact number",
+    "billing_address": "billing address if different from home",
+    "guarantor_name": "person responsible for payment if listed",
+    "reason_for_visit": "chief complaint or reason for visit",
+    "date_of_injury": "YYYY-MM-DD (date of injury or onset of symptoms)",
+    "pain_location": "where pain is located if listed",
+    "pain_onset": "when pain began (e.g. three months ago)",
+    "pain_cause": "what caused the pain/condition",
+    "pain_progression": "Improved/Worsened/Stayed the same",
+    "work_related_injury": "Yes/No",
+    "car_accident": "Yes/No",
+    "medical_conditions": "existing medical conditions",
+    "allergies": "known allergies",
+    "medications": "current medications",
+    "signature_date": "YYYY-MM-DD (date signed)"
+}
+IMPORTANT: Return ONLY the JSON object, no other text."""
+    # Retry loop with progressively smaller images on memory errors
+    max_retries = 3
+    current_img = img
+    current_bytes = image_bytes
+    current_width, current_height = new_width, new_height
+    current_size_kb = opt_size_kb
+    for attempt in range(max_retries):
+        est_img_tokens = (current_width // 14) * (current_height // 14)
+        console.print(
+            f"  Image: {current_width}x{current_height}, {current_size_kb:.0f}KB (~{est_img_tokens:,} tokens)"
+        )
+        if attempt == 0:
+            console.print("  [dim]This may take 30-60 seconds...[/dim]")
+        else:
+            console.print(
+                f"  [dim]Retry {attempt}/{max_retries-1} with smaller image...[/dim]"
+            )
+        try:
+            start_time = time.time()
+            raw_text = vlm.extract_from_image(
+                image_bytes=current_bytes,
+                prompt=extraction_prompt,
+            )
+            extraction_time = time.time() - start_time
+            # Check for memory-related errors
+            if (
+                "failed to process image" in raw_text
+                or "memory slot" in raw_text.lower()
+            ):
+                if attempt < max_retries - 1:
+                    console.print(
+                        "  [yellow]⚠[/yellow] Memory error, reducing image size..."
+                    )
+                    # Reduce image to 75% of current size
+                    scale = 0.75
+                    current_width = int(current_width * scale)
+                    current_height = int(current_height * scale)
+                    current_img = current_img.resize(
+                        (current_width, current_height), Image.Resampling.LANCZOS
+                    )
+                    output = io.BytesIO()
+                    current_img.save(
+                        output, format="JPEG", quality=jpeg_quality, optimize=True
+                    )
+                    current_bytes = output.getvalue()
+                    current_size_kb = len(current_bytes) / 1024
+                    continue
+                else:
+                    console.print(f"  [red]✗[/red] {raw_text}")
+                    console.print()
+                    console.print("[yellow]Suggestions:[/yellow]")
+                    console.print("  1. Try with smaller image: --max-dimension 640")
+                    console.print("  2. Restart Lemonade Server to clear memory")
+                    console.print("  3. Reload the VLM model in Lemonade")
+                    return 1
+            if raw_text.startswith("[VLM extraction failed:"):
+                console.print(f"  [red]✗[/red] {raw_text}")
+                return 1
+            # Success!
+            console.print(
+                f"  [green]✓[/green] Extraction complete ({len(raw_text)} chars, {extraction_time:.1f}s)"
+            )
+            # Estimate tokens/sec (output tokens only)
+            est_output_tokens = len(raw_text) / 4
+            tps = est_output_tokens / extraction_time if extraction_time > 0 else 0
+            console.print(
+                f"  Output: ~{est_output_tokens:.0f} tokens at ~{tps:.1f} TPS"
+            )
+            # Total throughput including prompt processing
+            total_tokens = (
+                est_img_tokens + 200 + est_output_tokens
+            )  # img + prompt + output
+            total_tps = total_tokens / extraction_time if extraction_time > 0 else 0
+            console.print(
+                f"  Total throughput: ~{total_tps:.0f} TPS (incl. {est_img_tokens:,} image tokens)"
+            )
+            # Update dimensions for final report
+            new_width, new_height = current_width, current_height
+            break
+        except Exception as e:
+            console.print(f"  [red]✗[/red] Extraction failed: {e}")
+            return 1
+    else:
+        # All retries exhausted
+        console.print("  [red]✗[/red] All retries failed")
+        return 1
+    # Step 5: Parse JSON
+    console.print()
+    console.print("[bold]Step 5:[/bold] Parsing JSON...")
+    try:
+        # Try direct parse
+        patient_data = json.loads(raw_text)
+        console.print("  [green]✓[/green] JSON parsed successfully")
+    except json.JSONDecodeError:
+        # Try to find JSON in text
+        try:
+            start = raw_text.find("{")
+            end = raw_text.rfind("}") + 1
+            if start >= 0 and end > start:
+                patient_data = json.loads(raw_text[start:end])
+                console.print("  [green]✓[/green] JSON extracted from response")
+            else:
+                console.print("  [red]✗[/red] No JSON found in response")
+                console.print()
+                console.print("[bold]Raw VLM Output:[/bold]")
+                console.print(raw_text[:500])
+                return 1
+        except json.JSONDecodeError as e:
+            console.print(f"  [red]✗[/red] JSON parse failed: {e}")
+            return 1
+    # Display results
+    console.print()
+    console.print(
+        Panel.fit(
+            "[bold green]✓ Extraction Successful[/bold green]",
+            border_style="green",
+        )
+    )
+    # Show extracted fields
+    console.print()
+    console.print("[bold]Extracted Fields:[/bold]")
+    fields_found = 0
+    for key, value in patient_data.items():
+        if value and value != "null":
+            fields_found += 1
+            console.print(f"  [cyan]{key}:[/cyan] {value}")
+    console.print()
+    console.print(f"[dim]Fields extracted: {fields_found}/53[/dim]")
+    console.print()
+    # Timing breakdown section
+    console.print("[bold]⏱️  TIMING BREAKDOWN[/bold]")
+    console.print("-" * 40)
+    console.print(f"   Model:              {args.vlm_model}")
+    console.print(f"   Image dimensions:   {new_width}x{new_height}")
+    console.print(f"   VLM extraction:     {extraction_time:.2f}s")
+    console.print(f"   Est. image tokens:  ~{est_img_tokens:,}")
+    console.print(f"   Est. output tokens: ~{int(est_output_tokens)}")
+    console.print(f"   Est. tokens/sec:    ~{tps:.1f} TPS")
+    console.print()
+    # Success summary
+    if patient_data.get("first_name") and patient_data.get("last_name"):
+        console.print(
+            f"   Patient: {patient_data.get('first_name', '')} {patient_data.get('last_name', '')}"
+        )
+        console.print("   [green]✓ Pipeline test PASSED[/green]")
+    else:
+        console.print("   [yellow]⚠ Missing required name fields[/yellow]")
+        console.print("   [red]✗ Pipeline test FAILED[/red]")
+    console.print()
+    return 0
+def _launch_electron(url: str, delay: float = 1.5) -> bool:
+    """
+    Launch Electron app to display the dashboard.
+    Returns True if Electron was launched successfully, False otherwise.
+    """
+    import os
+    import platform
+    import shutil
+    import subprocess
+    import time
+    time.sleep(delay)  # Wait for server to start
+    # Find the Electron wrapper directory
+    electron_dir = Path(__file__).parent / "dashboard" / "electron"
+    main_js = electron_dir / "main.js"
+    if not main_js.exists():
+        logger.warning(f"Electron wrapper not found at {electron_dir}")
+        return False
+    # On Windows, use npm.cmd and npx.cmd
+    is_windows = platform.system() == "Windows"
+    npm_cmd = "npm.cmd" if is_windows else "npm"
+    npx_cmd = "npx.cmd" if is_windows else "npx"
+    # Check if npx/electron is available
+    npx_path = shutil.which(npx_cmd)
+    if not npx_path:
+        logger.warning(f"{npx_cmd} not found in PATH, cannot launch Electron")
+        return False
+    try:
+        # Check if node_modules exists, if not run npm install first
+        node_modules = electron_dir / "node_modules"
+        if not node_modules.exists():
+            console.print("[dim]Installing Electron dependencies...[/dim]")
+            subprocess.run(
+                [npm_cmd, "install"],
+                cwd=str(electron_dir),
+                capture_output=True,
+                check=True,
+                shell=is_windows,  # Use shell on Windows for .cmd files
+            )
+        # Launch Electron with the dashboard URL
+        env = os.environ.copy()
+        env["EMR_DASHBOARD_URL"] = url
+        subprocess.Popen(
+            [npx_cmd, "electron", "."],
+            cwd=str(electron_dir),
+            env=env,
+            stdout=subprocess.DEVNULL,
+            stderr=subprocess.DEVNULL,
+            shell=is_windows,  # Use shell on Windows for .cmd files
+        )
+        return True
+    except Exception as e:
+        logger.warning(f"Failed to launch Electron: {e}")
+        return False
+def cmd_dashboard(args):
+    """Start web dashboard."""
+    import threading
+    import time
+    import webbrowser
+    def open_browser(url: str, delay: float = 1.5):
+        """Open browser after a short delay to allow server to start."""
+        time.sleep(delay)
+        webbrowser.open(url)
+    def open_electron_or_browser(url: str, use_browser: bool, delay: float = 1.5):
+        """Open Electron app, falling back to browser if needed."""
+        if use_browser:
+            open_browser(url, delay)
+        else:
+            if not _launch_electron(url, delay):
+                console.print(
+                    "[yellow]Electron not available, opening in browser instead...[/yellow]"
+                )
+                open_browser(url, delay)
+    try:
+        from gaia.agents.emr.dashboard.server import run_dashboard
+        console.print()
+        console.print(
+            Panel.fit(
+                "[bold cyan]EMR Dashboard[/bold cyan]\n"
+                "[dim]Real-time Patient Processing Monitor[/dim]",
+                border_style="cyan",
+            )
+        )
+        url = f"http://localhost:{args.port}"
+        table = Table(show_header=False, box=None, padding=(0, 2))
+        table.add_column(style="dim")
+        table.add_column()
+        table.add_row("📁 Watch folder:", args.watch_dir)
+        table.add_row("💾 Database:", args.db)
+        table.add_row("🌐 URL:", f"[bold cyan]{url}[/bold cyan]")
+        console.print(table)
+        console.print("\n[dim]Press Ctrl+C to stop[/dim]\n")
+        # Auto-open unless --no-open flag is set
+        if not getattr(args, "no_open", False):
+            use_browser = getattr(args, "browser", False)
+            if use_browser:
+                console.print("[dim]Opening dashboard in browser...[/dim]\n")
+            else:
+                console.print("[dim]Opening dashboard in Electron app...[/dim]\n")
+            open_thread = threading.Thread(
+                target=open_electron_or_browser,
+                args=(url, use_browser),
+                daemon=True,
+            )
+            open_thread.start()
+        run_dashboard(
+            watch_dir=args.watch_dir,
+            db_path=args.db,
+            host=args.host,
+            port=args.port,
+        )
+    except ImportError:
+        console.print("[red]Error: Dashboard dependencies not installed[/red]")
+        console.print("Install with: [cyan]pip install 'amd-gaia[api]'[/cyan]")
+        return 1
+    except KeyboardInterrupt:
+        console.print("\n[dim]Shutting down dashboard...[/dim]")
+        return 0
+def _add_common_args(parser):
+    """Add common arguments to a parser."""
+    parser.add_argument(
+        "--watch-dir",
+        default="./intake_forms",
+        help="Directory to watch for intake forms (default: ./intake_forms)",
+    )
+    parser.add_argument(
+        "--db",
+        default="./data/patients.db",
+        help="Path to patient database (default: ./data/patients.db)",
+    )
+    parser.add_argument(
+        "--vlm-model",
+        default="Qwen3-VL-4B-Instruct-GGUF",
+        help="VLM model for extraction (default: Qwen3-VL-4B-Instruct-GGUF)",
+    )
+    parser.add_argument(
+        "--debug",
+        action="store_true",
+        help="Enable debug logging",
+    )
+def main():
+    """Main CLI entry point."""
+    parser = argparse.ArgumentParser(
+        description="Medical Intake Agent CLI",
+        formatter_class=argparse.RawDescriptionHelpFormatter,
+    )
+    subparsers = parser.add_subparsers(dest="command", help="Command to run")
+    # Watch command
+    parser_watch = subparsers.add_parser(
+        "watch",
+        help="Watch directory for new intake forms",
+    )
+    _add_common_args(parser_watch)
+    parser_watch.set_defaults(func=cmd_watch)
+    # Process command
+    parser_process = subparsers.add_parser(
+        "process",
+        help="Process a single intake form",
+    )
+    _add_common_args(parser_process)
+    parser_process.add_argument("file", help="Path to intake form file")
+    parser_process.set_defaults(func=cmd_process)
+    # Query command
+    parser_query = subparsers.add_parser(
+        "query",
+        help="Query patient database",
+    )
+    _add_common_args(parser_query)
+    parser_query.add_argument("question", help="Question to ask")
+    parser_query.set_defaults(func=cmd_query)
+    # Stats command
+    parser_stats = subparsers.add_parser(
+        "stats",
+        help="Show processing statistics",
+    )
+    _add_common_args(parser_stats)
+    parser_stats.set_defaults(func=cmd_stats)
+    # Reset command
+    parser_reset = subparsers.add_parser(
+        "reset",
+        help="Clear all patient data from the database",
+    )
+    _add_common_args(parser_reset)
+    parser_reset.add_argument(
+        "--force",
+        "-f",
+        action="store_true",
+        help="Skip confirmation prompt",
+    )
+    parser_reset.set_defaults(func=cmd_reset)
+    # Init command
+    parser_init = subparsers.add_parser(
+        "init",
+        help="Download and setup required VLM models",
+    )
+    parser_init.add_argument(
+        "--vlm-model",
+        default="Qwen3-VL-4B-Instruct-GGUF",
+        help="VLM model to download (default: Qwen3-VL-4B-Instruct-GGUF)",
+    )
+    parser_init.add_argument(
+        "--debug",
+        action="store_true",
+        help="Enable debug logging",
+    )
+    parser_init.set_defaults(func=cmd_init)
+    # Test command
+    parser_test = subparsers.add_parser(
+        "test",
+        help="Test VLM extraction pipeline on a single file",
+    )
+    parser_test.add_argument(
+        "file",
+        help="Path to intake form image (PNG, JPG, PDF)",
+    )
+    parser_test.add_argument(
+        "--vlm-model",
+        default="Qwen3-VL-4B-Instruct-GGUF",
+        help="VLM model to use (default: Qwen3-VL-4B-Instruct-GGUF)",
+    )
+    parser_test.add_argument(
+        "--max-dimension",
+        type=int,
+        default=1024,
+        help="Max image dimension in pixels (default: 1024)",
+    )
+    parser_test.add_argument(
+        "--jpeg-quality",
+        type=int,
+        default=85,
+        help="JPEG compression quality (default: 85)",
+    )
+    parser_test.add_argument(
+        "--clear-context",
+        action="store_true",
+        help="Clear VLM context before processing (fixes memory errors)",
+    )
+    parser_test.add_argument(
+        "--debug",
+        action="store_true",
+        help="Enable debug logging",
+    )
+    parser_test.set_defaults(func=cmd_test)
+    # Dashboard command
+    parser_dashboard = subparsers.add_parser(
+        "dashboard",
+        help="Start web dashboard",
+    )
+    _add_common_args(parser_dashboard)
+    parser_dashboard.add_argument(
+        "--host",
+        default="127.0.0.1",
+        help="Dashboard host (default: 127.0.0.1)",
+    )
+    parser_dashboard.add_argument(
+        "--port",
+        type=int,
+        default=8080,
+        help="Dashboard port (default: 8080)",
+    )
+    parser_dashboard.add_argument(
+        "--no-open",
+        action="store_true",
+        help="Don't automatically open dashboard",
+    )
+    parser_dashboard.add_argument(
+        "--browser",
+        action="store_true",
+        help="Open in web browser instead of Electron app",
+    )
+    parser_dashboard.set_defaults(func=cmd_dashboard)
+    args = parser.parse_args()
+    # Run command
+    if not args.command:
+        parser.print_help()
+        return 0
+    # Configure logging - WARNING by default, DEBUG with --debug flag
+    if getattr(args, "debug", False):
+        logging.basicConfig(
+            level=logging.DEBUG,
+            format="%(asctime)s | %(levelname)s | %(name)s | %(message)s",
+            datefmt="%H:%M:%S",
+        )
+    else:
+        # Suppress all logs from gaia modules for cleaner output
+        logging.basicConfig(level=logging.WARNING)
+        for logger_name in [
+            "gaia",
+            "gaia.llm",
+            "gaia.database",
+            "gaia.agents",
+            "gaia.utils",
+        ]:
+            logging.getLogger(logger_name).setLevel(logging.WARNING)
+    return args.func(args)
+if __name__ == "__main__":
+    sys.exit(main())

amd-gaia 0.15.0__py3-none-any.whl → 0.15.1__py3-none-any.whl

amd-gaia 0.15.0__py3-none-any.whl → 0.15.1__py3-none-any.whl