adversarial-workflow 0.6.2.tar.gz → 0.6.4.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (54)
  1. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/PKG-INFO +26 -4
  2. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/README.md +24 -2
  3. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/__init__.py +1 -1
  4. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/__main__.py +1 -0
  5. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/cli.py +85 -137
  6. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/evaluators/config.py +2 -0
  7. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/evaluators/discovery.py +29 -9
  8. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/evaluators/runner.py +2 -7
  9. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/utils/config.py +1 -3
  10. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/utils/file_splitter.py +2 -6
  11. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/utils/validation.py +1 -3
  12. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow.egg-info/PKG-INFO +26 -4
  13. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow.egg-info/SOURCES.txt +1 -0
  14. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/pyproject.toml +2 -2
  15. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/tests/test_cli_dynamic_commands.py +50 -3
  16. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/tests/test_config.py +20 -14
  17. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/tests/test_env_loading.py +1 -3
  18. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/tests/test_evaluate.py +35 -30
  19. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/tests/test_evaluator_discovery.py +204 -3
  20. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/tests/test_file_splitter.py +1 -0
  21. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/tests/test_python_version.py +1 -0
  22. adversarial_workflow-0.6.4/tests/test_timeout_integration.py +406 -0
  23. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/LICENSE +0 -0
  24. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/evaluators/__init__.py +0 -0
  25. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/evaluators/builtins.py +0 -0
  26. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/templates/.aider.conf.yml.template +0 -0
  27. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/templates/.env.example.template +0 -0
  28. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/templates/README.template +0 -0
  29. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/templates/agent-context/AGENT-SYSTEM-GUIDE.md +0 -0
  30. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/templates/agent-context/README.md.template +0 -0
  31. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/templates/agent-context/agent-handoffs-minimal.json.template +0 -0
  32. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/templates/agent-context/agent-handoffs.json.template +0 -0
  33. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/templates/agent-context/current-state.json.template +0 -0
  34. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/templates/config.yml.template +0 -0
  35. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/templates/evaluate_plan.sh.template +0 -0
  36. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/templates/example-task.md.template +0 -0
  37. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/templates/proofread_content.sh.template +0 -0
  38. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/templates/review_implementation.sh.template +0 -0
  39. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/templates/validate_tests.sh.template +0 -0
  40. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/utils/__init__.py +0 -0
  41. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow/utils/colors.py +0 -0
  42. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow.egg-info/dependency_links.txt +0 -0
  43. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow.egg-info/entry_points.txt +0 -0
  44. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow.egg-info/requires.txt +0 -0
  45. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/adversarial_workflow.egg-info/top_level.txt +0 -0
  46. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/setup.cfg +0 -0
  47. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/setup.py +0 -0
  48. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/tests/test_cli.py +0 -0
  49. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/tests/test_evaluator_config.py +0 -0
  50. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/tests/test_evaluator_runner.py +0 -0
  51. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/tests/test_list_evaluators.py +0 -0
  52. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/tests/test_scripts_project.py +0 -0
  53. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/tests/test_split_command.py +0 -0
  54. {adversarial_workflow-0.6.2 → adversarial_workflow-0.6.4}/tests/test_utils_validation.py +0 -0
@@ -1,7 +1,7 @@
  Metadata-Version: 2.4
  Name: adversarial-workflow
- Version: 0.6.2
- Summary: Multi-stage AI code review system preventing phantom work - Author/Evaluator pattern
+ Version: 0.6.4
+ Summary: Multi-stage AI evaluation system for task plans, code review, and test validation
  Author: Fredrik Matheson
  License: MIT
  Project-URL: Homepage, https://github.com/movito/adversarial-workflow
@@ -55,9 +55,30 @@ Evaluate proposals, sort out ideas, and prevent "phantom work" (AI claiming to i
  - 🎯 **Tool-agnostic**: Use with Claude Code, Cursor, Aider, manual coding, or any workflow
  - ✨ **Interactive onboarding**: Guided setup wizard gets you started in <5 minutes

- ## What's New in v0.6.0
+ ## What's New in v0.6.3

- 🔌 **Plugin Architecture** - Define custom evaluators without modifying the package:
+ ### Upgrade
+
+ ```bash
+ pip install --upgrade adversarial-workflow
+ ```
+
+ ### v0.6.3 - Configurable Timeouts
+
+ - **Per-evaluator timeout**: Add `timeout: 300` to evaluator YAML for slow models like Mistral Large
+ - **CLI override**: Use `--timeout 400` to override YAML config on-the-fly
+ - **Timeout logging**: See which timeout source is used (CLI/YAML/default)
+ - **Safety limits**: Maximum 600 seconds to prevent runaway processes
+
+ ### v0.6.2 - .env Loading & Stability
+
+ - **Automatic .env loading**: API keys in `.env` files are now loaded at CLI startup
+ - **Custom evaluator support**: Evaluators using `api_key_env: GEMINI_API_KEY` (or other keys) now work with `.env` files
+ - **Better diagnostics**: `adversarial check` correctly reports the number of variables loaded from `.env`
+
+ ### v0.6.0 - Plugin Architecture
+
+ 🔌 **Custom Evaluators** - Define your own evaluators without modifying the package:

  ```bash
  # Create a custom evaluator
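
Note: as a rough illustration of the v0.6.2 entry above, the sketch below shows the effect of automatic `.env` loading. The CLI imports `load_dotenv`/`dotenv_values` from python-dotenv (visible in the `cli.py` hunks later in this diff), so keys in a project-local `.env` become ordinary environment variables before evaluators run. This is not code from the package; the `.env` contents and key name are examples only.

```python
# Sketch only (assumption: illustrative, not the package's internal code).
# It mirrors the described behaviour using the same python-dotenv calls that cli.py imports.
import os

from dotenv import dotenv_values, load_dotenv

load_dotenv()  # reads ./.env (if present) into os.environ

# An evaluator configured with `api_key_env: GEMINI_API_KEY` would now find its key:
api_key = os.environ.get("GEMINI_API_KEY")

# Diagnostics in the spirit of `adversarial check` can count what was parsed from .env:
parsed = dotenv_values()  # parses .env without mutating os.environ
print(f"{len(parsed)} variable(s) in .env; GEMINI_API_KEY present: {api_key is not None}")
```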
@@ -459,6 +480,7 @@ Starting with v0.6.0, you can define project-specific evaluators without modifyi
  | `aliases` | No | Alternative command names |
  | `log_prefix` | No | CLI output prefix |
  | `fallback_model` | No | Fallback model if primary fails |
+ | `timeout` | No | Timeout in seconds (default: 180, max: 600) |
  | `version` | No | Evaluator version (default: 1.0.0) |

  ### Listing Available Evaluators
@@ -20,9 +20,30 @@ Evaluate proposals, sort out ideas, and prevent "phantom work" (AI claiming to i
  - 🎯 **Tool-agnostic**: Use with Claude Code, Cursor, Aider, manual coding, or any workflow
  - ✨ **Interactive onboarding**: Guided setup wizard gets you started in <5 minutes

- ## What's New in v0.6.0
+ ## What's New in v0.6.3

- 🔌 **Plugin Architecture** - Define custom evaluators without modifying the package:
+ ### Upgrade
+
+ ```bash
+ pip install --upgrade adversarial-workflow
+ ```
+
+ ### v0.6.3 - Configurable Timeouts
+
+ - **Per-evaluator timeout**: Add `timeout: 300` to evaluator YAML for slow models like Mistral Large
+ - **CLI override**: Use `--timeout 400` to override YAML config on-the-fly
+ - **Timeout logging**: See which timeout source is used (CLI/YAML/default)
+ - **Safety limits**: Maximum 600 seconds to prevent runaway processes
+
+ ### v0.6.2 - .env Loading & Stability
+
+ - **Automatic .env loading**: API keys in `.env` files are now loaded at CLI startup
+ - **Custom evaluator support**: Evaluators using `api_key_env: GEMINI_API_KEY` (or other keys) now work with `.env` files
+ - **Better diagnostics**: `adversarial check` correctly reports the number of variables loaded from `.env`
+
+ ### v0.6.0 - Plugin Architecture
+
+ 🔌 **Custom Evaluators** - Define your own evaluators without modifying the package:

  ```bash
  # Create a custom evaluator
@@ -424,6 +445,7 @@ Starting with v0.6.0, you can define project-specific evaluators without modifyi
  | `aliases` | No | Alternative command names |
  | `log_prefix` | No | CLI output prefix |
  | `fallback_model` | No | Fallback model if primary fails |
+ | `timeout` | No | Timeout in seconds (default: 180, max: 600) |
  | `version` | No | Evaluator version (default: 1.0.0) |

  ### Listing Available Evaluators
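
Note: the timeout rules documented in the table above (180 s default, CLI flag beats the evaluator YAML, 600 s safety cap) can be summarised in a few lines. The sketch below is only a reader's aid, not the package's implementation; the real logic appears in the `cli.py` hunks further down in this diff.

```python
# Illustrative sketch of the documented precedence and limits:
# CLI --timeout > evaluator YAML `timeout:` > 180 s default, capped at 600 s.
DEFAULT_TIMEOUT = 180
MAX_TIMEOUT = 600


def resolve_timeout(cli_timeout: int | None, yaml_timeout: int | None) -> tuple[int, str]:
    """Return (effective_timeout, source) under the documented rules."""
    if cli_timeout is not None:
        timeout, source = cli_timeout, "CLI override"
    elif yaml_timeout is not None:
        timeout, source = yaml_timeout, "evaluator config"
    else:
        timeout, source = DEFAULT_TIMEOUT, "default"
    if timeout <= 0:
        raise ValueError(f"timeout must be positive, got {timeout}")
    return min(timeout, MAX_TIMEOUT), source  # values above 600 s are clamped


assert resolve_timeout(None, None) == (180, "default")
assert resolve_timeout(None, 300) == (300, "evaluator config")  # `timeout: 300` in YAML
assert resolve_timeout(400, 300) == (400, "CLI override")       # `--timeout 400` wins
assert resolve_timeout(900, None) == (600, "CLI override")      # clamped to the safety limit
```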
@@ -12,7 +12,7 @@ Usage:
  adversarial validate "pytest"
  """

- __version__ = "0.6.2"
+ __version__ = "0.6.4"
  __author__ = "Fredrik Matheson"
  __license__ = "MIT"

@@ -1,4 +1,5 @@
  """Allow execution via python -m adversarial_workflow."""
+
  from .cli import main

  if __name__ == "__main__":
@@ -29,7 +29,7 @@ from typing import Dict, List, Optional, Tuple
  import yaml
  from dotenv import dotenv_values, load_dotenv

- __version__ = "0.6.2"
+ __version__ = "0.6.4"

  # ANSI color codes for better output
  RESET = "\033[0m"
@@ -180,7 +180,9 @@ def create_env_file_interactive(
  env_content += "# DO NOT COMMIT THIS FILE\n\n"

  if anthropic_key:
- env_content += f"# Anthropic API Key (Claude 3.5 Sonnet)\nANTHROPIC_API_KEY={anthropic_key}\n\n"
+ env_content += (
+ f"# Anthropic API Key (Claude 3.5 Sonnet)\nANTHROPIC_API_KEY={anthropic_key}\n\n"
+ )

  if openai_key:
  env_content += f"# OpenAI API Key (GPT-4o)\nOPENAI_API_KEY={openai_key}\n\n"
@@ -255,9 +257,7 @@ def init_interactive(project_path: str = ".") -> int:
  ],
  )

- anthropic_key = prompt_user(
- "Paste your Anthropic API key (or Enter to skip)", secret=True
- )
+ anthropic_key = prompt_user("Paste your Anthropic API key (or Enter to skip)", secret=True)

  if anthropic_key:
  is_valid, message = validate_api_key(anthropic_key, "anthropic")
@@ -281,9 +281,7 @@ def init_interactive(project_path: str = ".") -> int:
  ],
  )

- openai_key = prompt_user(
- "Paste your OpenAI API key (or Enter to skip)", secret=True
- )
+ openai_key = prompt_user("Paste your OpenAI API key (or Enter to skip)", secret=True)

  if openai_key:
  is_valid, message = validate_api_key(openai_key, "openai")
@@ -322,16 +320,20 @@ def init_interactive(project_path: str = ".") -> int:
  f"{GREEN}✅ Setup Complete!{RESET}",
  [
  "Created:",
- " ✓ .env (with your API keys - added to .gitignore)"
- if (anthropic_key or openai_key)
- else " ⚠️ .env (skipped - no API keys provided)",
+ (
+ " ✓ .env (with your API keys - added to .gitignore)"
+ if (anthropic_key or openai_key)
+ else " ⚠️ .env (skipped - no API keys provided)"
+ ),
  " ✓ .adversarial/config.yml",
  " ✓ .adversarial/scripts/ (3 workflow scripts)",
  " ✓ .aider.conf.yml (aider configuration)",
  "",
- "Your configuration:"
- if (anthropic_key or openai_key)
- else "Configuration (no API keys yet):",
+ (
+ "Your configuration:"
+ if (anthropic_key or openai_key)
+ else "Configuration (no API keys yet):"
+ ),
  f" Author (implementation): {'Claude 3.5 Sonnet (Anthropic)' if anthropic_key else 'GPT-4o (OpenAI)' if openai_key else 'Not configured'}",
  f" Evaluator: {'GPT-4o (OpenAI)' if openai_key else 'Claude 3.5 Sonnet (Anthropic)' if anthropic_key else 'Not configured'}",
  f" Cost per workflow: {'~$0.02-0.10' if (anthropic_key and openai_key) else '~$0.05-0.15' if (anthropic_key or openai_key) else 'N/A'}",
@@ -609,9 +611,7 @@ def init(project_path: str = ".", interactive: bool = True) -> int:
  print(" 3. Then run: adversarial init")
  print()
  print(f"{BOLD}HELP:{RESET}")
- print(
- " New to git? https://git-scm.com/book/en/v2/Getting-Started-Installing-Git"
- )
+ print(" New to git? https://git-scm.com/book/en/v2/Getting-Started-Installing-Git")
  return 1

  # Pre-flight validation: Check package integrity
@@ -645,9 +645,7 @@ def init(project_path: str = ".", interactive: bool = True) -> int:
  print(f" • {template}")
  print()
  print(f"{BOLD}FIX:{RESET}")
- print(
- " 1. Report this issue: https://github.com/movito/adversarial-workflow/issues"
- )
+ print(" 1. Report this issue: https://github.com/movito/adversarial-workflow/issues")
  print(
  " 2. Or try reinstalling: pip install --upgrade --force-reinstall adversarial-workflow"
  )
@@ -1026,13 +1024,9 @@ def check() -> int:
  else:
  status_parts = []
  if error_count > 0:
- status_parts.append(
- f"{error_count} error" + ("s" if error_count != 1 else "")
- )
+ status_parts.append(f"{error_count} error" + ("s" if error_count != 1 else ""))
  if warning_count > 0:
- status_parts.append(
- f"{warning_count} warning" + ("s" if warning_count != 1 else "")
- )
+ status_parts.append(f"{warning_count} warning" + ("s" if warning_count != 1 else ""))
  if info_count > 0:
  status_parts.append(f"{info_count} info")

@@ -1084,20 +1078,14 @@ def health(verbose: bool = False, json_output: bool = False) -> int:
  # Helper functions for tracking check results
  def check_pass(category: str, message: str, detail: str = None):
  nonlocal passed
- results[category].append(
- {"status": "pass", "message": message, "detail": detail}
- )
+ results[category].append({"status": "pass", "message": message, "detail": detail})
  if not json_output:
  print(f" {GREEN}✅{RESET} {message}")
  passed += 1

- def check_warn(
- category: str, message: str, detail: str = None, recommendation: str = None
- ):
+ def check_warn(category: str, message: str, detail: str = None, recommendation: str = None):
  nonlocal warnings
- results[category].append(
- {"status": "warn", "message": message, "detail": detail}
- )
+ results[category].append({"status": "warn", "message": message, "detail": detail})
  if not json_output:
  print(f" {YELLOW}⚠️{RESET} {message}")
  if detail and verbose:
@@ -1106,9 +1094,7 @@ def health(verbose: bool = False, json_output: bool = False) -> int:
  recommendations.append(recommendation)
  warnings += 1

- def check_fail(
- category: str, message: str, fix: str = None, recommendation: str = None
- ):
+ def check_fail(category: str, message: str, fix: str = None, recommendation: str = None):
  nonlocal errors
  results[category].append({"status": "fail", "message": message, "fix": fix})
  if not json_output:
@@ -1120,9 +1106,7 @@ def health(verbose: bool = False, json_output: bool = False) -> int:
  errors += 1

  def check_info(category: str, message: str, detail: str = None):
- results[category].append(
- {"status": "info", "message": message, "detail": detail}
- )
+ results[category].append({"status": "info", "message": message, "detail": detail})
  if not json_output:
  print(f" {CYAN}ℹ️{RESET} {message}")
  if detail and verbose:
@@ -1254,23 +1238,13 @@ def health(verbose: bool = False, json_output: bool = False) -> int:
  )
  if git_status.returncode == 0:
  modified = len(
- [
- l
- for l in git_status.stdout.splitlines()
- if l.startswith(" M")
- ]
+ [l for l in git_status.stdout.splitlines() if l.startswith(" M")]
  )
  untracked = len(
- [
- l
- for l in git_status.stdout.splitlines()
- if l.startswith("??")
- ]
+ [l for l in git_status.stdout.splitlines() if l.startswith("??")]
  )
  if modified == 0 and untracked == 0:
- check_pass(
- "dependencies", f"Git: {version} (working tree clean)"
- )
+ check_pass("dependencies", f"Git: {version} (working tree clean)")
  else:
  check_info(
  "dependencies",
@@ -1307,11 +1281,7 @@ def health(verbose: bool = False, json_output: bool = False) -> int:
  aider_version = subprocess.run(
  ["aider", "--version"], capture_output=True, text=True, timeout=2
  )
- version = (
- aider_version.stdout.strip()
- if aider_version.returncode == 0
- else "unknown"
- )
+ version = aider_version.stdout.strip() if aider_version.returncode == 0 else "unknown"
  check_pass("dependencies", f"Aider: {version} (functional)")
  except:
  check_pass("dependencies", "Aider: installed")
@@ -1455,9 +1425,7 @@ def health(verbose: bool = False, json_output: bool = False) -> int:
  json.load(f)
  check_pass("agent_coordination", "current-state.json - Valid JSON")
  except json.JSONDecodeError as e:
- check_fail(
- "agent_coordination", f"current-state.json - Invalid JSON: {e}"
- )
+ check_fail("agent_coordination", f"current-state.json - Invalid JSON: {e}")
  else:
  check_info("agent_coordination", "current-state.json not found (optional)")

@@ -1501,9 +1469,7 @@ def health(verbose: bool = False, json_output: bool = False) -> int:
  with open(script_path) as f:
  content = f.read()
  if "#!/bin/bash" in content or "#!/usr/bin/env bash" in content:
- check_pass(
- "workflow_scripts", f"{script_name} - Executable, valid"
- )
+ check_pass("workflow_scripts", f"{script_name} - Executable, valid")
  else:
  check_warn(
  "workflow_scripts",
@@ -1777,9 +1743,7 @@ def verify_token_count(task_file: str, log_file: str) -> None:
  f" Difference: {expected_tokens - actual_tokens:,} tokens ({100 - int(actual_tokens/expected_tokens*100)}% less)"
  )
  print()
- print(
- f"{BOLD}Note:{RESET} Large files may not be fully processed by evaluator."
- )
+ print(f"{BOLD}Note:{RESET} Large files may not be fully processed by evaluator.")
  print(f" Consider splitting into smaller documents (<1,000 lines).")
  print()

@@ -1960,9 +1924,7 @@ def evaluate(task_file: str) -> int:
  print(f"{RED}❌ ERROR: OpenAI rate limit exceeded{RESET}")
  print()
  print(f"{BOLD}WHY:{RESET}")
- print(
- " Your task file is too large for your OpenAI organization's rate limit"
- )
+ print(" Your task file is too large for your OpenAI organization's rate limit")
  print()

  # Extract file size for helpful message
@@ -2009,9 +1971,7 @@ def evaluate(task_file: str) -> int:
  print()
  print(f"{BOLD}FIX:{RESET}")
  print(" Option 1 (RECOMMENDED): Use WSL (Windows Subsystem for Linux)")
- print(
- " 1. Install WSL: https://learn.microsoft.com/windows/wsl/install"
- )
+ print(" 1. Install WSL: https://learn.microsoft.com/windows/wsl/install")
  print(" 2. Open WSL terminal")
  print(" 3. Reinstall package in WSL: pip install adversarial-workflow")
  print()
@@ -2182,9 +2142,7 @@ def validate(test_command: Optional[str] = None) -> int:
  return 1

  try:
- result = subprocess.run(
- [script, test_command], timeout=600
- ) # 10 minutes for tests
+ result = subprocess.run([script, test_command], timeout=600) # 10 minutes for tests
  except subprocess.TimeoutExpired:
  print(f"{RED}❌ ERROR: Test validation timed out (>10 minutes){RESET}")
  return 1
@@ -2237,9 +2195,7 @@ def select_agent_template() -> Dict[str, str]:
  elif choice == "3":
  print()
  print(f"{CYAN}Custom Template URL:{RESET}")
- print(
- " Example: https://raw.githubusercontent.com/user/repo/main/agent-handoffs.json"
- )
+ print(" Example: https://raw.githubusercontent.com/user/repo/main/agent-handoffs.json")
  print()
  url = prompt_user("Template URL")
  if url:
@@ -2279,9 +2235,7 @@ def fetch_agent_template(url: str, template_type: str = "standard") -> Optional[
  with open(template_path, "r") as f:
  return f.read()
  except Exception as e:
- print(
- f"{RED}❌ ERROR: Could not read {template_type} template: {e}{RESET}"
- )
+ print(f"{RED}❌ ERROR: Could not read {template_type} template: {e}{RESET}")
  return None
  else:
  print(f"{RED}❌ ERROR: {template_type} template not found in package{RESET}")
@@ -2384,9 +2338,11 @@ def agent_onboard(project_path: str = ".") -> int:
  return 0

  # 3. Interactive questions (4 max)
- use_delegation = prompt_user(
- "Use delegation/tasks/ structure? (recommended)", "Y"
- ).lower() in ["y", "yes", ""]
+ use_delegation = prompt_user("Use delegation/tasks/ structure? (recommended)", "Y").lower() in [
+ "y",
+ "yes",
+ "",
+ ]

  organize_docs = prompt_user("Organize root docs into docs/?", "n").lower() in [
  "y",
@@ -2463,9 +2419,7 @@ def agent_onboard(project_path: str = ".") -> int:
  print(
  f" {CYAN}ℹ️{RESET} Original tasks/ preserved (remove manually if desired)"
  )
- print(
- f" {CYAN}ℹ️{RESET} Rollback: rm -rf tasks && mv tasks.backup tasks"
- )
+ print(f" {CYAN}ℹ️{RESET} Rollback: rm -rf tasks && mv tasks.backup tasks")

  except Exception as e:
  print(f" {RED}❌{RESET} Migration failed: {e}")
@@ -2479,9 +2433,7 @@ def agent_onboard(project_path: str = ".") -> int:
  print(f"{BOLD}Documentation Organization:{RESET}")

  # Find markdown files in root
- root_docs = [
- f for f in os.listdir(".") if f.endswith(".md") and not f.startswith(".")
- ]
+ root_docs = [f for f in os.listdir(".") if f.endswith(".md") and not f.startswith(".")]

  if len(root_docs) > 0:
  print(f" Found {len(root_docs)} markdown file(s) in root")
@@ -2501,9 +2453,7 @@ def agent_onboard(project_path: str = ".") -> int:
  moved_count += 1

  if moved_count > 0:
- print(
- f" {GREEN}✅{RESET} Organized {moved_count} doc(s) into docs/"
- )
+ print(f" {GREEN}✅{RESET} Organized {moved_count} doc(s) into docs/")
  else:
  print(f" {CYAN}ℹ️{RESET} No docs needed organizing")

@@ -2556,9 +2506,7 @@ def agent_onboard(project_path: str = ".") -> int:
  print(f" {RED}❌{RESET} Failed to fetch agent template")
  return 1
  else:
- print(
- f" {CYAN}ℹ️{RESET} Skipped agent-handoffs.json (manual setup requested)"
- )
+ print(f" {CYAN}ℹ️{RESET} Skipped agent-handoffs.json (manual setup requested)")

  # Render current-state.json
  current_state_template = templates_dir / "current-state.json.template"
@@ -2573,9 +2521,7 @@ def agent_onboard(project_path: str = ".") -> int:
  # Render README.md
  readme_template = templates_dir / "README.md.template"
  if readme_template.exists():
- render_template(
- str(readme_template), ".agent-context/README.md", template_vars
- )
+ render_template(str(readme_template), ".agent-context/README.md", template_vars)
  print(f" {GREEN}✅{RESET} Created .agent-context/README.md")

  # Copy AGENT-SYSTEM-GUIDE.md if it exists and isn't already there
@@ -2614,9 +2560,7 @@ def agent_onboard(project_path: str = ".") -> int:

  except Exception as e:
  print(f" {YELLOW}⚠️{RESET} Could not update config: {e}")
- print(
- f" Manually set task_directory: delegation/tasks/ in .adversarial/config.yml"
- )
+ print(f" Manually set task_directory: delegation/tasks/ in .adversarial/config.yml")

  # 9. Update .gitignore
  print()
@@ -2670,9 +2614,7 @@ def agent_onboard(project_path: str = ".") -> int:
  verification_checks.append((f"current-state.json invalid: {e}", False))

  # Check directories exist
- verification_checks.append(
- (".agent-context/ exists", os.path.exists(".agent-context"))
- )
+ verification_checks.append((".agent-context/ exists", os.path.exists(".agent-context")))

  if use_delegation:
  verification_checks.append(
@@ -2777,9 +2719,7 @@ def split(

  # Check if splitting is recommended
  if lines <= max_lines:
- print(
- f"{GREEN}✅ File is under recommended limit ({max_lines} lines){RESET}"
- )
+ print(f"{GREEN}✅ File is under recommended limit ({max_lines} lines){RESET}")
  print("No splitting needed.")
  return 0

@@ -2797,9 +2737,7 @@ def split(
  splits = split_by_phases(content)
  print(f"\n💡 Suggested splits (by phases):")
  else:
- print(
- f"{RED}Error: Unknown strategy '{strategy}'. Use 'sections' or 'phases'.{RESET}"
- )
+ print(f"{RED}Error: Unknown strategy '{strategy}'. Use 'sections' or 'phases'.{RESET}")
  return 1

  # Display split preview
@@ -2971,26 +2909,18 @@ For more information: https://github.com/movito/adversarial-workflow
  subparsers.add_parser("doctor", help="Alias for 'check'")

  # health command
- health_parser = subparsers.add_parser(
- "health", help="Comprehensive system health check"
- )
+ health_parser = subparsers.add_parser("health", help="Comprehensive system health check")
  health_parser.add_argument(
  "--verbose", "-v", action="store_true", help="Show detailed diagnostics"
  )
- health_parser.add_argument(
- "--json", action="store_true", help="Output in JSON format"
- )
+ health_parser.add_argument("--json", action="store_true", help="Output in JSON format")

  # agent command (with subcommands)
  agent_parser = subparsers.add_parser("agent", help="Agent coordination commands")
- agent_subparsers = agent_parser.add_subparsers(
- dest="agent_subcommand", help="Agent subcommand"
- )
+ agent_subparsers = agent_parser.add_subparsers(dest="agent_subcommand", help="Agent subcommand")

  # agent onboard subcommand
- onboard_parser = agent_subparsers.add_parser(
- "onboard", help="Set up agent coordination system"
- )
+ onboard_parser = agent_subparsers.add_parser("onboard", help="Set up agent coordination system")
  onboard_parser.add_argument(
  "--path", default=".", help="Project path (default: current directory)"
  )
@@ -2999,12 +2929,8 @@ For more information: https://github.com/movito/adversarial-workflow
  subparsers.add_parser("review", help="Run Phase 3: Code review")

  # validate command
- validate_parser = subparsers.add_parser(
- "validate", help="Run Phase 4: Test validation"
- )
- validate_parser.add_argument(
- "test_command", nargs="?", help="Test command to run (optional)"
- )
+ validate_parser = subparsers.add_parser("validate", help="Run Phase 4: Test validation")
+ validate_parser.add_argument("test_command", nargs="?", help="Test command to run (optional)")

  # split command
  split_parser = subparsers.add_parser(
@@ -3050,9 +2976,7 @@ For more information: https://github.com/movito/adversarial-workflow
  # Only warn for user-defined evaluators, not built-ins
  # Built-in conflicts are intentional (e.g., 'review' command vs 'review' evaluator)
  if getattr(config, "source", None) != "builtin":
- logger.warning(
- "Evaluator '%s' conflicts with CLI command; skipping", name
- )
+ logger.warning("Evaluator '%s' conflicts with CLI command; skipping", name)
  # Mark as registered to prevent alias re-registration attempts
  registered_configs.add(id(config))
  continue
@@ -3082,8 +3006,8 @@ For more information: https://github.com/movito/adversarial-workflow
  "--timeout",
  "-t",
  type=int,
- default=180,
- help="Timeout in seconds (default: 180)",
+ default=None,
+ help="Timeout in seconds (default: from evaluator config or 180, max: 600)",
  )
  # Store config for later execution
  eval_parser.set_defaults(evaluator_config=config)
@@ -3096,10 +3020,34 @@ For more information: https://github.com/movito/adversarial-workflow

  # Check for evaluator command first (has evaluator_config attribute)
  if hasattr(args, "evaluator_config"):
+ # Determine timeout: CLI flag > YAML config > default (180s)
+ if args.timeout is not None:
+ timeout = args.timeout
+ source = "CLI override"
+ elif args.evaluator_config.timeout != 180:
+ timeout = args.evaluator_config.timeout
+ source = "evaluator config"
+ else:
+ timeout = args.evaluator_config.timeout # 180 (default)
+ source = "default"
+
+ # Validate CLI timeout (consistent with YAML validation)
+ if timeout <= 0:
+ print(f"{RED}Error: Timeout must be positive (> 0), got {timeout}{RESET}")
+ return 1
+ if timeout > 600:
+ print(
+ f"{YELLOW}Warning: Timeout {timeout}s exceeds maximum (600s), clamping to 600s{RESET}"
+ )
+ timeout = 600
+
+ # Log actual timeout and source
+ print(f"Using timeout: {timeout}s ({source})")
+
  return run_evaluator(
  args.evaluator_config,
  args.file,
- timeout=args.timeout,
+ timeout=timeout,
  )

  # Execute static commands
@@ -26,6 +26,7 @@ class EvaluatorConfig:
  fallback_model: Fallback model if primary fails
  aliases: Alternative command names
  version: Evaluator version
+ timeout: Timeout in seconds (default: 180, max: 600)
  source: "builtin" or "local" (set internally)
  config_file: Path to YAML file if local (set internally)
  """
@@ -43,6 +44,7 @@ class EvaluatorConfig:
  fallback_model: str | None = None
  aliases: list[str] = field(default_factory=list)
  version: str = "1.0.0"
+ timeout: int = 180 # Timeout in seconds (default: 180, max: 600)

  # Metadata (set internally during discovery, not from YAML)
  source: str = "builtin"
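
Note: for context on the new dataclass field above, a local evaluator YAML that omits `timeout` keeps the 180-second default, while `timeout: 300` overrides it per evaluator. The sketch below illustrates only that mapping with a trimmed, hypothetical stand-in for `EvaluatorConfig`; the real class in `adversarial_workflow.evaluators.config` has more fields than are visible in this diff.

```python
# Hypothetical, trimmed stand-in used only to illustrate the `timeout` default;
# not the package's EvaluatorConfig.
from dataclasses import dataclass

import yaml


@dataclass
class TimeoutOnlyConfig:
    timeout: int = 180  # seconds; the CLI caps effective values at 600


with_timeout = yaml.safe_load("timeout: 300\n") or {}
assert TimeoutOnlyConfig(**with_timeout).timeout == 300  # explicit per-evaluator value

without_timeout = yaml.safe_load("{}") or {}
assert TimeoutOnlyConfig(**without_timeout).timeout == 180  # key omitted -> 180 s default
```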