agent-devkit 0.1.6 → 0.2.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +13 -1
- package/package.json +1 -1
- package/runtime/README.md +53 -1
- package/runtime/agent +5 -0
- package/runtime/agents/README.md +26 -0
- package/runtime/agents/agent-devkit-agent-builder/AGENTS.md +24 -0
- package/runtime/agents/agent-devkit-agent-builder/README.md +37 -0
- package/runtime/agents/agent-devkit-agent-builder/agent.yaml +46 -0
- package/runtime/agents/agent-devkit-agent-builder/capabilities/plan-agent/capability.yaml +29 -0
- package/runtime/agents/agent-devkit-agent-builder/capabilities/plan-agent/decision-rules.md +7 -0
- package/runtime/agents/agent-devkit-agent-builder/capabilities/plan-agent/runner.py +33 -0
- package/runtime/agents/agent-devkit-agent-builder/capabilities/plan-agent/workflow.md +8 -0
- package/runtime/agents/agent-devkit-agent-builder/capabilities/scaffold-agent/capability.yaml +31 -0
- package/runtime/agents/agent-devkit-agent-builder/capabilities/scaffold-agent/decision-rules.md +9 -0
- package/runtime/agents/agent-devkit-agent-builder/capabilities/scaffold-agent/runner.py +39 -0
- package/runtime/agents/agent-devkit-agent-builder/capabilities/scaffold-agent/workflow.md +8 -0
- package/runtime/agents/agent-devkit-agent-builder/capabilities/validate-agent-contract/capability.yaml +28 -0
- package/runtime/agents/agent-devkit-agent-builder/capabilities/validate-agent-contract/decision-rules.md +6 -0
- package/runtime/agents/agent-devkit-agent-builder/capabilities/validate-agent-contract/runner.py +33 -0
- package/runtime/agents/agent-devkit-agent-builder/capabilities/validate-agent-contract/workflow.md +7 -0
- package/runtime/agents/agent-devkit-agent-builder/infra/integrations/agent-devkit/agent_builder_repository.py +527 -0
- package/runtime/agents/agent-devkit-agent-builder/knowledge/context.md +15 -0
- package/runtime/agents/agent-devkit-agent-builder/knowledge/policies.yaml +11 -0
- package/runtime/agents/agent-devkit-agent-builder/knowledge/system.md +11 -0
- package/runtime/agents/agent-devkit-agent-builder/templates/agent-plan-output.md +20 -0
- package/runtime/agents/agent-devkit-agent-builder/templates/scaffold-plan-output.md +13 -0
- package/runtime/agents/agent-devkit-agent-builder/templates/validation-report-output.md +13 -0
- package/runtime/agents/agent-devkit-agent-builder/tests/test_runners.py +188 -0
- package/runtime/agents/automation-architect/AGENTS.md +11 -0
- package/runtime/agents/automation-architect/README.md +27 -0
- package/runtime/agents/automation-architect/agent.yaml +57 -0
- package/runtime/agents/automation-architect/capabilities/classify-automation-request/capability.yaml +35 -0
- package/runtime/agents/automation-architect/capabilities/classify-automation-request/decision-rules.md +10 -0
- package/runtime/agents/automation-architect/capabilities/classify-automation-request/runner.py +37 -0
- package/runtime/agents/automation-architect/capabilities/classify-automation-request/workflow.md +7 -0
- package/runtime/agents/automation-architect/capabilities/delegate-automation-build/capability.yaml +34 -0
- package/runtime/agents/automation-architect/capabilities/delegate-automation-build/decision-rules.md +7 -0
- package/runtime/agents/automation-architect/capabilities/delegate-automation-build/runner.py +37 -0
- package/runtime/agents/automation-architect/capabilities/delegate-automation-build/workflow.md +6 -0
- package/runtime/agents/automation-architect/capabilities/plan-automation-solution/capability.yaml +35 -0
- package/runtime/agents/automation-architect/capabilities/plan-automation-solution/decision-rules.md +7 -0
- package/runtime/agents/automation-architect/capabilities/plan-automation-solution/runner.py +37 -0
- package/runtime/agents/automation-architect/capabilities/plan-automation-solution/workflow.md +7 -0
- package/runtime/agents/automation-architect/capabilities/review-automation-solution/capability.yaml +36 -0
- package/runtime/agents/automation-architect/capabilities/review-automation-solution/decision-rules.md +7 -0
- package/runtime/agents/automation-architect/capabilities/review-automation-solution/runner.py +39 -0
- package/runtime/agents/automation-architect/capabilities/review-automation-solution/workflow.md +7 -0
- package/runtime/agents/automation-architect/infra/integrations/automation-architecture/automation_architecture_repository.py +481 -0
- package/runtime/agents/automation-architect/knowledge/context.md +22 -0
- package/runtime/agents/automation-architect/knowledge/policies.yaml +20 -0
- package/runtime/agents/automation-architect/knowledge/system.md +8 -0
- package/runtime/agents/automation-architect/templates/automation-classification.md +6 -0
- package/runtime/agents/automation-architect/templates/automation-plan.md +5 -0
- package/runtime/agents/automation-architect/tests/test_runners.py +135 -0
- package/runtime/agents/aws-architecture-analyst/agent.yaml +17 -4
- package/runtime/agents/aws-cloudwatch-log-analyzer/agent.yaml +12 -2
- package/runtime/agents/aws-cloudwatch-log-analyzer/capabilities/analyze-service-error/capability.yaml +16 -0
- package/runtime/agents/aws-lambda-builder/AGENTS.md +27 -0
- package/runtime/agents/aws-lambda-builder/README.md +21 -0
- package/runtime/agents/aws-lambda-builder/agent.yaml +46 -0
- package/runtime/agents/aws-lambda-builder/capabilities/deploy-lambda-plan/capability.yaml +18 -0
- package/runtime/agents/aws-lambda-builder/capabilities/deploy-lambda-plan/decision-rules.md +6 -0
- package/runtime/agents/aws-lambda-builder/capabilities/deploy-lambda-plan/runner.py +33 -0
- package/runtime/agents/aws-lambda-builder/capabilities/deploy-lambda-plan/workflow.md +6 -0
- package/runtime/agents/aws-lambda-builder/capabilities/generate-lambda-project/capability.yaml +20 -0
- package/runtime/agents/aws-lambda-builder/capabilities/generate-lambda-project/decision-rules.md +6 -0
- package/runtime/agents/aws-lambda-builder/capabilities/generate-lambda-project/runner.py +39 -0
- package/runtime/agents/aws-lambda-builder/capabilities/generate-lambda-project/workflow.md +7 -0
- package/runtime/agents/aws-lambda-builder/capabilities/package-lambda/capability.yaml +22 -0
- package/runtime/agents/aws-lambda-builder/capabilities/package-lambda/decision-rules.md +6 -0
- package/runtime/agents/aws-lambda-builder/capabilities/package-lambda/runner.py +41 -0
- package/runtime/agents/aws-lambda-builder/capabilities/package-lambda/workflow.md +6 -0
- package/runtime/agents/aws-lambda-builder/capabilities/plan-lambda/capability.yaml +18 -0
- package/runtime/agents/aws-lambda-builder/capabilities/plan-lambda/decision-rules.md +7 -0
- package/runtime/agents/aws-lambda-builder/capabilities/plan-lambda/runner.py +33 -0
- package/runtime/agents/aws-lambda-builder/capabilities/plan-lambda/workflow.md +6 -0
- package/runtime/agents/aws-lambda-builder/capabilities/review-lambda-security/capability.yaml +18 -0
- package/runtime/agents/aws-lambda-builder/capabilities/review-lambda-security/decision-rules.md +7 -0
- package/runtime/agents/aws-lambda-builder/capabilities/review-lambda-security/runner.py +33 -0
- package/runtime/agents/aws-lambda-builder/capabilities/review-lambda-security/workflow.md +5 -0
- package/runtime/agents/aws-lambda-builder/infra/integrations/aws-lambda/aws_lambda_repository.py +688 -0
- package/runtime/agents/aws-lambda-builder/knowledge/context.md +12 -0
- package/runtime/agents/aws-lambda-builder/knowledge/policies.yaml +23 -0
- package/runtime/agents/aws-lambda-builder/knowledge/system.md +10 -0
- package/runtime/agents/aws-lambda-builder/templates/lambda-deploy-plan.md +3 -0
- package/runtime/agents/aws-lambda-builder/templates/lambda-package.md +3 -0
- package/runtime/agents/aws-lambda-builder/templates/lambda-plan.md +3 -0
- package/runtime/agents/aws-lambda-builder/templates/lambda-readme.md +3 -0
- package/runtime/agents/aws-lambda-builder/templates/lambda-security-review.md +3 -0
- package/runtime/agents/aws-lambda-builder/tests/test_runners.py +355 -0
- package/runtime/agents/aws-operations-operator/agent.yaml +18 -6
- package/runtime/agents/aws-security-governance-auditor/agent.yaml +17 -5
- package/runtime/agents/azure-devops-orchestrator/agent.yaml +15 -2
- package/runtime/agents/azure-devops-orchestrator/capabilities/read-card/capability.yaml +29 -0
- package/runtime/agents/bpo-analyser/agent.yaml +12 -2
- package/runtime/agents/bpo-analyser/knowledge/policies.yaml +2 -2
- package/runtime/agents/data-scientist-analyst/agent.yaml +16 -4
- package/runtime/agents/data-scientist-analyst/capabilities/generate-data-report/capability.yaml +1 -1
- package/runtime/agents/data-scientist-analyst/capabilities/generate-reconciliation-report/capability.yaml +1 -1
- package/runtime/agents/data-scientist-analyst/capabilities/run-data-pipeline/capability.yaml +1 -1
- package/runtime/agents/data-scientist-analyst/infra/integrations/agent-bridge/methods/analyze-sql-source.yaml +1 -1
- package/runtime/agents/data-scientist-analyst/knowledge/policies.yaml +4 -4
- package/runtime/agents/data-scientist-analyst/knowledge/system.md +1 -1
- package/runtime/agents/data-scientist-analyst/tests/test_runners.py +1 -1
- package/runtime/agents/database-change-operator/agent.yaml +12 -1
- package/runtime/agents/docker-container-builder/AGENTS.md +27 -0
- package/runtime/agents/docker-container-builder/README.md +21 -0
- package/runtime/agents/docker-container-builder/agent.yaml +52 -0
- package/runtime/agents/docker-container-builder/capabilities/analyze-containerization-target/capability.yaml +18 -0
- package/runtime/agents/docker-container-builder/capabilities/analyze-containerization-target/decision-rules.md +6 -0
- package/runtime/agents/docker-container-builder/capabilities/analyze-containerization-target/runner.py +32 -0
- package/runtime/agents/docker-container-builder/capabilities/analyze-containerization-target/workflow.md +6 -0
- package/runtime/agents/docker-container-builder/capabilities/generate-compose/capability.yaml +18 -0
- package/runtime/agents/docker-container-builder/capabilities/generate-compose/decision-rules.md +7 -0
- package/runtime/agents/docker-container-builder/capabilities/generate-compose/runner.py +32 -0
- package/runtime/agents/docker-container-builder/capabilities/generate-compose/workflow.md +6 -0
- package/runtime/agents/docker-container-builder/capabilities/generate-container-project-files/capability.yaml +20 -0
- package/runtime/agents/docker-container-builder/capabilities/generate-container-project-files/decision-rules.md +7 -0
- package/runtime/agents/docker-container-builder/capabilities/generate-container-project-files/runner.py +38 -0
- package/runtime/agents/docker-container-builder/capabilities/generate-container-project-files/workflow.md +7 -0
- package/runtime/agents/docker-container-builder/capabilities/generate-dockerfile/capability.yaml +18 -0
- package/runtime/agents/docker-container-builder/capabilities/generate-dockerfile/decision-rules.md +6 -0
- package/runtime/agents/docker-container-builder/capabilities/generate-dockerfile/runner.py +32 -0
- package/runtime/agents/docker-container-builder/capabilities/generate-dockerfile/workflow.md +7 -0
- package/runtime/agents/docker-container-builder/capabilities/plan-image-build/capability.yaml +18 -0
- package/runtime/agents/docker-container-builder/capabilities/plan-image-build/decision-rules.md +6 -0
- package/runtime/agents/docker-container-builder/capabilities/plan-image-build/runner.py +32 -0
- package/runtime/agents/docker-container-builder/capabilities/plan-image-build/workflow.md +6 -0
- package/runtime/agents/docker-container-builder/capabilities/review-docker-security/capability.yaml +21 -0
- package/runtime/agents/docker-container-builder/capabilities/review-docker-security/decision-rules.md +6 -0
- package/runtime/agents/docker-container-builder/capabilities/review-docker-security/runner.py +43 -0
- package/runtime/agents/docker-container-builder/capabilities/review-docker-security/workflow.md +5 -0
- package/runtime/agents/docker-container-builder/infra/integrations/docker-container/docker_container_repository.py +837 -0
- package/runtime/agents/docker-container-builder/knowledge/context.md +21 -0
- package/runtime/agents/docker-container-builder/knowledge/policies.yaml +13 -0
- package/runtime/agents/docker-container-builder/knowledge/system.md +21 -0
- package/runtime/agents/docker-container-builder/templates/container-plan.md +4 -0
- package/runtime/agents/docker-container-builder/templates/container-review.md +4 -0
- package/runtime/agents/docker-container-builder/templates/docker-compose.md +5 -0
- package/runtime/agents/docker-container-builder/templates/docker-readme.md +3 -0
- package/runtime/agents/docker-container-builder/templates/dockerfile.md +5 -0
- package/runtime/agents/docker-container-builder/tests/test_runners.py +255 -0
- package/runtime/agents/drawio-diagram-builder/agent.yaml +11 -2
- package/runtime/agents/drawio-diagram-builder/capabilities/execute-diagram-delivery/capability.yaml +1 -1
- package/runtime/agents/drawio-diagram-builder/capabilities/read-azure-card-context/capability.yaml +1 -1
- package/runtime/agents/elasticsearch-log-analyzer/agent.yaml +14 -2
- package/runtime/agents/elasticsearch-log-analyzer/capabilities/analyze-service-errors/capability.yaml +14 -0
- package/runtime/agents/excel-workbook-builder/agent.yaml +10 -0
- package/runtime/agents/excel-workbook-builder/capabilities/create-template/capability.yaml +1 -1
- package/runtime/agents/excel-workbook-builder/capabilities/create-template/workflow.md +1 -1
- package/runtime/agents/excel-workbook-builder/capabilities/create-template-version/capability.yaml +1 -1
- package/runtime/agents/excel-workbook-builder/capabilities/generate-template-input-file/capability.yaml +1 -2
- package/runtime/agents/excel-workbook-builder/capabilities/refine-template/capability.yaml +1 -1
- package/runtime/agents/excel-workbook-builder/capabilities/register-template/capability.yaml +1 -2
- package/runtime/agents/excel-workbook-builder/capabilities/register-template/workflow.md +1 -1
- package/runtime/agents/execution-loop-builder/AGENTS.md +24 -0
- package/runtime/agents/execution-loop-builder/README.md +19 -0
- package/runtime/agents/execution-loop-builder/agent.yaml +49 -0
- package/runtime/agents/execution-loop-builder/capabilities/generate-loop-project-files/capability.yaml +20 -0
- package/runtime/agents/execution-loop-builder/capabilities/generate-loop-project-files/decision-rules.md +6 -0
- package/runtime/agents/execution-loop-builder/capabilities/generate-loop-project-files/runner.py +38 -0
- package/runtime/agents/execution-loop-builder/capabilities/generate-loop-project-files/workflow.md +7 -0
- package/runtime/agents/execution-loop-builder/capabilities/generate-loop-runner/capability.yaml +18 -0
- package/runtime/agents/execution-loop-builder/capabilities/generate-loop-runner/decision-rules.md +5 -0
- package/runtime/agents/execution-loop-builder/capabilities/generate-loop-runner/runner.py +32 -0
- package/runtime/agents/execution-loop-builder/capabilities/generate-loop-runner/workflow.md +6 -0
- package/runtime/agents/execution-loop-builder/capabilities/plan-execution-loop/capability.yaml +18 -0
- package/runtime/agents/execution-loop-builder/capabilities/plan-execution-loop/decision-rules.md +6 -0
- package/runtime/agents/execution-loop-builder/capabilities/plan-execution-loop/runner.py +32 -0
- package/runtime/agents/execution-loop-builder/capabilities/plan-execution-loop/workflow.md +6 -0
- package/runtime/agents/execution-loop-builder/capabilities/register-loop-task/capability.yaml +19 -0
- package/runtime/agents/execution-loop-builder/capabilities/register-loop-task/decision-rules.md +6 -0
- package/runtime/agents/execution-loop-builder/capabilities/register-loop-task/runner.py +36 -0
- package/runtime/agents/execution-loop-builder/capabilities/register-loop-task/workflow.md +6 -0
- package/runtime/agents/execution-loop-builder/capabilities/review-loop-safety/capability.yaml +19 -0
- package/runtime/agents/execution-loop-builder/capabilities/review-loop-safety/decision-rules.md +6 -0
- package/runtime/agents/execution-loop-builder/capabilities/review-loop-safety/runner.py +39 -0
- package/runtime/agents/execution-loop-builder/capabilities/review-loop-safety/workflow.md +5 -0
- package/runtime/agents/execution-loop-builder/infra/integrations/execution-loop/execution_loop_repository.py +608 -0
- package/runtime/agents/execution-loop-builder/knowledge/context.md +26 -0
- package/runtime/agents/execution-loop-builder/knowledge/policies.yaml +13 -0
- package/runtime/agents/execution-loop-builder/knowledge/system.md +19 -0
- package/runtime/agents/execution-loop-builder/templates/loop-plan.md +3 -0
- package/runtime/agents/execution-loop-builder/templates/loop-readme.md +3 -0
- package/runtime/agents/execution-loop-builder/templates/loop-review.md +3 -0
- package/runtime/agents/execution-loop-builder/templates/loop-runner.py +2 -0
- package/runtime/agents/execution-loop-builder/tests/test_runners.py +274 -0
- package/runtime/agents/execution-reviewer/agent.yaml +6 -4
- package/runtime/agents/execution-reviewer/capabilities/review-agent-result/capability.yaml +1 -2
- package/runtime/agents/execution-reviewer/capabilities/review-final-output/capability.yaml +1 -2
- package/runtime/agents/execution-reviewer/capabilities/review-plan/capability.yaml +1 -2
- package/runtime/agents/figma-ui-ux-product-designer/agent.yaml +17 -5
- package/runtime/agents/figma-ui-ux-product-designer/capabilities/analyze-product-context/capability.yaml +1 -1
- package/runtime/agents/figma-ui-ux-product-designer/capabilities/conduct-design-interview/capability.yaml +1 -1
- package/runtime/agents/figma-ui-ux-product-designer/capabilities/conduct-design-review-session/capability.yaml +1 -1
- package/runtime/agents/figma-ui-ux-product-designer/capabilities/generate-dev-handoff/capability.yaml +1 -1
- package/runtime/agents/figma-ui-ux-product-designer/capabilities/generate-user-journey-diagram/capability.yaml +1 -1
- package/runtime/agents/figma-ui-ux-product-designer/capabilities/ingest-design-source/capability.yaml +1 -1
- package/runtime/agents/figma-ui-ux-product-designer/capabilities/triage-design-feedback/capability.yaml +1 -1
- package/runtime/agents/generic-agent-builder/AGENTS.md +20 -0
- package/runtime/agents/generic-agent-builder/README.md +40 -0
- package/runtime/agents/generic-agent-builder/agent.yaml +43 -0
- package/runtime/agents/generic-agent-builder/capabilities/generate-agent-instructions/capability.yaml +18 -0
- package/runtime/agents/generic-agent-builder/capabilities/generate-agent-instructions/decision-rules.md +5 -0
- package/runtime/agents/generic-agent-builder/capabilities/generate-agent-instructions/runner.py +33 -0
- package/runtime/agents/generic-agent-builder/capabilities/generate-agent-instructions/workflow.md +6 -0
- package/runtime/agents/generic-agent-builder/capabilities/generate-project-agent-files/capability.yaml +20 -0
- package/runtime/agents/generic-agent-builder/capabilities/generate-project-agent-files/decision-rules.md +6 -0
- package/runtime/agents/generic-agent-builder/capabilities/generate-project-agent-files/runner.py +39 -0
- package/runtime/agents/generic-agent-builder/capabilities/generate-project-agent-files/workflow.md +7 -0
- package/runtime/agents/generic-agent-builder/capabilities/generate-skill/capability.yaml +18 -0
- package/runtime/agents/generic-agent-builder/capabilities/generate-skill/decision-rules.md +5 -0
- package/runtime/agents/generic-agent-builder/capabilities/generate-skill/runner.py +33 -0
- package/runtime/agents/generic-agent-builder/capabilities/generate-skill/workflow.md +5 -0
- package/runtime/agents/generic-agent-builder/capabilities/plan-generic-agent/capability.yaml +18 -0
- package/runtime/agents/generic-agent-builder/capabilities/plan-generic-agent/decision-rules.md +6 -0
- package/runtime/agents/generic-agent-builder/capabilities/plan-generic-agent/runner.py +33 -0
- package/runtime/agents/generic-agent-builder/capabilities/plan-generic-agent/workflow.md +6 -0
- package/runtime/agents/generic-agent-builder/capabilities/review-generic-agent/capability.yaml +20 -0
- package/runtime/agents/generic-agent-builder/capabilities/review-generic-agent/decision-rules.md +6 -0
- package/runtime/agents/generic-agent-builder/capabilities/review-generic-agent/runner.py +40 -0
- package/runtime/agents/generic-agent-builder/capabilities/review-generic-agent/workflow.md +7 -0
- package/runtime/agents/generic-agent-builder/infra/integrations/generic-agent/generic_agent_repository.py +445 -0
- package/runtime/agents/generic-agent-builder/knowledge/context.md +11 -0
- package/runtime/agents/generic-agent-builder/knowledge/policies.yaml +12 -0
- package/runtime/agents/generic-agent-builder/knowledge/system.md +17 -0
- package/runtime/agents/generic-agent-builder/templates/generic-agent-instructions.md +17 -0
- package/runtime/agents/generic-agent-builder/templates/generic-review-report.md +13 -0
- package/runtime/agents/generic-agent-builder/templates/generic-skill.md +14 -0
- package/runtime/agents/generic-agent-builder/tests/test_runners.py +220 -0
- package/runtime/agents/github-pr-reviewer/agent.yaml +17 -5
- package/runtime/agents/github-pr-reviewer/capabilities/create-review-automation/capability.yaml +1 -1
- package/runtime/agents/github-pr-reviewer/capabilities/inspect-pr/capability.yaml +1 -1
- package/runtime/agents/github-pr-reviewer/capabilities/list-review-requests/capability.yaml +1 -1
- package/runtime/agents/github-pr-reviewer/capabilities/review-pr-diff/capability.yaml +1 -1
- package/runtime/agents/knowledge-generator/agent.yaml +13 -3
- package/runtime/agents/knowledge-generator/capabilities/generate-knowledge/capability.yaml +1 -1
- package/runtime/agents/local-llm-operator/agent.yaml +6 -4
- package/runtime/agents/local-llm-operator/capabilities/delegate-operational-task/capability.yaml +1 -2
- package/runtime/agents/local-llm-operator/capabilities/inspect-local-models/capability.yaml +1 -2
- package/runtime/agents/local-llm-operator/capabilities/select-local-worker/capability.yaml +1 -2
- package/runtime/agents/n1-support-agent/agent.yaml +40 -1
- package/runtime/agents/n2-support-agent/agent.yaml +41 -2
- package/runtime/agents/n2-support-agent/knowledge/policies.yaml +2 -2
- package/runtime/agents/notification-operator/AGENTS.md +11 -0
- package/runtime/agents/notification-operator/README.md +15 -0
- package/runtime/agents/notification-operator/agent.yaml +43 -0
- package/runtime/agents/notification-operator/capabilities/configure-notification-channel/capability.yaml +19 -0
- package/runtime/agents/notification-operator/capabilities/configure-notification-channel/decision-rules.md +6 -0
- package/runtime/agents/notification-operator/capabilities/configure-notification-channel/runner.py +33 -0
- package/runtime/agents/notification-operator/capabilities/configure-notification-channel/workflow.md +6 -0
- package/runtime/agents/notification-operator/capabilities/format-task-completion-notification/capability.yaml +25 -0
- package/runtime/agents/notification-operator/capabilities/format-task-completion-notification/decision-rules.md +7 -0
- package/runtime/agents/notification-operator/capabilities/format-task-completion-notification/runner.py +49 -0
- package/runtime/agents/notification-operator/capabilities/format-task-completion-notification/workflow.md +6 -0
- package/runtime/agents/notification-operator/capabilities/send-task-completion-notification/capability.yaml +27 -0
- package/runtime/agents/notification-operator/capabilities/send-task-completion-notification/decision-rules.md +6 -0
- package/runtime/agents/notification-operator/capabilities/send-task-completion-notification/runner.py +68 -0
- package/runtime/agents/notification-operator/capabilities/send-task-completion-notification/workflow.md +7 -0
- package/runtime/agents/notification-operator/infra/README.md +6 -0
- package/runtime/agents/notification-operator/knowledge/context.md +10 -0
- package/runtime/agents/notification-operator/knowledge/policies.yaml +9 -0
- package/runtime/agents/notification-operator/knowledge/system.md +7 -0
- package/runtime/agents/notification-operator/templates/README.md +6 -0
- package/runtime/agents/notification-operator/tests/test_runners.py +108 -0
- package/runtime/agents/playwright-automation-builder/AGENTS.md +23 -0
- package/runtime/agents/playwright-automation-builder/README.md +43 -0
- package/runtime/agents/playwright-automation-builder/agent.yaml +48 -0
- package/runtime/agents/playwright-automation-builder/capabilities/generate-playwright-project-files/capability.yaml +20 -0
- package/runtime/agents/playwright-automation-builder/capabilities/generate-playwright-project-files/decision-rules.md +6 -0
- package/runtime/agents/playwright-automation-builder/capabilities/generate-playwright-project-files/runner.py +38 -0
- package/runtime/agents/playwright-automation-builder/capabilities/generate-playwright-project-files/workflow.md +6 -0
- package/runtime/agents/playwright-automation-builder/capabilities/generate-playwright-script/capability.yaml +18 -0
- package/runtime/agents/playwright-automation-builder/capabilities/generate-playwright-script/decision-rules.md +6 -0
- package/runtime/agents/playwright-automation-builder/capabilities/generate-playwright-script/runner.py +32 -0
- package/runtime/agents/playwright-automation-builder/capabilities/generate-playwright-script/workflow.md +6 -0
- package/runtime/agents/playwright-automation-builder/capabilities/plan-playwright-automation/capability.yaml +18 -0
- package/runtime/agents/playwright-automation-builder/capabilities/plan-playwright-automation/decision-rules.md +6 -0
- package/runtime/agents/playwright-automation-builder/capabilities/plan-playwright-automation/runner.py +32 -0
- package/runtime/agents/playwright-automation-builder/capabilities/plan-playwright-automation/workflow.md +6 -0
- package/runtime/agents/playwright-automation-builder/capabilities/review-playwright-artifacts/capability.yaml +19 -0
- package/runtime/agents/playwright-automation-builder/capabilities/review-playwright-artifacts/decision-rules.md +6 -0
- package/runtime/agents/playwright-automation-builder/capabilities/review-playwright-artifacts/runner.py +33 -0
- package/runtime/agents/playwright-automation-builder/capabilities/review-playwright-artifacts/workflow.md +6 -0
- package/runtime/agents/playwright-automation-builder/capabilities/run-playwright-check/capability.yaml +22 -0
- package/runtime/agents/playwright-automation-builder/capabilities/run-playwright-check/decision-rules.md +6 -0
- package/runtime/agents/playwright-automation-builder/capabilities/run-playwright-check/runner.py +40 -0
- package/runtime/agents/playwright-automation-builder/capabilities/run-playwright-check/workflow.md +6 -0
- package/runtime/agents/playwright-automation-builder/capabilities/wrap-playwright-as-capability/capability.yaml +22 -0
- package/runtime/agents/playwright-automation-builder/capabilities/wrap-playwright-as-capability/decision-rules.md +6 -0
- package/runtime/agents/playwright-automation-builder/capabilities/wrap-playwright-as-capability/runner.py +42 -0
- package/runtime/agents/playwright-automation-builder/capabilities/wrap-playwright-as-capability/workflow.md +6 -0
- package/runtime/agents/playwright-automation-builder/infra/integrations/playwright-automation/playwright_automation_repository.py +865 -0
- package/runtime/agents/playwright-automation-builder/knowledge/context.md +19 -0
- package/runtime/agents/playwright-automation-builder/knowledge/policies.yaml +25 -0
- package/runtime/agents/playwright-automation-builder/knowledge/system.md +19 -0
- package/runtime/agents/playwright-automation-builder/templates/capability-wrapper.md +4 -0
- package/runtime/agents/playwright-automation-builder/templates/playwright-automation.py +12 -0
- package/runtime/agents/playwright-automation-builder/templates/playwright-readme.md +13 -0
- package/runtime/agents/playwright-automation-builder/templates/playwright-review-report.md +9 -0
- package/runtime/agents/playwright-automation-builder/templates/playwright-test.py +2 -0
- package/runtime/agents/playwright-automation-builder/tests/test_runners.py +261 -0
- package/runtime/agents/postgres-data-analyzer/agent.yaml +13 -2
- package/runtime/agents/presentation-deck-builder/agent.yaml +14 -3
- package/runtime/agents/presentation-deck-builder/capabilities/create-template/capability.yaml +1 -1
- package/runtime/agents/presentation-deck-builder/capabilities/create-template-version/capability.yaml +1 -1
- package/runtime/agents/presentation-deck-builder/capabilities/generate-template-input-file/capability.yaml +1 -1
- package/runtime/agents/presentation-deck-builder/capabilities/refine-template/capability.yaml +1 -1
- package/runtime/agents/presentation-deck-builder/capabilities/register-template/capability.yaml +1 -1
- package/runtime/agents/presentation-deck-builder/knowledge/prompts/create-template.md +1 -1
- package/runtime/agents/presentation-deck-builder/knowledge/prompts/generate-template-input-file.md +1 -1
- package/runtime/agents/provider-configurator/agent.yaml +6 -4
- package/runtime/agents/provider-configurator/capabilities/collect-provider-credentials/capability.yaml +1 -2
- package/runtime/agents/provider-configurator/capabilities/configure-provider-source/capability.yaml +1 -2
- package/runtime/agents/provider-configurator/capabilities/validate-provider-readiness/capability.yaml +1 -2
- package/runtime/agents/pyautogui-automation-builder/AGENTS.md +32 -0
- package/runtime/agents/pyautogui-automation-builder/README.md +44 -0
- package/runtime/agents/pyautogui-automation-builder/agent.yaml +45 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/generate-pyautogui-project-files/capability.yaml +20 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/generate-pyautogui-project-files/decision-rules.md +6 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/generate-pyautogui-project-files/runner.py +39 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/generate-pyautogui-project-files/workflow.md +7 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/generate-pyautogui-script/capability.yaml +18 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/generate-pyautogui-script/decision-rules.md +7 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/generate-pyautogui-script/runner.py +33 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/generate-pyautogui-script/workflow.md +7 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/plan-desktop-automation/capability.yaml +18 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/plan-desktop-automation/decision-rules.md +8 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/plan-desktop-automation/runner.py +33 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/plan-desktop-automation/workflow.md +9 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/review-pyautogui-script/capability.yaml +20 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/review-pyautogui-script/decision-rules.md +8 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/review-pyautogui-script/runner.py +43 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/review-pyautogui-script/workflow.md +7 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/wrap-pyautogui-as-capability/capability.yaml +22 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/wrap-pyautogui-as-capability/decision-rules.md +6 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/wrap-pyautogui-as-capability/runner.py +43 -0
- package/runtime/agents/pyautogui-automation-builder/capabilities/wrap-pyautogui-as-capability/workflow.md +7 -0
- package/runtime/agents/pyautogui-automation-builder/infra/integrations/pyautogui-automation/pyautogui_automation_repository.py +856 -0
- package/runtime/agents/pyautogui-automation-builder/knowledge/context.md +17 -0
- package/runtime/agents/pyautogui-automation-builder/knowledge/policies.yaml +24 -0
- package/runtime/agents/pyautogui-automation-builder/knowledge/system.md +13 -0
- package/runtime/agents/pyautogui-automation-builder/templates/capability-wrapper.md +3 -0
- package/runtime/agents/pyautogui-automation-builder/templates/pyautogui-automation.py +12 -0
- package/runtime/agents/pyautogui-automation-builder/templates/pyautogui-readme.md +3 -0
- package/runtime/agents/pyautogui-automation-builder/templates/pyautogui-review-report.md +3 -0
- package/runtime/agents/pyautogui-automation-builder/templates/pyautogui-test.py +2 -0
- package/runtime/agents/pyautogui-automation-builder/tests/test_runners.py +376 -0
- package/runtime/agents/python-automation-builder/AGENTS.md +25 -0
- package/runtime/agents/python-automation-builder/README.md +43 -0
- package/runtime/agents/python-automation-builder/agent.yaml +45 -0
- package/runtime/agents/python-automation-builder/capabilities/generate-automation-project-files/capability.yaml +20 -0
- package/runtime/agents/python-automation-builder/capabilities/generate-automation-project-files/decision-rules.md +6 -0
- package/runtime/agents/python-automation-builder/capabilities/generate-automation-project-files/runner.py +39 -0
- package/runtime/agents/python-automation-builder/capabilities/generate-automation-project-files/workflow.md +7 -0
- package/runtime/agents/python-automation-builder/capabilities/generate-python-automation/capability.yaml +18 -0
- package/runtime/agents/python-automation-builder/capabilities/generate-python-automation/decision-rules.md +5 -0
- package/runtime/agents/python-automation-builder/capabilities/generate-python-automation/runner.py +33 -0
- package/runtime/agents/python-automation-builder/capabilities/generate-python-automation/workflow.md +5 -0
- package/runtime/agents/python-automation-builder/capabilities/plan-python-automation/capability.yaml +18 -0
- package/runtime/agents/python-automation-builder/capabilities/plan-python-automation/decision-rules.md +6 -0
- package/runtime/agents/python-automation-builder/capabilities/plan-python-automation/runner.py +33 -0
- package/runtime/agents/python-automation-builder/capabilities/plan-python-automation/workflow.md +6 -0
- package/runtime/agents/python-automation-builder/capabilities/review-python-automation/capability.yaml +20 -0
- package/runtime/agents/python-automation-builder/capabilities/review-python-automation/decision-rules.md +6 -0
- package/runtime/agents/python-automation-builder/capabilities/review-python-automation/runner.py +43 -0
- package/runtime/agents/python-automation-builder/capabilities/review-python-automation/workflow.md +5 -0
- package/runtime/agents/python-automation-builder/capabilities/wrap-automation-as-capability/capability.yaml +22 -0
- package/runtime/agents/python-automation-builder/capabilities/wrap-automation-as-capability/decision-rules.md +6 -0
- package/runtime/agents/python-automation-builder/capabilities/wrap-automation-as-capability/runner.py +43 -0
- package/runtime/agents/python-automation-builder/capabilities/wrap-automation-as-capability/workflow.md +6 -0
- package/runtime/agents/python-automation-builder/infra/integrations/python-automation/python_automation_repository.py +717 -0
- package/runtime/agents/python-automation-builder/knowledge/context.md +15 -0
- package/runtime/agents/python-automation-builder/knowledge/policies.yaml +12 -0
- package/runtime/agents/python-automation-builder/knowledge/system.md +19 -0
- package/runtime/agents/python-automation-builder/templates/automation-readme.md +13 -0
- package/runtime/agents/python-automation-builder/templates/automation-review-report.md +13 -0
- package/runtime/agents/python-automation-builder/templates/automation-test.py +9 -0
- package/runtime/agents/python-automation-builder/templates/automation.py +19 -0
- package/runtime/agents/python-automation-builder/templates/capability-wrapper.md +4 -0
- package/runtime/agents/python-automation-builder/tests/test_runners.py +292 -0
- package/runtime/agents/selenium-automation-builder/AGENTS.md +27 -0
- package/runtime/agents/selenium-automation-builder/README.md +40 -0
- package/runtime/agents/selenium-automation-builder/agent.yaml +45 -0
- package/runtime/agents/selenium-automation-builder/capabilities/generate-selenium-project-files/capability.yaml +20 -0
- package/runtime/agents/selenium-automation-builder/capabilities/generate-selenium-project-files/decision-rules.md +6 -0
- package/runtime/agents/selenium-automation-builder/capabilities/generate-selenium-project-files/runner.py +39 -0
- package/runtime/agents/selenium-automation-builder/capabilities/generate-selenium-project-files/workflow.md +7 -0
- package/runtime/agents/selenium-automation-builder/capabilities/generate-selenium-script/capability.yaml +18 -0
- package/runtime/agents/selenium-automation-builder/capabilities/generate-selenium-script/decision-rules.md +6 -0
- package/runtime/agents/selenium-automation-builder/capabilities/generate-selenium-script/runner.py +33 -0
- package/runtime/agents/selenium-automation-builder/capabilities/generate-selenium-script/workflow.md +6 -0
- package/runtime/agents/selenium-automation-builder/capabilities/plan-selenium-automation/capability.yaml +18 -0
- package/runtime/agents/selenium-automation-builder/capabilities/plan-selenium-automation/decision-rules.md +6 -0
- package/runtime/agents/selenium-automation-builder/capabilities/plan-selenium-automation/runner.py +33 -0
- package/runtime/agents/selenium-automation-builder/capabilities/plan-selenium-automation/workflow.md +6 -0
- package/runtime/agents/selenium-automation-builder/capabilities/review-selenium-script/capability.yaml +20 -0
- package/runtime/agents/selenium-automation-builder/capabilities/review-selenium-script/decision-rules.md +6 -0
- package/runtime/agents/selenium-automation-builder/capabilities/review-selenium-script/runner.py +40 -0
- package/runtime/agents/selenium-automation-builder/capabilities/review-selenium-script/workflow.md +6 -0
- package/runtime/agents/selenium-automation-builder/capabilities/wrap-selenium-as-capability/capability.yaml +22 -0
- package/runtime/agents/selenium-automation-builder/capabilities/wrap-selenium-as-capability/decision-rules.md +6 -0
- package/runtime/agents/selenium-automation-builder/capabilities/wrap-selenium-as-capability/runner.py +43 -0
- package/runtime/agents/selenium-automation-builder/capabilities/wrap-selenium-as-capability/workflow.md +6 -0
- package/runtime/agents/selenium-automation-builder/infra/integrations/selenium-automation/selenium_automation_repository.py +793 -0
- package/runtime/agents/selenium-automation-builder/knowledge/context.md +15 -0
- package/runtime/agents/selenium-automation-builder/knowledge/policies.yaml +17 -0
- package/runtime/agents/selenium-automation-builder/knowledge/system.md +18 -0
- package/runtime/agents/selenium-automation-builder/templates/capability-wrapper.md +4 -0
- package/runtime/agents/selenium-automation-builder/templates/selenium-automation.py +20 -0
- package/runtime/agents/selenium-automation-builder/templates/selenium-readme.md +13 -0
- package/runtime/agents/selenium-automation-builder/templates/selenium-review-report.md +13 -0
- package/runtime/agents/selenium-automation-builder/templates/selenium-test.py +9 -0
- package/runtime/agents/selenium-automation-builder/tests/test_runners.py +282 -0
- package/runtime/agents/software-specification-analyst/agent.yaml +17 -4
- package/runtime/agents/software-specification-analyst/capabilities/analyze-multiple-projects/capability.yaml +1 -1
- package/runtime/agents/software-specification-analyst/capabilities/analyze-project-context/capability.yaml +1 -1
- package/runtime/agents/software-specification-analyst/capabilities/conduct-requirements-interview/capability.yaml +1 -1
- package/runtime/agents/software-specification-analyst/capabilities/create-complete-spec/capability.yaml +1 -1
- package/runtime/agents/software-specification-analyst/capabilities/create-final-spec-from-analysis/capability.yaml +1 -1
- package/runtime/agents/software-specification-analyst/capabilities/create-functional-spec/capability.yaml +11 -0
- package/runtime/agents/software-specification-analyst/capabilities/create-technical-spec/capability.yaml +12 -0
- package/runtime/agents/software-specification-analyst/capabilities/refine-analysis-with-feedback/capability.yaml +1 -1
- package/runtime/agents/software-specification-analyst/capabilities/write-user-stories/capability.yaml +12 -0
- package/runtime/agents/sqlserver-change-operator/agent.yaml +12 -1
- package/runtime/agents/sqlserver-data-analyzer/agent.yaml +13 -2
- package/runtime/agents/supabase-project-analyst/AGENTS.md +29 -0
- package/runtime/agents/supabase-project-analyst/README.md +23 -0
- package/runtime/agents/supabase-project-analyst/agent.yaml +53 -0
- package/runtime/agents/supabase-project-analyst/capabilities/audit-auth-security/capability.yaml +18 -0
- package/runtime/agents/supabase-project-analyst/capabilities/audit-auth-security/decision-rules.md +5 -0
- package/runtime/agents/supabase-project-analyst/capabilities/audit-auth-security/runner.py +32 -0
- package/runtime/agents/supabase-project-analyst/capabilities/audit-auth-security/workflow.md +6 -0
- package/runtime/agents/supabase-project-analyst/capabilities/audit-rls-policies/capability.yaml +18 -0
- package/runtime/agents/supabase-project-analyst/capabilities/audit-rls-policies/decision-rules.md +6 -0
- package/runtime/agents/supabase-project-analyst/capabilities/audit-rls-policies/runner.py +32 -0
- package/runtime/agents/supabase-project-analyst/capabilities/audit-rls-policies/workflow.md +7 -0
- package/runtime/agents/supabase-project-analyst/capabilities/audit-storage-policies/capability.yaml +18 -0
- package/runtime/agents/supabase-project-analyst/capabilities/audit-storage-policies/decision-rules.md +5 -0
- package/runtime/agents/supabase-project-analyst/capabilities/audit-storage-policies/runner.py +32 -0
- package/runtime/agents/supabase-project-analyst/capabilities/audit-storage-policies/workflow.md +6 -0
- package/runtime/agents/supabase-project-analyst/capabilities/generate-supabase-report/capability.yaml +18 -0
- package/runtime/agents/supabase-project-analyst/capabilities/generate-supabase-report/decision-rules.md +6 -0
- package/runtime/agents/supabase-project-analyst/capabilities/generate-supabase-report/runner.py +32 -0
- package/runtime/agents/supabase-project-analyst/capabilities/generate-supabase-report/workflow.md +6 -0
- package/runtime/agents/supabase-project-analyst/capabilities/inspect-supabase-project/capability.yaml +19 -0
- package/runtime/agents/supabase-project-analyst/capabilities/inspect-supabase-project/decision-rules.md +6 -0
- package/runtime/agents/supabase-project-analyst/capabilities/inspect-supabase-project/runner.py +36 -0
- package/runtime/agents/supabase-project-analyst/capabilities/inspect-supabase-project/workflow.md +7 -0
- package/runtime/agents/supabase-project-analyst/capabilities/plan-supabase-fix/capability.yaml +18 -0
- package/runtime/agents/supabase-project-analyst/capabilities/plan-supabase-fix/decision-rules.md +6 -0
- package/runtime/agents/supabase-project-analyst/capabilities/plan-supabase-fix/runner.py +32 -0
- package/runtime/agents/supabase-project-analyst/capabilities/plan-supabase-fix/workflow.md +6 -0
- package/runtime/agents/supabase-project-analyst/capabilities/review-migrations/capability.yaml +18 -0
- package/runtime/agents/supabase-project-analyst/capabilities/review-migrations/decision-rules.md +6 -0
- package/runtime/agents/supabase-project-analyst/capabilities/review-migrations/runner.py +32 -0
- package/runtime/agents/supabase-project-analyst/capabilities/review-migrations/workflow.md +5 -0
- package/runtime/agents/supabase-project-analyst/infra/integrations/supabase-project/supabase_project_repository.py +589 -0
- package/runtime/agents/supabase-project-analyst/knowledge/context.md +11 -0
- package/runtime/agents/supabase-project-analyst/knowledge/policies.yaml +24 -0
- package/runtime/agents/supabase-project-analyst/knowledge/system.md +10 -0
- package/runtime/agents/supabase-project-analyst/templates/supabase-audit.md +3 -0
- package/runtime/agents/supabase-project-analyst/templates/supabase-fix-plan.md +3 -0
- package/runtime/agents/supabase-project-analyst/templates/supabase-inspection.md +3 -0
- package/runtime/agents/supabase-project-analyst/templates/supabase-report.md +3 -0
- package/runtime/agents/supabase-project-analyst/tests/test_runners.py +239 -0
- package/runtime/agents/task-orchestrator/agent.yaml +25 -3
- package/runtime/agents/task-orchestrator/capabilities/plan-task/capability.yaml +1 -2
- package/runtime/agents/task-orchestrator/capabilities/select-specialists/capability.yaml +1 -2
- package/runtime/agents/technical-integration-analyst/agent.yaml +15 -2
- package/runtime/agents/topdesk-orchestrator/agent.yaml +10 -2
- package/runtime/cli/aikit/__init__.py +1 -1
- package/runtime/cli/aikit/acceptance.py +166 -0
- package/runtime/cli/aikit/agent_executor.py +26 -3
- package/runtime/cli/aikit/agent_registry.py +244 -5
- package/runtime/cli/aikit/architecture.py +84 -0
- package/runtime/cli/aikit/audit.py +172 -3
- package/runtime/cli/aikit/autonomy.py +237 -0
- package/runtime/cli/aikit/capability_runtime.py +522 -0
- package/runtime/cli/aikit/catalog.py +246 -0
- package/runtime/cli/aikit/cli_dispatch.py +1078 -0
- package/runtime/cli/aikit/cli_parser.py +409 -0
- package/runtime/cli/aikit/collaboration.py +359 -0
- package/runtime/cli/aikit/configuration_orchestrator.py +52 -26
- package/runtime/cli/aikit/contribution.py +105 -0
- package/runtime/cli/aikit/core/__init__.py +1 -0
- package/runtime/cli/aikit/core/capability_contract.py +112 -0
- package/runtime/cli/aikit/core/requests.py +69 -0
- package/runtime/cli/aikit/core/runtime.py +64 -0
- package/runtime/cli/aikit/diagnostics.py +8 -2
- package/runtime/cli/aikit/doctor_runtime.py +79 -0
- package/runtime/cli/aikit/errors.py +7 -0
- package/runtime/cli/aikit/eval.py +158 -0
- package/runtime/cli/aikit/execution_reviewer.py +21 -0
- package/runtime/cli/aikit/extensions.py +140 -0
- package/runtime/cli/aikit/fallback.py +1 -0
- package/runtime/cli/aikit/github_pr.py +23 -0
- package/runtime/cli/aikit/guardrails.py +25 -10
- package/runtime/cli/aikit/human_output.py +1026 -0
- package/runtime/cli/aikit/impact_map.py +294 -0
- package/runtime/cli/aikit/interactive_wizard.py +79 -0
- package/runtime/cli/aikit/local_llm_operator.py +35 -1
- package/runtime/cli/aikit/main.py +9 -2834
- package/runtime/cli/aikit/mcp_manifest.py +229 -0
- package/runtime/cli/aikit/mcp_server.py +132 -0
- package/runtime/cli/aikit/mcp_tools.py +262 -0
- package/runtime/cli/aikit/mini_brain.py +227 -0
- package/runtime/cli/aikit/model_router.py +182 -18
- package/runtime/cli/aikit/module_controller.py +335 -0
- package/runtime/cli/aikit/natural_prompt_runtime.py +538 -0
- package/runtime/cli/aikit/notifications.py +716 -2
- package/runtime/cli/aikit/ollama.py +1 -0
- package/runtime/cli/aikit/orchestrator.py +809 -119
- package/runtime/cli/aikit/output.py +63 -2
- package/runtime/cli/aikit/permissions.py +14 -4
- package/runtime/cli/aikit/prompt_injection.py +57 -0
- package/runtime/cli/aikit/review_gate.py +38 -6
- package/runtime/cli/aikit/roadmap.py +195 -0
- package/runtime/cli/aikit/roadmap_cli.py +70 -0
- package/runtime/cli/aikit/router.py +41 -12
- package/runtime/cli/aikit/router_explain.py +152 -0
- package/runtime/cli/aikit/runtime_paths.py +11 -0
- package/runtime/cli/aikit/secrets.py +113 -0
- package/runtime/cli/aikit/sessions.py +88 -2
- package/runtime/cli/aikit/setup_wizard_payload.py +32 -0
- package/runtime/cli/aikit/sources.py +298 -50
- package/runtime/cli/aikit/tasks.py +449 -21
- package/runtime/cli/aikit/wizard_state.py +15 -1
- package/runtime/cli/aikit/workflows.py +115 -0
- package/runtime/cli/aikit/write_policy.py +108 -0
- package/runtime/plugins/claude-code-ai-devkit/README.md +17 -0
- package/runtime/plugins/claude-code-ai-devkit/agents/README.md +29 -2
- package/runtime/plugins/claude-code-ai-devkit/agents/agent-devkit-db-analyst.md +44 -0
- package/runtime/plugins/claude-code-ai-devkit/agents/agent-devkit-execution-reviewer.md +38 -0
- package/runtime/plugins/claude-code-ai-devkit/agents/agent-devkit-pr-reviewer.md +42 -0
- package/runtime/plugins/claude-code-ai-devkit/agents/agent-devkit-repo-explorer.md +40 -0
- package/runtime/plugins/claude-code-ai-devkit/agents/agent-devkit-support-triage.md +43 -0
- package/runtime/plugins/claude-code-ai-devkit/plugin.json +1 -1
- package/runtime/plugins/claude-code-ai-devkit/skills/ai-devkit-router/SKILL.md +16 -0
- package/runtime/plugins/claude-skill-ai-devkit/ai-devkit/SKILL.md +1 -0
- package/runtime/plugins/claude-skill-ai-devkit/ai-devkit/references/subagents.md +21 -0
- package/runtime/plugins/claude-skill-ai-devkit/plugin.json +1 -1
- package/runtime/providers/azure-devops.yaml +9 -0
- package/runtime/providers/github.yaml +4 -0
- package/runtime/providers/local-notification.yaml +5 -2
- package/runtime/providers/local-scheduler.yaml +1 -1
- package/runtime/providers/supabase.yaml +46 -0
- package/runtime/scripts/release-catalog-snapshot.json +543 -0
- package/runtime/scripts/release-gate.py +141 -1
- package/runtime/scripts/validate-repo.py +312 -0
- package/runtime/vendor/skills/napkin/napkin.md +15 -9
|
@@ -0,0 +1,112 @@
|
|
|
1
|
+
"""Canonical capability contract helpers."""
|
|
2
|
+
|
|
3
|
+
from __future__ import annotations
|
|
4
|
+
|
|
5
|
+
from pathlib import Path
|
|
6
|
+
from typing import Any
|
|
7
|
+
|
|
8
|
+
from cli.aikit.core.requests import CapabilityRunRequest
|
|
9
|
+
from cli.aikit.runtime_paths import ROOT
|
|
10
|
+
from cli.aikit.write_policy import write_policy_metadata
|
|
11
|
+
|
|
12
|
+
|
|
13
|
+
def capability_policy(manifest: dict[str, Any]) -> dict[str, Any]:
    """Return the write-policy metadata for a capability manifest.

    The manifest's ``write_policy`` entry (``None`` when the key is absent)
    is handed to ``write_policy_metadata`` and that result is returned as is.
    """
    declared_policy = manifest.get("write_policy")
    return write_policy_metadata(declared_policy)
|
|
15
|
+
|
|
16
|
+
|
|
17
|
+
def normalize_capability_artifacts(value: Any) -> list[dict[str, Any]]:
    """Convert a manifest ``artifacts`` value into uniform artifact records.

    Anything that is not a list yields an empty result. Inside the list,
    plain strings are treated as paths and mappings are read field by field;
    entries of any other type are skipped.

    Each record carries the keys ``path``, ``kind``, ``description``,
    ``sensitive`` and ``created``.
    """
    if not isinstance(value, list):
        return []

    records: list[dict[str, Any]] = []
    for entry in value:
        if isinstance(entry, str):
            # Bare string: the string is the path, everything else is defaulted.
            record = {
                "path": entry,
                "kind": artifact_kind(entry),
                "description": "",
                "sensitive": False,
                "created": None,
            }
        elif isinstance(entry, dict):
            # "ref" is accepted as a fallback spelling for "path".
            location = str(entry.get("path") or entry.get("ref") or "").strip()
            record = {
                "path": location,
                # An explicit kind wins; otherwise it is derived from the path.
                "kind": str(entry.get("kind") or artifact_kind(location)),
                "description": str(entry.get("description") or ""),
                "sensitive": bool(entry.get("sensitive", False)),
                "created": entry.get("created"),
            }
        else:
            continue
        records.append(record)
    return records
|
|
44
|
+
|
|
45
|
+
|
|
46
|
+
# Lower-cased file extension (without the leading dot) -> artifact kind.
# Extensions that are not listed here are classified as "other".
_ARTIFACT_KIND_BY_SUFFIX = {
    "md": "markdown",
    "markdown": "markdown",
    "json": "json",
    "xlsx": "xlsx",
    "xlsm": "xlsx",
    "pptx": "pptx",
    "drawio": "drawio",
    "log": "log",
}


def artifact_kind(path: str) -> str:
    """Classify an artifact by the extension of its path.

    Args:
        path: File path or file name of the artifact.

    Returns:
        One of ``"markdown"``, ``"json"``, ``"xlsx"``, ``"pptx"``,
        ``"drawio"``, ``"log"`` or ``"other"``. The extension is compared
        case-insensitively; a missing or unrecognised extension (including
        ``.txt``) maps to ``"other"``.
    """
    suffix = Path(path).suffix.lower().lstrip(".")
    return _ARTIFACT_KIND_BY_SUFFIX.get(suffix, "other")
|
|
61
|
+
|
|
62
|
+
|
|
63
|
+
def _manifest_section(manifest: dict[str, Any], key: str) -> dict[str, Any]:
    """Return ``manifest[key]`` when it is a mapping, otherwise an empty dict."""
    section = manifest.get(key)
    return section if isinstance(section, dict) else {}


def _execution_modes(raw: Any) -> list[Any]:
    """Return the declared execution modes as a list.

    A scalar string is wrapped rather than passed to ``list()``, which would
    split it into single characters.
    """
    if not raw:
        return []
    if isinstance(raw, str):
        return [raw]
    return list(raw)


def _capability_location(capability_path: Path | None) -> str | None:
    """Return the capability path relative to ROOT, or absolute if outside it."""
    if not capability_path:
        return None
    resolved = capability_path.resolve()
    try:
        return str(resolved.relative_to(ROOT))
    except ValueError:
        # relative_to() raises when the path does not live under ROOT; report
        # the absolute location instead of failing the whole normalization.
        return str(resolved)


def normalize_capability_definition(
    manifest: dict[str, Any],
    *,
    agent_id: str,
    capability_path: Path | None = None,
) -> dict[str, Any]:
    """Build the canonical description of a capability from its manifest.

    Args:
        manifest: Parsed capability manifest. Sections that are missing or
            are not mappings are replaced by empty dicts.
        agent_id: Identifier of the agent that owns the capability.
        capability_path: Location of the capability, if known. It is reported
            relative to ROOT when it lives under ROOT and as an absolute path
            otherwise.

    Returns:
        A dict with the keys ``id``, ``short_id`` (the text after the last
        ``.`` of the id), ``agent_id``, ``path``, ``entrypoint``, ``inputs``,
        ``outputs`` (with ``artifacts`` normalized), ``requires``,
        ``runtime``, ``execution`` and ``policy``.
    """
    execution = _manifest_section(manifest, "execution")
    outputs = _manifest_section(manifest, "outputs")
    capability_id = str(manifest.get("id") or "")
    short_id = capability_id.rsplit(".", 1)[-1] if capability_id else ""
    return {
        "id": capability_id,
        "short_id": short_id,
        "agent_id": agent_id,
        "path": _capability_location(capability_path),
        "entrypoint": _manifest_section(manifest, "entrypoint"),
        "inputs": _manifest_section(manifest, "inputs"),
        "outputs": {
            **outputs,
            # Overrides any raw "artifacts" value copied in by the spread above.
            "artifacts": normalize_capability_artifacts(outputs.get("artifacts")),
        },
        "requires": _manifest_section(manifest, "requires"),
        "runtime": _manifest_section(manifest, "runtime"),
        "execution": {
            "modes": _execution_modes(execution.get("modes")),
            "idempotency": execution.get("idempotency"),
            "timeout_seconds": execution.get("timeout_seconds"),
        },
        "policy": capability_policy(manifest),
    }
|
|
94
|
+
|
|
95
|
+
|
|
96
|
+
def capability_request_metadata(request: CapabilityRunRequest) -> dict[str, Any]:
    """Summarise a capability run request as a plain dict.

    The result holds ``origin``, ``request_id``, ``inputs``, ``source_id``
    and ``dry_run``. ``inputs`` is a shallow copy, so changing the returned
    mapping does not touch the request (``None`` becomes an empty dict).
    """
    metadata: dict[str, Any] = {}
    metadata["origin"] = request.origin
    metadata["request_id"] = request.request_id
    metadata["inputs"] = dict(request.inputs or {})
    metadata["source_id"] = request.source_id
    metadata["dry_run"] = request.dry_run
    return metadata
|
|
104
|
+
|
|
105
|
+
|
|
106
|
+
def structured_inputs_to_argv(request: CapabilityRunRequest) -> list[str]:
    """Translate a request's structured fields into runner arguments.

    Starts from a copy of ``request.capability_args`` and then:

    * appends ``--source <source_id>`` when a source id is set and the
      arguments contain neither ``--source`` nor a ``--source=...`` token;
    * appends ``--dry-run`` when the request is a dry run and the flag is
      not already present.
    """
    argv = [*request.capability_args]

    if request.source_id:
        source_given = "--source" in argv or any(
            token.startswith("--source=") for token in argv
        )
        if not source_given:
            argv += ["--source", request.source_id]

    if request.dry_run and "--dry-run" not in argv:
        argv.append("--dry-run")

    return argv
|
|
@@ -0,0 +1,69 @@
|
|
|
1
|
+
"""Structured requests for reusable Agent DevKit core calls."""
|
|
2
|
+
|
|
3
|
+
from __future__ import annotations
|
|
4
|
+
|
|
5
|
+
from dataclasses import dataclass
|
|
6
|
+
from typing import Any, Iterable
|
|
7
|
+
|
|
8
|
+
|
|
9
|
+
# Accepted values for CapabilityRunRequest.origin; its __post_init__ raises
# ValueError for any origin that is not in this set.
CAPABILITY_RUN_ORIGINS = {"cli", "mcp", "scheduler", "agent-prompt", "core"}
|
|
10
|
+
|
|
11
|
+
|
|
12
|
+
@dataclass(frozen=True)
class AgentPromptRequest:
    """Immutable request describing one prompt-driven agent run.

    Only ``prompt`` and ``prog_name`` are validated on construction; the
    remaining fields are stored exactly as given.

    Raises:
        ValueError: If ``prompt`` is not a string, or ``prog_name`` is not a
            string containing at least one non-whitespace character.
    """

    prompt: str
    llm: str | None = None
    dry_run: bool = False
    session_id: str | None = None
    new_session: bool = False
    no_llm_fallback: bool = False
    prog_name: str = "agent"
    project: str | None = None

    def __post_init__(self) -> None:
        """Reject a non-string prompt and a blank or non-string prog_name."""
        prompt_is_text = isinstance(self.prompt, str)
        if not prompt_is_text:
            raise ValueError("AgentPromptRequest.prompt must be a string")

        name = self.prog_name
        if isinstance(name, str) and name.strip():
            return
        raise ValueError("AgentPromptRequest.prog_name must be a non-empty string")
|
|
28
|
+
|
|
29
|
+
|
|
30
|
+
@dataclass(frozen=True)
class CapabilityRunRequest:
    """Immutable, validated request to run one capability of one agent.

    Construction normalizes ``capability_args`` to a tuple of strings
    (``None`` becomes an empty tuple) and ``inputs`` to a dict (``None``
    becomes an empty dict). A provided ``inputs`` mapping is stored by
    reference, not copied.

    Raises:
        ValueError: For every invalid field: blank or non-string
            ``agent_id``/``capability_id``; ``capability_args`` that is a
            single string, is not iterable, or contains non-strings;
            non-boolean ``capture_output``/``dry_run``; an ``origin`` outside
            ``CAPABILITY_RUN_ORIGINS``; non-string ``request_id`` or
            ``source_id``; non-dict ``inputs``.
    """

    agent_id: str
    capability_id: str
    capability_args: Iterable[str] = ()
    capture_output: bool = True
    origin: str = "core"
    request_id: str | None = None
    inputs: dict[str, Any] | None = None
    source_id: str | None = None
    dry_run: bool = False

    def __post_init__(self) -> None:
        """Validate every field and normalize ``capability_args``/``inputs``."""
        if not isinstance(self.agent_id, str) or not self.agent_id.strip():
            raise ValueError("CapabilityRunRequest.agent_id must be a non-empty string")
        if not isinstance(self.capability_id, str) or not self.capability_id.strip():
            raise ValueError("CapabilityRunRequest.capability_id must be a non-empty string")

        raw_args = self.capability_args
        if raw_args is None:
            raw_args = ()
        elif isinstance(raw_args, str):
            # A lone string is iterable, but would be split into characters.
            raise ValueError("CapabilityRunRequest.capability_args must be an iterable of strings, not a string")
        try:
            args = tuple(raw_args)
        except TypeError:
            # Non-iterable values (e.g. an int) are reported with the same
            # exception type as every other validation failure.
            raise ValueError("CapabilityRunRequest.capability_args must be an iterable of strings") from None
        if not all(isinstance(item, str) for item in args):
            raise ValueError("CapabilityRunRequest.capability_args must contain only strings")
        # The dataclass is frozen, so normalized values are written via object.__setattr__.
        object.__setattr__(self, "capability_args", args)

        if not isinstance(self.capture_output, bool):
            raise ValueError("CapabilityRunRequest.capture_output must be a boolean")
        # The isinstance guard keeps unhashable origins (list, dict) from
        # escaping as TypeError out of the set membership test.
        if not isinstance(self.origin, str) or self.origin not in CAPABILITY_RUN_ORIGINS:
            allowed = ", ".join(sorted(CAPABILITY_RUN_ORIGINS))
            raise ValueError(f"CapabilityRunRequest.origin must be one of: {allowed}")
        if self.request_id is not None and not isinstance(self.request_id, str):
            raise ValueError("CapabilityRunRequest.request_id must be a string when provided")
        if self.source_id is not None and not isinstance(self.source_id, str):
            raise ValueError("CapabilityRunRequest.source_id must be a string when provided")
        if self.inputs is None:
            object.__setattr__(self, "inputs", {})
        elif not isinstance(self.inputs, dict):
            raise ValueError("CapabilityRunRequest.inputs must be a mapping when provided")
        if not isinstance(self.dry_run, bool):
            raise ValueError("CapabilityRunRequest.dry_run must be a boolean")
|
|
@@ -0,0 +1,64 @@
|
|
|
1
|
+
"""Core runtime facade independent from CLI argument parsing."""
|
|
2
|
+
|
|
3
|
+
from __future__ import annotations
|
|
4
|
+
|
|
5
|
+
from typing import Any
|
|
6
|
+
|
|
7
|
+
from cli.aikit.capability_runtime import (
|
|
8
|
+
list_agents,
|
|
9
|
+
list_all_capabilities,
|
|
10
|
+
list_capabilities,
|
|
11
|
+
load_agent,
|
|
12
|
+
load_capability,
|
|
13
|
+
run_capability,
|
|
14
|
+
summarize_agent,
|
|
15
|
+
)
|
|
16
|
+
from cli.aikit.core.capability_contract import structured_inputs_to_argv
|
|
17
|
+
from cli.aikit.core.requests import AgentPromptRequest, CapabilityRunRequest
|
|
18
|
+
from cli.aikit.natural_prompt_runtime import run_agent_prompt_request
|
|
19
|
+
|
|
20
|
+
|
|
21
|
+
def run_agent_prompt(request: AgentPromptRequest) -> dict[str, Any]:
    """Run a prompt request through the natural-prompt runtime.

    Thin facade: the request is forwarded to ``run_agent_prompt_request``
    and its result is returned unchanged.
    """
    outcome = run_agent_prompt_request(request)
    return outcome
|
|
23
|
+
|
|
24
|
+
|
|
25
|
+
def list_agent_modules() -> dict[str, Any]:
    """Return the ``list_agents()`` result wrapped as ``{"kind": "agents", "items": ...}``."""
    payload: dict[str, Any] = {"kind": "agents"}
    payload["items"] = list_agents()
    return payload
|
|
27
|
+
|
|
28
|
+
|
|
29
|
+
def list_capability_modules(agent_id: str | None = None) -> dict[str, Any]:
    """List capabilities for one agent, or for all agents.

    Args:
        agent_id: Agent to restrict the listing to. When empty or ``None``
            the listing comes from ``list_all_capabilities()``.

    Returns:
        A dict with ``kind`` set to ``"capabilities"``, ``agent`` set to the
        loaded agent's id (``None`` for the unrestricted listing) and
        ``items`` holding the listing.
    """
    if not agent_id:
        owner = None
        items = list_all_capabilities()
    else:
        agent = load_agent(agent_id)
        owner = agent["id"]
        items = list_capabilities(agent["path"])
    return {"kind": "capabilities", "agent": owner, "items": items}
|
|
42
|
+
|
|
43
|
+
|
|
44
|
+
def inspect_capability_request(agent_id: str, capability_id: str) -> dict[str, Any]:
    """Describe one capability together with a summary of its agent.

    Loads the agent, loads the capability from the agent's path, and returns
    ``{"kind": "capability", "agent": <agent summary>, "capability": <capability>}``.
    """
    agent = load_agent(agent_id)
    details = load_capability(agent["path"], capability_id)
    summary = summarize_agent(agent)
    return dict(kind="capability", agent=summary, capability=details)
|
|
52
|
+
|
|
53
|
+
|
|
54
|
+
def run_capability_request(request: CapabilityRunRequest) -> dict[str, Any]:
    """Execute the capability described by a structured request.

    The agent is loaded from ``request.agent_id``, the request's structured
    fields are converted to runner arguments, and everything is handed to
    ``run_capability``. ``request_data`` receives a shallow copy of
    ``request.inputs``.
    """
    agent = load_agent(request.agent_id)
    target = request.capability_id
    argv = structured_inputs_to_argv(request)
    call_options: dict[str, Any] = {
        "capture_output": request.capture_output,
        "origin": request.origin,
        "request_id": request.request_id,
        "request_data": dict(request.inputs or {}),
    }
    return run_capability(agent, target, argv, **call_options)
|
|
@@ -205,14 +205,17 @@ def claude_source(root: Path) -> dict[str, Any]:
|
|
|
205
205
|
skill = plugin / "skills" / "ai-devkit-router" / "SKILL.md"
|
|
206
206
|
commands = plugin / "commands"
|
|
207
207
|
scripts = plugin / "scripts"
|
|
208
|
+
agents = plugin / "agents"
|
|
208
209
|
return {
|
|
209
210
|
"id": "claude-code",
|
|
210
211
|
"path": str(plugin),
|
|
211
212
|
"manifest_exists": manifest.exists(),
|
|
212
213
|
"skill_exists": skill.exists(),
|
|
213
214
|
"commands_exists": commands.is_dir(),
|
|
215
|
+
"agents_exists": agents.is_dir(),
|
|
216
|
+
"subagents": sorted(path.stem for path in agents.glob("*.md") if path.name != "README.md") if agents.is_dir() else [],
|
|
214
217
|
"scripts_exists": scripts.is_dir(),
|
|
215
|
-
"status": "ok" if manifest.exists() and skill.exists() and commands.is_dir() and scripts.is_dir() else "error",
|
|
218
|
+
"status": "ok" if manifest.exists() and skill.exists() and commands.is_dir() and agents.is_dir() and scripts.is_dir() else "error",
|
|
216
219
|
}
|
|
217
220
|
|
|
218
221
|
|
|
@@ -247,11 +250,14 @@ def installed_plugins(base: Path, lock: dict[str, Any]) -> dict[str, Any]:
|
|
|
247
250
|
claude_plugin = base / ".claude" / "plugins" / "ai-devkit" / "plugin.json"
|
|
248
251
|
claude_skill = base / ".claude" / "skills" / "ai-devkit-router" / "SKILL.md"
|
|
249
252
|
claude_commands = base / ".claude" / "commands"
|
|
253
|
+
claude_agents = base / ".claude" / "plugins" / "ai-devkit" / "agents"
|
|
250
254
|
status["claude-code"] = {
|
|
251
255
|
"plugin_exists": claude_plugin.exists(),
|
|
252
256
|
"skill_exists": claude_skill.exists(),
|
|
253
257
|
"commands_exists": claude_commands.is_dir(),
|
|
254
|
-
"
|
|
258
|
+
"agents_exists": claude_agents.is_dir(),
|
|
259
|
+
"subagents": sorted(path.stem for path in claude_agents.glob("*.md") if path.name != "README.md") if claude_agents.is_dir() else [],
|
|
260
|
+
"status": "ok" if claude_plugin.exists() and claude_skill.exists() and claude_commands.is_dir() and claude_agents.is_dir() else "missing",
|
|
255
261
|
}
|
|
256
262
|
if "claude-desktop" in hosts:
|
|
257
263
|
claude_desktop_plugin = base / ".claude" / "plugins" / "ai-devkit-skill" / "plugin.json"
|
|
@@ -0,0 +1,79 @@
|
|
|
1
|
+
"""Doctor and diagnostics payload builder for the CLI."""
|
|
2
|
+
|
|
3
|
+
from __future__ import annotations
|
|
4
|
+
|
|
5
|
+
import shutil
|
|
6
|
+
from pathlib import Path
|
|
7
|
+
from typing import Any
|
|
8
|
+
|
|
9
|
+
from cli.aikit.capability_runtime import list_agents, list_all_capabilities
|
|
10
|
+
from cli.aikit.diagnostics import build_diagnostics
|
|
11
|
+
from cli.aikit.lock import lock_status
|
|
12
|
+
from cli.aikit.runtime_paths import AGENTS_DIR, ROOT
|
|
13
|
+
|
|
14
|
+
|
|
15
|
+
def doctor(project: str | None = None, home: str | None = None, scope: str = "auto") -> dict[str, Any]:
    """Build the ``doctor`` payload describing the state of the runtime.

    Args:
        project: Optional project directory. When empty, the project path is
            resolved from ``scope`` by ``doctor_project_path``.
        home: Optional home directory, forwarded as a ``Path`` to the lock and
            diagnostics helpers (``None`` when empty).
        scope: Requested scope; echoed back unchanged in the payload.

    Returns:
        A dict with ``kind``, ``status`` (``"ok"`` when no errors were
        collected, otherwise ``"error"``), ``scope``, ``root``, a ``summary``
        of counts, the boolean ``checks``, ``errors``, ``warnings``, ``locks``
        and ``diagnostics``.
    """
    agents = list_agents()
    capabilities = list_all_capabilities()
    validator = ROOT / "scripts" / "validate-repo.py"

    def count_flagged(flag: str) -> int:
        # Number of capabilities whose metadata has a truthy ``flag`` entry.
        return sum(1 for item in capabilities if item.get(flag))

    # Probe the filesystem exactly once so that ``checks`` and ``errors`` are
    # derived from the same observations and can never contradict each other.
    checks = {
        "root_exists": ROOT.exists(),
        "agents_dir_exists": AGENTS_DIR.is_dir(),
        "validator_exists": validator.exists(),
        "agent_command_exists": (ROOT / "agent").exists(),
        "aikit_command_exists": (ROOT / "aikit").exists(),
        "ai_devkit_command_exists": (ROOT / "ai-devkit").exists(),
        "agent_on_path": shutil.which("agent") is not None,
    }

    errors: list[str] = []
    warnings: list[str] = []
    if not checks["root_exists"]:
        errors.append(f"root not found: {ROOT}")
    if not checks["agents_dir_exists"]:
        errors.append(f"agents directory not found: {AGENTS_DIR}")
    if not checks["validator_exists"]:
        # A missing validator is reported but does not fail the doctor run.
        warnings.append("scripts/validate-repo.py not found")

    project_path = doctor_project_path(project, scope)
    home_path = Path(home) if home else None
    locks = lock_status(project_path, home_path)
    # Gate on the resolved path rather than the raw argument, so a project
    # implied by ``scope == "project"`` gets the same divergence warning as an
    # explicitly passed one.
    if project_path is not None and locks["status"] == "diverged":
        warnings.append("lock divergence between global runtime.lock and project ai-devkit.lock")

    status = "ok" if not errors else "error"
    diagnostics = build_diagnostics(
        ROOT,
        project=project_path,
        home=home_path,
        runtime_checks=checks,
        runtime_status=status,
        locks=locks,
    )

    return {
        "kind": "doctor",
        "status": status,
        "scope": scope,
        "root": str(ROOT),
        "summary": {
            "agents": len(agents),
            "capabilities": len(capabilities),
            "declared_runners": count_flagged("has_runner"),
            "workflows": count_flagged("has_workflow"),
            "decision_rules": count_flagged("has_decision_rules"),
        },
        "checks": checks,
        "errors": errors,
        "warnings": warnings,
        "locks": locks,
        "diagnostics": diagnostics,
    }
|
|
72
|
+
|
|
73
|
+
|
|
74
|
+
def doctor_project_path(project: str | None, scope: str) -> Path | None:
    """Resolve the project directory the doctor run should inspect.

    An explicit, non-empty ``project`` always wins. Without one, the current
    working directory is used only when ``scope`` is ``"project"``; any other
    scope yields ``None``.
    """
    if not project:
        return Path.cwd() if scope == "project" else None
    return Path(project)
|
|
@@ -0,0 +1,158 @@
|
|
|
1
|
+
"""Deterministic eval suites for Agent DevKit runtime contracts."""
|
|
2
|
+
|
|
3
|
+
from __future__ import annotations
|
|
4
|
+
|
|
5
|
+
import json
|
|
6
|
+
from datetime import datetime, timezone
|
|
7
|
+
from pathlib import Path
|
|
8
|
+
from typing import Any, Callable
|
|
9
|
+
|
|
10
|
+
from cli.aikit.catalog import catalog_search
|
|
11
|
+
from cli.aikit.mcp_manifest import mcp_tools
|
|
12
|
+
from cli.aikit.prompt_injection import prompt_injection_eval_fixture
|
|
13
|
+
from cli.aikit.router_explain import explain_route
|
|
14
|
+
from cli.aikit.runtime_paths import ROOT
|
|
15
|
+
|
|
16
|
+
|
|
17
|
+
# Schema identifier stamped into every eval payload built in this module.
EVAL_SCHEMA_VERSION = "agent-devkit.eval/v1"

# Suite identifiers. Aliased suites appear under both spellings
# ("mcp"/"mcp_contract" and "prompt-injection"/"prompt_injection").
SUITES = (
    "routing", "catalog", "write_policy", "source_readiness",
    "mcp", "mcp_contract",
    "prompt-injection", "prompt_injection",
    "mini_brain_limits", "generated_agent_contract",
)
|
|
30
|
+
|
|
31
|
+
|
|
32
|
+
def eval_list() -> dict[str, Any]:
    """Describe the available eval suites.

    Returns an ``eval-suites`` payload with one entry per canonical suite,
    listed under its display id and flagged as deterministic.
    """
    suites = []
    for canonical_id in canonical_suite_ids():
        suites.append({"id": display_suite_id(canonical_id), "deterministic": True})
    return {
        "kind": "eval-suites",
        "schema_version": EVAL_SCHEMA_VERSION,
        "status": "ok",
        "suites": suites,
    }
|
|
39
|
+
|
|
40
|
+
|
|
41
|
+
def eval_run(suite: str, root: Path | None = None) -> dict[str, Any]:
    """Run one eval suite, or every canonical suite when ``suite`` is ``"all"``.

    Args:
        suite: Suite id in any accepted spelling; it is normalized first.
        root: Directory handed to the suite handlers; falls back to ``ROOT``.

    Returns:
        An ``eval-run`` payload. For ``"all"`` its ``checks`` are the per-suite
        run payloads; otherwise they are the checks produced by the handler.

    Raises:
        ValueError: If the normalized suite id has no handler.
    """
    base = root or ROOT
    suite_id = normalize_suite_id(suite)

    if suite_id == "all":
        results = [eval_run(name, base) for name in canonical_suite_ids()]
        any_failed = any(result["status"] != "passed" for result in results)
        return run_payload("all", "failed" if any_failed else "passed", results)

    dispatch: dict[str, Callable[[Path], list[dict[str, Any]]]] = {
        "routing": eval_routing,
        "catalog": eval_catalog,
        "write_policy": eval_write_policy,
        "source_readiness": eval_source_readiness,
        "mcp_contract": eval_mcp_contract,
        "prompt_injection": eval_prompt_injection,
        "mini_brain_limits": eval_mini_brain_limits,
        "generated_agent_contract": eval_generated_agent_contract,
    }
    run_suite = dispatch.get(suite_id)
    if run_suite is None:
        raise ValueError(f"unknown eval suite: {suite_id}")

    outcomes = run_suite(base)
    # The suite passes only when every individual check reports "passed".
    any_failed = any(outcome.get("status") != "passed" for outcome in outcomes)
    return run_payload(display_suite_id(suite_id), "failed" if any_failed else "passed", outcomes)
|
|
64
|
+
|
|
65
|
+
|
|
66
|
+
def eval_report() -> dict[str, Any]:
    """Return the static ``eval-report`` payload.

    The payload always carries an empty ``runs`` list and a message stating
    that persistent eval run reports are not enabled.
    """
    report: dict[str, Any] = {"kind": "eval-report"}
    report["schema_version"] = EVAL_SCHEMA_VERSION
    report["status"] = "ok"
    report["message"] = "Persistent eval run reports are not enabled in the MVP."
    report["runs"] = []
    return report
|
|
74
|
+
|
|
75
|
+
|
|
76
|
+
def eval_routing(root: Path) -> list[dict[str, Any]]:
    """Check that a fixed PR-review request yields at least one route candidate.

    The single returned check passes when ``explain_route`` reports a
    non-empty ``candidates`` value; the decision and candidate count are
    attached as evidence.
    """
    explanation = explain_route("revise as prs que recebi hoje", root)
    candidates = explanation["candidates"]
    outcome = "passed" if candidates else "failed"
    evidence = {"decision": explanation["decision"], "candidates": len(candidates)}
    return [{"id": "routing.pr-review", "status": outcome, "evidence": evidence}]
|
|
85
|
+
|
|
86
|
+
|
|
87
|
+
def eval_catalog(root: Path) -> list[dict[str, Any]]:
    """Check that searching the catalog for ``"pr"`` returns at least one item.

    The check also reports the ``count`` value from the search payload.
    """
    result = catalog_search("pr", root)
    check: dict[str, Any] = {"id": "catalog.search-pr"}
    check["status"] = "passed" if result["items"] else "failed"
    check["count"] = result["count"]
    return [check]
|
|
90
|
+
|
|
91
|
+
|
|
92
|
+
def eval_write_policy(_root: Path) -> list[dict[str, Any]]:
    """Return the fixed, always-passing write-policy check; ``_root`` is unused."""
    check: dict[str, Any] = {"id": "write-policy.normalized", "status": "passed"}
    return [check]
|
|
94
|
+
|
|
95
|
+
|
|
96
|
+
def eval_source_readiness(_root: Path) -> list[dict[str, Any]]:
    """Return the fixed, always-passing source-readiness check; ``_root`` is unused."""
    check: dict[str, Any] = {"id": "source-readiness.no-external-required", "status": "passed"}
    return [check]
|
|
98
|
+
|
|
99
|
+
|
|
100
|
+
def eval_mcp_contract(_root: Path) -> list[dict[str, Any]]:
    """Check that the MCP manifest exposes every required tool name.

    The check passes when all required names appear among the ``name`` values
    returned by ``mcp_tools``; the sorted required names are included in the
    result. ``_root`` is unused.
    """
    available = set()
    for tool in mcp_tools():
        available.add(tool["name"])
    required = {"agent_devkit_catalog_search", "agent_devkit_route_explain", "agent_devkit_roadmap"}
    outcome = "passed" if required.issubset(available) else "failed"
    return [{"id": "mcp.v2-tools", "status": outcome, "required": sorted(required)}]
|
|
104
|
+
|
|
105
|
+
|
|
106
|
+
def eval_prompt_injection(_root: Path) -> list[dict[str, Any]]:
    """Wrap the prompt-injection eval fixture in a one-element check list; ``_root`` is unused."""
    fixture = prompt_injection_eval_fixture()
    return [fixture]
|
|
108
|
+
|
|
109
|
+
|
|
110
|
+
def eval_mini_brain_limits(_root: Path) -> list[dict[str, Any]]:
    """Check that ``external_write_decision`` is listed in the mini-brain's forbidden tasks.

    ``_root`` is unused. ``FORBIDDEN_TASKS`` is imported inside the function,
    as in the original implementation.
    """
    from cli.aikit.mini_brain import FORBIDDEN_TASKS

    is_forbidden = "external_write_decision" in FORBIDDEN_TASKS
    outcome = "passed" if is_forbidden else "failed"
    return [{"id": "mini-brain.forbidden-high-risk", "status": outcome}]
|
|
114
|
+
|
|
115
|
+
|
|
116
|
+
def eval_generated_agent_contract(_root: Path) -> list[dict[str, Any]]:
    """Return the fixed, always-passing placeholder check for generated agents; ``_root`` is unused."""
    check: dict[str, Any] = {"id": "generated-agent.contract-placeholder", "status": "passed"}
    return [check]
|
|
118
|
+
|
|
119
|
+
|
|
120
|
+
def run_payload(
    suite: str,
    status: str,
    checks: list[dict[str, Any]],
    started_at: datetime | None = None,
) -> dict[str, Any]:
    """Assemble the ``eval-run`` payload for a finished suite run.

    Args:
        suite: Suite id to report.
        status: Overall status; ``ok`` is true only when it equals ``"passed"``.
        checks: Check results. They are round-tripped through JSON, so the
            payload holds an independent, JSON-compatible copy.
        started_at: Optional moment the run actually started. Callers that want
            a meaningful duration should pass a timezone-aware UTC datetime
            captured before running the suite. When omitted, the start is
            reported as equal to the finish time.

    Returns:
        The payload dict with ``kind``, ``schema_version``, ``suite``,
        ``status``, ``ok``, ``started_at``, ``finished_at`` and ``checks``.

    Raises:
        TypeError: If ``checks`` contains values ``json.dumps`` cannot serialize.
    """
    # Take a single clock reading: this function only runs once the suite has
    # finished, so two separate now() calls would report a fake "duration" of
    # a few microseconds rather than anything about the run itself.
    finished = datetime.now(timezone.utc)
    started = finished if started_at is None else started_at
    return {
        "kind": "eval-run",
        "schema_version": EVAL_SCHEMA_VERSION,
        "suite": suite,
        "status": status,
        "ok": status == "passed",
        "started_at": started.isoformat(),
        "finished_at": finished.isoformat(),
        "checks": json.loads(json.dumps(checks, ensure_ascii=False)),
    }
|
|
131
|
+
|
|
132
|
+
|
|
133
|
+
def canonical_suite_ids() -> list[str]:
    """Return a new list of the canonical (internal) suite ids, in run order."""
    ordered = (
        "routing",
        "catalog",
        "write_policy",
        "source_readiness",
        "mcp_contract",
        "prompt_injection",
        "mini_brain_limits",
        "generated_agent_contract",
    )
    # Hand out a fresh list on every call so callers may mutate their copy.
    return list(ordered)
|
|
144
|
+
|
|
145
|
+
|
|
146
|
+
def normalize_suite_id(value: str) -> str:
    """Map a user-supplied suite name to its canonical internal id.

    Surrounding whitespace is stripped, the name is lower-cased and hyphens
    become underscores, so ``"Prompt-Injection"`` and ``"prompt_injection"``
    resolve to the same id. The short alias ``"mcp"`` expands to
    ``"mcp_contract"``. A falsy value (``None`` or ``""``) yields ``""``.
    """
    # Every canonical id is lower-case, so folding case cannot make two
    # distinct suites collide; it only stops "MCP" or "ALL" being rejected.
    normalized = (value or "").strip().lower().replace("-", "_")
    if normalized == "mcp":
        return "mcp_contract"
    return normalized
|
|
151
|
+
|
|
152
|
+
|
|
153
|
+
def display_suite_id(value: str) -> str:
    """Translate a canonical suite id into the id shown to users.

    Only ``"prompt_injection"`` (shown as ``"prompt-injection"``) and
    ``"mcp_contract"`` (shown as ``"mcp"``) differ; any other value is
    returned unchanged.
    """
    renamed = (
        ("prompt_injection", "prompt-injection"),
        ("mcp_contract", "mcp"),
    )
    for internal_id, public_id in renamed:
        if value == internal_id:
            return public_id
    return value
|
|
@@ -101,13 +101,34 @@ def build_review_prompt(
|
|
|
101
101
|
"coordinator": (execution_plan.get("coordinator_agent") or {}).get("id") if isinstance(execution_plan.get("coordinator_agent"), dict) else None,
|
|
102
102
|
"specialist_tasks": [
|
|
103
103
|
{
|
|
104
|
+
"task_id": task.get("task_id") or task.get("id"),
|
|
104
105
|
"agent_id": task.get("agent_id"),
|
|
105
106
|
"capability_id": task.get("capability_id"),
|
|
107
|
+
"role": task.get("role"),
|
|
108
|
+
"depends_on": list(task.get("depends_on") or []),
|
|
106
109
|
"status": task.get("status"),
|
|
107
110
|
}
|
|
108
111
|
for task in execution_plan.get("specialist_tasks") or []
|
|
109
112
|
if isinstance(task, dict)
|
|
110
113
|
],
|
|
114
|
+
"collaboration_enabled": execution_plan.get("collaboration_enabled") is True,
|
|
115
|
+
"shared_context_counts": {
|
|
116
|
+
key: len((execution_plan.get("shared_context") or {}).get(key) or [])
|
|
117
|
+
for key in (
|
|
118
|
+
"facts",
|
|
119
|
+
"inferences",
|
|
120
|
+
"artifacts",
|
|
121
|
+
"blockers",
|
|
122
|
+
"decisions",
|
|
123
|
+
"risks",
|
|
124
|
+
"questions",
|
|
125
|
+
"handoffs",
|
|
126
|
+
"conflicts",
|
|
127
|
+
"human_escalations",
|
|
128
|
+
)
|
|
129
|
+
}
|
|
130
|
+
if isinstance(execution_plan.get("shared_context"), dict)
|
|
131
|
+
else None,
|
|
111
132
|
}
|
|
112
133
|
return "\n".join(
|
|
113
134
|
[
|