agentic-flow 1.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude/agents/MIGRATION_SUMMARY.md +222 -0
- package/.claude/agents/README.md +89 -0
- package/.claude/agents/analysis/code-analyzer.md +209 -0
- package/.claude/agents/analysis/code-review/analyze-code-quality.md +180 -0
- package/.claude/agents/architecture/system-design/arch-system-design.md +156 -0
- package/.claude/agents/base-template-generator.md +42 -0
- package/.claude/agents/consensus/README.md +253 -0
- package/.claude/agents/consensus/byzantine-coordinator.md +63 -0
- package/.claude/agents/consensus/crdt-synchronizer.md +997 -0
- package/.claude/agents/consensus/gossip-coordinator.md +63 -0
- package/.claude/agents/consensus/performance-benchmarker.md +851 -0
- package/.claude/agents/consensus/quorum-manager.md +823 -0
- package/.claude/agents/consensus/raft-manager.md +63 -0
- package/.claude/agents/consensus/security-manager.md +622 -0
- package/.claude/agents/core/coder.md +211 -0
- package/.claude/agents/core/planner.md +116 -0
- package/.claude/agents/core/researcher.md +136 -0
- package/.claude/agents/core/reviewer.md +272 -0
- package/.claude/agents/core/tester.md +266 -0
- package/.claude/agents/data/ml/data-ml-model.md +193 -0
- package/.claude/agents/development/backend/dev-backend-api.md +142 -0
- package/.claude/agents/devops/ci-cd/ops-cicd-github.md +164 -0
- package/.claude/agents/documentation/api-docs/docs-api-openapi.md +174 -0
- package/.claude/agents/flow-nexus/app-store.md +88 -0
- package/.claude/agents/flow-nexus/authentication.md +69 -0
- package/.claude/agents/flow-nexus/challenges.md +81 -0
- package/.claude/agents/flow-nexus/neural-network.md +88 -0
- package/.claude/agents/flow-nexus/payments.md +83 -0
- package/.claude/agents/flow-nexus/sandbox.md +76 -0
- package/.claude/agents/flow-nexus/swarm.md +76 -0
- package/.claude/agents/flow-nexus/user-tools.md +96 -0
- package/.claude/agents/flow-nexus/workflow.md +84 -0
- package/.claude/agents/github/code-review-swarm.md +538 -0
- package/.claude/agents/github/github-modes.md +173 -0
- package/.claude/agents/github/issue-tracker.md +319 -0
- package/.claude/agents/github/multi-repo-swarm.md +553 -0
- package/.claude/agents/github/pr-manager.md +191 -0
- package/.claude/agents/github/project-board-sync.md +509 -0
- package/.claude/agents/github/release-manager.md +367 -0
- package/.claude/agents/github/release-swarm.md +583 -0
- package/.claude/agents/github/repo-architect.md +398 -0
- package/.claude/agents/github/swarm-issue.md +573 -0
- package/.claude/agents/github/swarm-pr.md +428 -0
- package/.claude/agents/github/sync-coordinator.md +452 -0
- package/.claude/agents/github/workflow-automation.md +635 -0
- package/.claude/agents/goal/agent.md +816 -0
- package/.claude/agents/goal/goal-planner.md +73 -0
- package/.claude/agents/optimization/README.md +250 -0
- package/.claude/agents/optimization/benchmark-suite.md +665 -0
- package/.claude/agents/optimization/load-balancer.md +431 -0
- package/.claude/agents/optimization/performance-monitor.md +672 -0
- package/.claude/agents/optimization/resource-allocator.md +674 -0
- package/.claude/agents/optimization/topology-optimizer.md +808 -0
- package/.claude/agents/payments/agentic-payments.md +126 -0
- package/.claude/agents/sparc/architecture.md +472 -0
- package/.claude/agents/sparc/pseudocode.md +318 -0
- package/.claude/agents/sparc/refinement.md +525 -0
- package/.claude/agents/sparc/specification.md +276 -0
- package/.claude/agents/specialized/mobile/spec-mobile-react-native.md +226 -0
- package/.claude/agents/sublinear/consensus-coordinator.md +338 -0
- package/.claude/agents/sublinear/matrix-optimizer.md +185 -0
- package/.claude/agents/sublinear/pagerank-analyzer.md +299 -0
- package/.claude/agents/sublinear/performance-optimizer.md +368 -0
- package/.claude/agents/sublinear/trading-predictor.md +246 -0
- package/.claude/agents/swarm/README.md +190 -0
- package/.claude/agents/swarm/adaptive-coordinator.md +396 -0
- package/.claude/agents/swarm/hierarchical-coordinator.md +256 -0
- package/.claude/agents/swarm/mesh-coordinator.md +392 -0
- package/.claude/agents/templates/automation-smart-agent.md +205 -0
- package/.claude/agents/templates/coordinator-swarm-init.md +90 -0
- package/.claude/agents/templates/github-pr-manager.md +177 -0
- package/.claude/agents/templates/implementer-sparc-coder.md +259 -0
- package/.claude/agents/templates/memory-coordinator.md +187 -0
- package/.claude/agents/templates/migration-plan.md +746 -0
- package/.claude/agents/templates/orchestrator-task.md +139 -0
- package/.claude/agents/templates/performance-analyzer.md +199 -0
- package/.claude/agents/templates/sparc-coordinator.md +183 -0
- package/.claude/agents/test-neural.md +14 -0
- package/.claude/agents/testing/unit/tdd-london-swarm.md +244 -0
- package/.claude/agents/testing/validation/production-validator.md +395 -0
- package/.claude/commands/agents/README.md +10 -0
- package/.claude/commands/agents/agent-capabilities.md +21 -0
- package/.claude/commands/agents/agent-coordination.md +28 -0
- package/.claude/commands/agents/agent-spawning.md +28 -0
- package/.claude/commands/agents/agent-types.md +26 -0
- package/.claude/commands/analysis/COMMAND_COMPLIANCE_REPORT.md +54 -0
- package/.claude/commands/analysis/README.md +9 -0
- package/.claude/commands/analysis/bottleneck-detect.md +162 -0
- package/.claude/commands/analysis/performance-bottlenecks.md +59 -0
- package/.claude/commands/analysis/performance-report.md +25 -0
- package/.claude/commands/analysis/token-efficiency.md +45 -0
- package/.claude/commands/analysis/token-usage.md +25 -0
- package/.claude/commands/automation/README.md +9 -0
- package/.claude/commands/automation/auto-agent.md +122 -0
- package/.claude/commands/automation/self-healing.md +106 -0
- package/.claude/commands/automation/session-memory.md +90 -0
- package/.claude/commands/automation/smart-agents.md +73 -0
- package/.claude/commands/automation/smart-spawn.md +25 -0
- package/.claude/commands/automation/workflow-select.md +25 -0
- package/.claude/commands/claude-flow-help.md +103 -0
- package/.claude/commands/claude-flow-memory.md +107 -0
- package/.claude/commands/claude-flow-swarm.md +205 -0
- package/.claude/commands/coordination/README.md +9 -0
- package/.claude/commands/coordination/agent-spawn.md +25 -0
- package/.claude/commands/coordination/init.md +44 -0
- package/.claude/commands/coordination/orchestrate.md +43 -0
- package/.claude/commands/coordination/spawn.md +45 -0
- package/.claude/commands/coordination/swarm-init.md +85 -0
- package/.claude/commands/coordination/task-orchestrate.md +25 -0
- package/.claude/commands/flow-nexus/app-store.md +124 -0
- package/.claude/commands/flow-nexus/challenges.md +120 -0
- package/.claude/commands/flow-nexus/login-registration.md +65 -0
- package/.claude/commands/flow-nexus/neural-network.md +134 -0
- package/.claude/commands/flow-nexus/payments.md +116 -0
- package/.claude/commands/flow-nexus/sandbox.md +83 -0
- package/.claude/commands/flow-nexus/swarm.md +87 -0
- package/.claude/commands/flow-nexus/user-tools.md +152 -0
- package/.claude/commands/flow-nexus/workflow.md +115 -0
- package/.claude/commands/github/README.md +11 -0
- package/.claude/commands/github/code-review-swarm.md +514 -0
- package/.claude/commands/github/code-review.md +25 -0
- package/.claude/commands/github/github-modes.md +147 -0
- package/.claude/commands/github/github-swarm.md +121 -0
- package/.claude/commands/github/issue-tracker.md +292 -0
- package/.claude/commands/github/issue-triage.md +25 -0
- package/.claude/commands/github/multi-repo-swarm.md +519 -0
- package/.claude/commands/github/pr-enhance.md +26 -0
- package/.claude/commands/github/pr-manager.md +170 -0
- package/.claude/commands/github/project-board-sync.md +471 -0
- package/.claude/commands/github/release-manager.md +338 -0
- package/.claude/commands/github/release-swarm.md +544 -0
- package/.claude/commands/github/repo-analyze.md +25 -0
- package/.claude/commands/github/repo-architect.md +367 -0
- package/.claude/commands/github/swarm-issue.md +482 -0
- package/.claude/commands/github/swarm-pr.md +285 -0
- package/.claude/commands/github/sync-coordinator.md +301 -0
- package/.claude/commands/github/workflow-automation.md +442 -0
- package/.claude/commands/hive-mind/README.md +17 -0
- package/.claude/commands/hive-mind/hive-mind-consensus.md +8 -0
- package/.claude/commands/hive-mind/hive-mind-init.md +18 -0
- package/.claude/commands/hive-mind/hive-mind-memory.md +8 -0
- package/.claude/commands/hive-mind/hive-mind-metrics.md +8 -0
- package/.claude/commands/hive-mind/hive-mind-resume.md +8 -0
- package/.claude/commands/hive-mind/hive-mind-sessions.md +8 -0
- package/.claude/commands/hive-mind/hive-mind-spawn.md +21 -0
- package/.claude/commands/hive-mind/hive-mind-status.md +8 -0
- package/.claude/commands/hive-mind/hive-mind-stop.md +8 -0
- package/.claude/commands/hive-mind/hive-mind-wizard.md +8 -0
- package/.claude/commands/hive-mind/hive-mind.md +27 -0
- package/.claude/commands/hooks/README.md +11 -0
- package/.claude/commands/hooks/overview.md +58 -0
- package/.claude/commands/hooks/post-edit.md +117 -0
- package/.claude/commands/hooks/post-task.md +112 -0
- package/.claude/commands/hooks/pre-edit.md +113 -0
- package/.claude/commands/hooks/pre-task.md +111 -0
- package/.claude/commands/hooks/session-end.md +118 -0
- package/.claude/commands/hooks/setup.md +103 -0
- package/.claude/commands/memory/README.md +9 -0
- package/.claude/commands/memory/memory-persist.md +25 -0
- package/.claude/commands/memory/memory-search.md +25 -0
- package/.claude/commands/memory/memory-usage.md +25 -0
- package/.claude/commands/memory/neural.md +47 -0
- package/.claude/commands/memory/usage.md +46 -0
- package/.claude/commands/monitoring/README.md +9 -0
- package/.claude/commands/monitoring/agent-metrics.md +25 -0
- package/.claude/commands/monitoring/agents.md +44 -0
- package/.claude/commands/monitoring/real-time-view.md +25 -0
- package/.claude/commands/monitoring/status.md +46 -0
- package/.claude/commands/monitoring/swarm-monitor.md +25 -0
- package/.claude/commands/optimization/README.md +9 -0
- package/.claude/commands/optimization/auto-topology.md +62 -0
- package/.claude/commands/optimization/cache-manage.md +25 -0
- package/.claude/commands/optimization/parallel-execute.md +25 -0
- package/.claude/commands/optimization/parallel-execution.md +50 -0
- package/.claude/commands/optimization/topology-optimize.md +25 -0
- package/.claude/commands/pair/README.md +261 -0
- package/.claude/commands/pair/commands.md +546 -0
- package/.claude/commands/pair/config.md +510 -0
- package/.claude/commands/pair/examples.md +512 -0
- package/.claude/commands/pair/modes.md +348 -0
- package/.claude/commands/pair/session.md +407 -0
- package/.claude/commands/pair/start.md +209 -0
- package/.claude/commands/sparc/analyzer.md +52 -0
- package/.claude/commands/sparc/architect.md +53 -0
- package/.claude/commands/sparc/ask.md +97 -0
- package/.claude/commands/sparc/batch-executor.md +54 -0
- package/.claude/commands/sparc/code.md +89 -0
- package/.claude/commands/sparc/coder.md +54 -0
- package/.claude/commands/sparc/debug.md +83 -0
- package/.claude/commands/sparc/debugger.md +54 -0
- package/.claude/commands/sparc/designer.md +53 -0
- package/.claude/commands/sparc/devops.md +109 -0
- package/.claude/commands/sparc/docs-writer.md +80 -0
- package/.claude/commands/sparc/documenter.md +54 -0
- package/.claude/commands/sparc/innovator.md +54 -0
- package/.claude/commands/sparc/integration.md +83 -0
- package/.claude/commands/sparc/mcp.md +117 -0
- package/.claude/commands/sparc/memory-manager.md +54 -0
- package/.claude/commands/sparc/optimizer.md +54 -0
- package/.claude/commands/sparc/orchestrator.md +132 -0
- package/.claude/commands/sparc/post-deployment-monitoring-mode.md +83 -0
- package/.claude/commands/sparc/refinement-optimization-mode.md +83 -0
- package/.claude/commands/sparc/researcher.md +54 -0
- package/.claude/commands/sparc/reviewer.md +54 -0
- package/.claude/commands/sparc/security-review.md +80 -0
- package/.claude/commands/sparc/sparc-modes.md +174 -0
- package/.claude/commands/sparc/sparc.md +111 -0
- package/.claude/commands/sparc/spec-pseudocode.md +80 -0
- package/.claude/commands/sparc/supabase-admin.md +348 -0
- package/.claude/commands/sparc/swarm-coordinator.md +54 -0
- package/.claude/commands/sparc/tdd.md +54 -0
- package/.claude/commands/sparc/tester.md +54 -0
- package/.claude/commands/sparc/tutorial.md +79 -0
- package/.claude/commands/sparc/workflow-manager.md +54 -0
- package/.claude/commands/sparc.md +166 -0
- package/.claude/commands/stream-chain/pipeline.md +121 -0
- package/.claude/commands/stream-chain/run.md +70 -0
- package/.claude/commands/swarm/README.md +15 -0
- package/.claude/commands/swarm/analysis.md +95 -0
- package/.claude/commands/swarm/development.md +96 -0
- package/.claude/commands/swarm/examples.md +168 -0
- package/.claude/commands/swarm/maintenance.md +102 -0
- package/.claude/commands/swarm/optimization.md +117 -0
- package/.claude/commands/swarm/research.md +136 -0
- package/.claude/commands/swarm/swarm-analysis.md +8 -0
- package/.claude/commands/swarm/swarm-background.md +8 -0
- package/.claude/commands/swarm/swarm-init.md +19 -0
- package/.claude/commands/swarm/swarm-modes.md +8 -0
- package/.claude/commands/swarm/swarm-monitor.md +8 -0
- package/.claude/commands/swarm/swarm-spawn.md +19 -0
- package/.claude/commands/swarm/swarm-status.md +8 -0
- package/.claude/commands/swarm/swarm-strategies.md +8 -0
- package/.claude/commands/swarm/swarm.md +27 -0
- package/.claude/commands/swarm/testing.md +131 -0
- package/.claude/commands/training/README.md +9 -0
- package/.claude/commands/training/model-update.md +25 -0
- package/.claude/commands/training/neural-patterns.md +74 -0
- package/.claude/commands/training/neural-train.md +25 -0
- package/.claude/commands/training/pattern-learn.md +25 -0
- package/.claude/commands/training/specialization.md +63 -0
- package/.claude/commands/truth/start.md +143 -0
- package/.claude/commands/verify/check.md +50 -0
- package/.claude/commands/verify/start.md +128 -0
- package/.claude/commands/workflows/README.md +9 -0
- package/.claude/commands/workflows/development.md +78 -0
- package/.claude/commands/workflows/research.md +63 -0
- package/.claude/commands/workflows/workflow-create.md +25 -0
- package/.claude/commands/workflows/workflow-execute.md +25 -0
- package/.claude/commands/workflows/workflow-export.md +25 -0
- package/.claude/helpers/checkpoint-manager.sh +251 -0
- package/.claude/helpers/github-safe.js +106 -0
- package/.claude/helpers/github-setup.sh +28 -0
- package/.claude/helpers/quick-start.sh +19 -0
- package/.claude/helpers/setup-mcp.sh +18 -0
- package/.claude/helpers/standard-checkpoint-hooks.sh +179 -0
- package/.claude/mcp.json +13 -0
- package/.claude/settings-backup.json +130 -0
- package/.claude/settings-optimized.json +116 -0
- package/.claude/settings-simple.json +78 -0
- package/.claude/settings.json +114 -0
- package/.claude/settings.local.json +14 -0
- package/README.md +1280 -0
- package/dist/agents/claudeAgent.js +73 -0
- package/dist/agents/claudeFlowAgent.js +115 -0
- package/dist/agents/codeReviewAgent.js +34 -0
- package/dist/agents/dataAgent.js +34 -0
- package/dist/agents/directApiAgent.js +260 -0
- package/dist/agents/webResearchAgent.js +35 -0
- package/dist/cli/mcp.js +135 -0
- package/dist/cli-proxy.js +246 -0
- package/dist/cli.js +158 -0
- package/dist/config/claudeFlow.js +67 -0
- package/dist/config/tools.js +33 -0
- package/dist/coordination/parallelSwarm.js +226 -0
- package/dist/examples/multi-agent-orchestration.js +45 -0
- package/dist/examples/parallel-swarm-deployment.js +171 -0
- package/dist/examples/use-goal-planner.js +52 -0
- package/dist/health.js +46 -0
- package/dist/index-with-proxy.js +101 -0
- package/dist/index.js +167 -0
- package/dist/mcp/claudeFlowSdkServer.js +202 -0
- package/dist/mcp/fastmcp/servers/claude-flow-sdk.js +198 -0
- package/dist/mcp/fastmcp/servers/http-streaming-updated.js +421 -0
- package/dist/mcp/fastmcp/servers/poc-stdio.js +82 -0
- package/dist/mcp/fastmcp/servers/stdio-full.js +421 -0
- package/dist/mcp/fastmcp/tools/agent/add-agent.js +107 -0
- package/dist/mcp/fastmcp/tools/agent/add-command.js +117 -0
- package/dist/mcp/fastmcp/tools/agent/execute.js +56 -0
- package/dist/mcp/fastmcp/tools/agent/list.js +82 -0
- package/dist/mcp/fastmcp/tools/agent/parallel.js +63 -0
- package/dist/mcp/fastmcp/tools/memory/retrieve.js +38 -0
- package/dist/mcp/fastmcp/tools/memory/search.js +41 -0
- package/dist/mcp/fastmcp/tools/memory/store.js +56 -0
- package/dist/mcp/fastmcp/tools/swarm/init.js +41 -0
- package/dist/mcp/fastmcp/tools/swarm/orchestrate.js +47 -0
- package/dist/mcp/fastmcp/tools/swarm/spawn.js +40 -0
- package/dist/mcp/fastmcp/types/index.js +2 -0
- package/dist/proxy/anthropic-to-openrouter.js +246 -0
- package/dist/router/providers/anthropic.js +89 -0
- package/dist/router/providers/onnx-local-optimized.js +167 -0
- package/dist/router/providers/onnx-local.js +294 -0
- package/dist/router/providers/onnx-phi4.js +190 -0
- package/dist/router/providers/onnx.js +242 -0
- package/dist/router/providers/openrouter.js +242 -0
- package/dist/router/router.js +283 -0
- package/dist/router/test-integration.js +140 -0
- package/dist/router/test-onnx-benchmark.js +145 -0
- package/dist/router/test-onnx-integration.js +128 -0
- package/dist/router/test-onnx-local.js +37 -0
- package/dist/router/test-onnx.js +148 -0
- package/dist/router/test-openrouter.js +121 -0
- package/dist/router/test-phi4.js +137 -0
- package/dist/router/types.js +2 -0
- package/dist/utils/agentLoader.js +106 -0
- package/dist/utils/cli.js +128 -0
- package/dist/utils/logger.js +41 -0
- package/dist/utils/mcpCommands.js +214 -0
- package/dist/utils/model-downloader.js +182 -0
- package/dist/utils/retry.js +54 -0
- package/docs/.claude-flow/metrics/agent-metrics.json +1 -0
- package/docs/.claude-flow/metrics/performance.json +9 -0
- package/docs/.claude-flow/metrics/task-metrics.json +10 -0
- package/docs/CHANGELOG.md +155 -0
- package/docs/CLAUDE.md +352 -0
- package/docs/COMPLETE_VALIDATION_SUMMARY.md +405 -0
- package/docs/INDEX.md +183 -0
- package/docs/LICENSE +21 -0
- package/docs/ONNX_CLI_USAGE.md +344 -0
- package/docs/ONNX_ENV_VARS.md +564 -0
- package/docs/ONNX_INTEGRATION.md +422 -0
- package/docs/ONNX_OPTIMIZATION_GUIDE.md +665 -0
- package/docs/ONNX_OPTIMIZATION_SUMMARY.md +374 -0
- package/docs/ONNX_VS_CLAUDE_QUALITY.md +442 -0
- package/docs/OPENROUTER_DEPLOYMENT.md +495 -0
- package/docs/architecture/EXECUTIVE_SUMMARY.md +310 -0
- package/docs/architecture/IMPROVEMENT_PLAN.md +11 -0
- package/docs/architecture/INTEGRATION-STATUS.md +290 -0
- package/docs/architecture/MULTI_MODEL_ROUTER_PLAN.md +620 -0
- package/docs/architecture/QUICK_WINS.md +333 -0
- package/docs/architecture/README.md +15 -0
- package/docs/architecture/RESEARCH_SUMMARY.md +652 -0
- package/docs/archived/FASTMCP_COMPLETE.md +428 -0
- package/docs/archived/FASTMCP_INTEGRATION_STATUS.md +288 -0
- package/docs/archived/FLOW-NEXUS-COMPLETE.md +269 -0
- package/docs/archived/INTEGRATION_CONFIRMED.md +351 -0
- package/docs/archived/ONNX_FINAL_REPORT.md +312 -0
- package/docs/archived/ONNX_IMPLEMENTATION_COMPLETE.md +215 -0
- package/docs/archived/ONNX_IMPLEMENTATION_SUMMARY.md +197 -0
- package/docs/archived/ONNX_SUCCESS_REPORT.md +271 -0
- package/docs/archived/OPENROUTER_PROXY_COMPLETE.md +494 -0
- package/docs/archived/PACKAGE-COMPLETE.md +138 -0
- package/docs/archived/README.md +27 -0
- package/docs/archived/RESEARCH_COMPLETE.txt +335 -0
- package/docs/archived/SDK-SETUP-COMPLETE.md +252 -0
- package/docs/guides/ALTERNATIVE_LLM_MODELS.md +524 -0
- package/docs/guides/DOCKER_AGENT_USAGE.md +352 -0
- package/docs/guides/IMPLEMENTATION_EXAMPLES.md +960 -0
- package/docs/guides/NPM-PUBLISH.md +218 -0
- package/docs/guides/README.md +17 -0
- package/docs/guides/agent-sdk.md +234 -0
- package/docs/integrations/CLAUDE_AGENTS_INTEGRATION.md +356 -0
- package/docs/integrations/CLAUDE_FLOW_INTEGRATION.md +535 -0
- package/docs/integrations/FASTMCP_CLI_INTEGRATION.md +503 -0
- package/docs/integrations/FLOW-NEXUS-INTEGRATION.md +319 -0
- package/docs/integrations/README.md +18 -0
- package/docs/integrations/fastmcp-implementation-plan.md +2516 -0
- package/docs/integrations/fastmcp-poc-integration.md +198 -0
- package/docs/router/ONNX_PHI4_RESEARCH.md +220 -0
- package/docs/router/ONNX_RUNTIME_INTEGRATION_PLAN.md +866 -0
- package/docs/router/PHI4_HYPEROPTIMIZATION_PLAN.md +2488 -0
- package/docs/router/README.md +552 -0
- package/docs/router/ROUTER_CONFIG_REFERENCE.md +577 -0
- package/docs/router/ROUTER_USER_GUIDE.md +865 -0
- package/docs/validation/DOCKER_MCP_VALIDATION.md +358 -0
- package/docs/validation/DOCKER_OPENROUTER_VALIDATION.md +443 -0
- package/docs/validation/FINAL_SYSTEM_VALIDATION.md +458 -0
- package/docs/validation/FINAL_VALIDATION_SUMMARY.md +409 -0
- package/docs/validation/MCP_CLI_TOOLS_VALIDATION.md +266 -0
- package/docs/validation/MODEL_VALIDATION_REPORT.md +386 -0
- package/docs/validation/OPENROUTER_VALIDATION_COMPLETE.md +382 -0
- package/docs/validation/README.md +20 -0
- package/docs/validation/ROUTER_VALIDATION.md +311 -0
- package/package.json +140 -0
|
@@ -0,0 +1,344 @@
|
|
|
1
|
+
# ONNX Local Inference - CLI Usage Guide
|
|
2
|
+
|
|
3
|
+
## Quick Start
|
|
4
|
+
|
|
5
|
+
Run AI agents with **100% free local inference** using Microsoft's Phi-4-mini model:
|
|
6
|
+
|
|
7
|
+
```bash
|
|
8
|
+
# Auto-downloads Phi-4-mini (~4.9GB one-time download)
|
|
9
|
+
npx agentic-flow --agent coder --task "Create hello world" --provider onnx
|
|
10
|
+
```
|
|
11
|
+
|
|
12
|
+
## Installation & Setup
|
|
13
|
+
|
|
14
|
+
### Prerequisites
|
|
15
|
+
- Node.js 18+
|
|
16
|
+
- ~5GB disk space for the Phi-4-mini model
|
|
17
|
+
- Internet connection for first-time download
|
|
18
|
+
|
|
19
|
+
### Automatic Model Download
|
|
20
|
+
|
|
21
|
+
The Phi-4-mini ONNX model downloads automatically on first use:
|
|
22
|
+
|
|
23
|
+
```bash
|
|
24
|
+
npx agentic-flow --agent coder --task "test" --provider onnx
|
|
25
|
+
|
|
26
|
+
# Output:
|
|
27
|
+
# 🔍 Phi-4-mini ONNX model not found locally
|
|
28
|
+
# 📥 Starting automatic download...
|
|
29
|
+
# This is a one-time download (~4.9GB total)
|
|
30
|
+
# Model: microsoft/Phi-4-mini-instruct-onnx (INT4 quantized)
|
|
31
|
+
# Files: model.onnx (~52MB) + model.onnx.data (~4.86GB)
|
|
32
|
+
#
|
|
33
|
+
# 📦 Downloading model.onnx...
|
|
34
|
+
# ✅ Model downloaded successfully
|
|
35
|
+
#
|
|
36
|
+
# 📦 Downloading model.onnx.data (this is the large 4.86GB file)...
|
|
37
|
+
# 📥 Downloading: 10.0% (463.16/4631.59 MB)
|
|
38
|
+
# 📥 Downloading: 20.0% (926.32/4631.59 MB)
|
|
39
|
+
# ...
|
|
40
|
+
# ✅ Model downloaded successfully
|
|
41
|
+
```
|
|
42
|
+
|
|
43
|
+
## CLI Usage
|
|
44
|
+
|
|
45
|
+
### Basic Commands
|
|
46
|
+
|
|
47
|
+
```bash
|
|
48
|
+
# Use ONNX provider with --provider flag
|
|
49
|
+
npx agentic-flow --agent <agent> --task "<task>" --provider onnx
|
|
50
|
+
|
|
51
|
+
# Examples
|
|
52
|
+
npx agentic-flow --agent coder --task "Write Python hello world" --provider onnx
|
|
53
|
+
npx agentic-flow --agent researcher --task "Analyze AI trends" --provider onnx
|
|
54
|
+
npx agentic-flow --agent reviewer --task "Review code quality" --provider onnx
|
|
55
|
+
```
|
|
56
|
+
|
|
57
|
+
### Environment Variables
|
|
58
|
+
|
|
59
|
+
```bash
|
|
60
|
+
# Force ONNX for all commands
|
|
61
|
+
export USE_ONNX=true
|
|
62
|
+
npx agentic-flow --agent coder --task "Build API"
|
|
63
|
+
|
|
64
|
+
# Or set provider explicitly
|
|
65
|
+
export PROVIDER=onnx
|
|
66
|
+
npx agentic-flow --agent coder --task "Build API"
|
|
67
|
+
|
|
68
|
+
# Enable optimizations for better quality and speed
|
|
69
|
+
export ONNX_OPTIMIZED=true
|
|
70
|
+
|
|
71
|
+
# Custom model path (if downloaded manually)
|
|
72
|
+
export ONNX_MODEL_PATH=./path/to/model.onnx
|
|
73
|
+
|
|
74
|
+
# GPU acceleration (10-50x faster!)
|
|
75
|
+
export ONNX_EXECUTION_PROVIDERS=cuda,cpu # NVIDIA
|
|
76
|
+
# export ONNX_EXECUTION_PROVIDERS=dml,cpu # Windows DirectML
|
|
77
|
+
# export ONNX_EXECUTION_PROVIDERS=coreml,cpu # macOS Metal
|
|
78
|
+
```
|
|
79
|
+
|
|
80
|
+
**See full environment variable reference:** [ONNX_ENV_VARS.md](./ONNX_ENV_VARS.md)
|
|
81
|
+
|
|
82
|
+
### Available Agents
|
|
83
|
+
|
|
84
|
+
All 75+ agents work with the ONNX provider:
|
|
85
|
+
|
|
86
|
+
**Core Development:**
|
|
87
|
+
- `coder` - Code generation
|
|
88
|
+
- `reviewer` - Code review
|
|
89
|
+
- `tester` - Test creation
|
|
90
|
+
- `researcher` - Research & analysis
|
|
91
|
+
|
|
92
|
+
**Specialized:**
|
|
93
|
+
- `backend-dev` - Backend APIs
|
|
94
|
+
- `mobile-dev` - Mobile apps
|
|
95
|
+
- `ml-developer` - ML models
|
|
96
|
+
- `cicd-engineer` - CI/CD pipelines
|
|
97
|
+
- `api-docs` - API documentation
|
|
98
|
+
|
|
99
|
+
See full list: `npx agentic-flow --list`
|
|
100
|
+
|
|
101
|
+
## Performance
|
|
102
|
+
|
|
103
|
+
### CPU Performance (Intel i7)
|
|
104
|
+
- **Speed:** ~6 tokens/second (base), ~12 tokens/sec (optimized)
|
|
105
|
+
- **Latency:** ~3s for 20 tokens, ~16s for 100 tokens
|
|
106
|
+
- **Cost:** $0.00 (free)
|
|
107
|
+
|
|
108
|
+
### GPU Performance (with CUDA/DirectML/Metal)
|
|
109
|
+
- **Speed:** 60-300 tokens/second
|
|
110
|
+
- **Latency:** ~0.08s for 20 tokens, ~0.42s for 100 tokens
|
|
111
|
+
- **Cost:** $0.00 (free)
|
|
112
|
+
|
|
113
|
+
### Optimized Performance (ONNX_OPTIMIZED=true)
|
|
114
|
+
- **Quality:** 6.5/10 → 8.5/10 (31% improvement)
|
|
115
|
+
- **Speed:** 2-4x faster with context pruning
|
|
116
|
+
- **CPU:** ~12 tokens/sec (2x faster than base)
|
|
117
|
+
- **GPU:** ~180 tokens/sec (30x faster than base CPU)
|
|
118
|
+
|
|
119
|
+
See GPU setup in [ONNX_INTEGRATION.md](./ONNX_INTEGRATION.md#gpu-acceleration)
|
|
120
|
+
See optimization guide in [ONNX_OPTIMIZATION_GUIDE.md](./ONNX_OPTIMIZATION_GUIDE.md)
|
|
121
|
+
|
|
122
|
+
## Use Cases
|
|
123
|
+
|
|
124
|
+
### ✅ Perfect For
|
|
125
|
+
|
|
126
|
+
1. **Offline Development**
|
|
127
|
+
```bash
|
|
128
|
+
# Work without internet (after initial download)
|
|
129
|
+
export PROVIDER=onnx
|
|
130
|
+
export ONNX_OPTIMIZED=true
|
|
131
|
+
npx agentic-flow --agent coder --task "Build feature"
|
|
132
|
+
```
|
|
133
|
+
|
|
134
|
+
2. **Privacy-Sensitive Data**
|
|
135
|
+
```bash
|
|
136
|
+
# Process PII/HIPAA data locally
|
|
137
|
+
export PROVIDER=onnx
|
|
138
|
+
export ONNX_OPTIMIZED=true
|
|
139
|
+
npx agentic-flow --agent coder --task "Process medical records"
|
|
140
|
+
```
|
|
141
|
+
|
|
142
|
+
3. **Cost Optimization**
|
|
143
|
+
```bash
|
|
144
|
+
# Free inference for simple tasks with better quality
|
|
145
|
+
export PROVIDER=onnx
|
|
146
|
+
export ONNX_OPTIMIZED=true
|
|
147
|
+
export ONNX_TEMPERATURE=0.3 # Lower for code tasks
|
|
148
|
+
|
|
149
|
+
for task in task1 task2 task3; do
|
|
150
|
+
npx agentic-flow --agent coder --task "$task"
|
|
151
|
+
done
|
|
152
|
+
```
|
|
153
|
+
|
|
154
|
+
4. **High-Volume Simple Tasks**
|
|
155
|
+
```bash
|
|
156
|
+
# Thousands of generations daily at $0 cost
|
|
157
|
+
export PROVIDER=onnx
|
|
158
|
+
export ONNX_OPTIMIZED=true
|
|
159
|
+
export ONNX_MAX_CONTEXT_TOKENS=1000 # Faster
|
|
160
|
+
|
|
161
|
+
cat tasks.txt | while read task; do
|
|
162
|
+
npx agentic-flow --agent coder --task "$task"
|
|
163
|
+
done
|
|
164
|
+
```
|
|
165
|
+
|
|
166
|
+
5. **GPU-Accelerated Development**
|
|
167
|
+
```bash
|
|
168
|
+
# 30x faster with GPU (180 tokens/sec)
|
|
169
|
+
export PROVIDER=onnx
|
|
170
|
+
export ONNX_OPTIMIZED=true
|
|
171
|
+
export ONNX_EXECUTION_PROVIDERS=cuda,cpu # or dml, coreml
|
|
172
|
+
|
|
173
|
+
npx agentic-flow --agent coder --task "Complex feature"
|
|
174
|
+
```
|
|
175
|
+
|
|
176
|
+
### ❌ Not Ideal For
|
|
177
|
+
|
|
178
|
+
- **Complex Reasoning** - Use Claude or DeepSeek via OpenRouter
|
|
179
|
+
- **Tool Calling** - ONNX doesn't support MCP tools (use Anthropic/OpenRouter)
|
|
180
|
+
- **Long Context** - Limited to 4K tokens (use cloud models for >4K)
|
|
181
|
+
- **Streaming** - Not implemented yet (use OpenRouter/Anthropic)
|
|
182
|
+
|
|
183
|
+
## Hybrid Deployments
|
|
184
|
+
|
|
185
|
+
Mix ONNX with OpenRouter/Anthropic based on task complexity:
|
|
186
|
+
|
|
187
|
+
### Scenario 1: Simple Local, Complex Cloud
|
|
188
|
+
|
|
189
|
+
```bash
|
|
190
|
+
# Simple tasks - free ONNX
|
|
191
|
+
npx agentic-flow --agent coder --task "Hello world" --provider onnx
|
|
192
|
+
|
|
193
|
+
# Complex tasks - cheap OpenRouter
|
|
194
|
+
npx agentic-flow --agent coder --task "Design distributed system" \
|
|
195
|
+
--model "deepseek/deepseek-chat-v3.1"
|
|
196
|
+
```
|
|
197
|
+
|
|
198
|
+
### Scenario 2: Privacy-First with Fallback
|
|
199
|
+
|
|
200
|
+
```bash
|
|
201
|
+
# Privacy-sensitive - ONNX
|
|
202
|
+
export USE_ONNX=true
|
|
203
|
+
npx agentic-flow --agent coder --task "Process PII"
|
|
204
|
+
|
|
205
|
+
# Non-sensitive - OpenRouter (cheaper)
|
|
206
|
+
unset USE_ONNX
|
|
207
|
+
export OPENROUTER_API_KEY=sk-or-v1-...
|
|
208
|
+
npx agentic-flow --agent coder --task "Public API"
|
|
209
|
+
```
|
|
210
|
+
|
|
211
|
+
## Troubleshooting
|
|
212
|
+
|
|
213
|
+
### Model Download Failed
|
|
214
|
+
|
|
215
|
+
```bash
|
|
216
|
+
# Check internet connection
|
|
217
|
+
curl -I https://huggingface.co
|
|
218
|
+
|
|
219
|
+
# Retry download
|
|
220
|
+
rm -rf ./models/phi-4-mini
|
|
221
|
+
npx agentic-flow --agent coder --task "test" --provider onnx
|
|
222
|
+
```
|
|
223
|
+
|
|
224
|
+
### Slow Inference (6 tokens/sec)
|
|
225
|
+
|
|
226
|
+
Enable GPU acceleration - see [GPU Setup Guide](./ONNX_INTEGRATION.md#gpu-acceleration)
|
|
227
|
+
|
|
228
|
+
### Out of Memory
|
|
229
|
+
|
|
230
|
+
```bash
|
|
231
|
+
# Reduce max tokens
|
|
232
|
+
export ONNX_MAX_TOKENS=50
|
|
233
|
+
npx agentic-flow --agent coder --task "small task" --provider onnx
|
|
234
|
+
```
|
|
235
|
+
|
|
236
|
+
### Model Not Found Error
|
|
237
|
+
|
|
238
|
+
```bash
|
|
239
|
+
# Ensure model downloaded completely
|
|
240
|
+
ls -lh ./models/phi-4-mini/cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4/
|
|
241
|
+
# Should show:
|
|
242
|
+
# model.onnx (~52MB)
|
|
243
|
+
# model.onnx.data (~4.86GB)
|
|
244
|
+
```
|
|
245
|
+
|
|
246
|
+
## Cost Comparison
|
|
247
|
+
|
|
248
|
+
### 1,000 Code Generation Tasks
|
|
249
|
+
|
|
250
|
+
| Provider | Model | Cost |
|
|
251
|
+
|----------|-------|------|
|
|
252
|
+
| **ONNX Local** | Phi-4-mini | **$0.00** |
|
|
253
|
+
| OpenRouter | Llama 3.1 8B | $0.30 |
|
|
254
|
+
| OpenRouter | DeepSeek V3.1 | $1.40 |
|
|
255
|
+
| Anthropic | Claude 3.5 Sonnet | $81.00 |
|
|
256
|
+
|
|
257
|
+
**Monthly Savings (at 1,000 tasks/month):** $81/month vs Claude, $1.40/month vs DeepSeek
|
|
258
|
+
|
|
259
|
+
### Electricity Cost
|
|
260
|
+
|
|
261
|
+
Assuming 100W CPU, 1hr/day, $0.12/kWh:
|
|
262
|
+
- Daily: $0.012
|
|
263
|
+
- Monthly: $0.36
|
|
264
|
+
- Annual: $4.32
|
|
265
|
+
|
|
266
|
+
**A full day of local inference still costs less in electricity (~$0.012) than a single Claude 3.5 Sonnet request (~$0.08)!**
|
|
267
|
+
|
|
268
|
+
## Model Details
|
|
269
|
+
|
|
270
|
+
### Phi-4-mini-instruct-onnx
|
|
271
|
+
- **Source:** microsoft/Phi-4-mini-instruct-onnx (HuggingFace)
|
|
272
|
+
- **Architecture:** Phi-4-mini (3.8B parameters)
|
|
273
|
+
- **Quantization:** INT4 (4-bit integers)
|
|
274
|
+
- **Size:** 4.9GB (52MB model + 4.86GB weights)
|
|
275
|
+
- **Optimization:** CPU and mobile optimized
|
|
276
|
+
- **Context:** 4K tokens
|
|
277
|
+
- **License:** MIT License (see the model card on HuggingFace for the authoritative terms)
|
|
278
|
+
|
|
279
|
+
## Advanced Configuration
|
|
280
|
+
|
|
281
|
+
### Custom Model Path
|
|
282
|
+
|
|
283
|
+
```bash
|
|
284
|
+
export ONNX_MODEL_PATH=/custom/path/to/model.onnx
|
|
285
|
+
npx agentic-flow --agent coder --task "test" --provider onnx
|
|
286
|
+
```
|
|
287
|
+
|
|
288
|
+
### Execution Providers
|
|
289
|
+
|
|
290
|
+
```bash
|
|
291
|
+
# CPU only (default)
|
|
292
|
+
export ONNX_EXECUTION_PROVIDERS=cpu
|
|
293
|
+
|
|
294
|
+
# GPU acceleration (NVIDIA)
|
|
295
|
+
export ONNX_EXECUTION_PROVIDERS=cuda,cpu
|
|
296
|
+
|
|
297
|
+
# GPU acceleration (Windows DirectML)
|
|
298
|
+
export ONNX_EXECUTION_PROVIDERS=dml,cpu
|
|
299
|
+
|
|
300
|
+
# GPU acceleration (macOS Metal)
|
|
301
|
+
export ONNX_EXECUTION_PROVIDERS=coreml,cpu
|
|
302
|
+
```
|
|
303
|
+
|
|
304
|
+
### Generation Parameters
|
|
305
|
+
|
|
306
|
+
```bash
|
|
307
|
+
# Max output tokens
|
|
308
|
+
export ONNX_MAX_TOKENS=100
|
|
309
|
+
|
|
310
|
+
# Temperature (0.0 = deterministic, 1.0 = creative)
|
|
311
|
+
export ONNX_TEMPERATURE=0.7
|
|
312
|
+
```
|
|
313
|
+
|
|
314
|
+
## Security & Privacy
|
|
315
|
+
|
|
316
|
+
### Data Privacy
|
|
317
|
+
- ✅ **100% Local Processing** - No data leaves your machine
|
|
318
|
+
- ✅ **No API Calls** - Zero external requests during inference (only the one-time model download contacts HuggingFace)
|
|
319
|
+
- ✅ **No Telemetry** - No usage tracking
|
|
320
|
+
- ✅ **GDPR Compliant** - No data transmission
|
|
321
|
+
- ✅ **HIPAA Suitable** - Process sensitive health data locally
|
|
322
|
+
|
|
323
|
+
### Model Security
|
|
324
|
+
- ✅ **Official Source** - Downloaded from Microsoft HuggingFace
|
|
325
|
+
- ✅ **SHA256 Verification** - Optional integrity checks
|
|
326
|
+
- ✅ **Read-Only** - Model not modified after download
|
|
327
|
+
|
|
328
|
+
## Next Steps
|
|
329
|
+
|
|
330
|
+
1. **Enable GPU Acceleration:** [GPU Setup Guide](./ONNX_INTEGRATION.md#gpu-acceleration)
|
|
331
|
+
2. **Explore All Agents:** `npx agentic-flow --list`
|
|
332
|
+
3. **Hybrid Deployments:** [Router Configuration](./ONNX_INTEGRATION.md#integration-with-proxy-system)
|
|
333
|
+
4. **Advanced Features:** [Full ONNX Guide](./ONNX_INTEGRATION.md)
|
|
334
|
+
|
|
335
|
+
## Support
|
|
336
|
+
|
|
337
|
+
- **Documentation:** [ONNX_INTEGRATION.md](./ONNX_INTEGRATION.md)
|
|
338
|
+
- **Issues:** https://github.com/ruvnet/agentic-flow/issues
|
|
339
|
+
- **Model:** https://huggingface.co/microsoft/Phi-4-mini-instruct-onnx
|
|
340
|
+
- **ONNX Runtime:** https://onnxruntime.ai
|
|
341
|
+
|
|
342
|
+
---
|
|
343
|
+
|
|
344
|
+
**Run AI agents for free. Zero API costs. Complete privacy. Works offline.**
|