autoforgeai 2.7.11__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- autoforgeai-2.7.11/LICENSE +21 -0
- autoforgeai-2.7.11/PKG-INFO +420 -0
- autoforgeai-2.7.11/README.md +369 -0
- autoforgeai-2.7.11/autoforge/__init__.py +8 -0
- autoforgeai-2.7.11/autoforge/cli/__init__.py +84 -0
- autoforgeai-2.7.11/autoforge/cli/app.py +1309 -0
- autoforgeai-2.7.11/autoforge/cli/display.py +125 -0
- autoforgeai-2.7.11/autoforge/cli/interactive.py +199 -0
- autoforgeai-2.7.11/autoforge/cli/setup_wizard.py +894 -0
- autoforgeai-2.7.11/autoforge/contracts/__init__.py +2 -0
- autoforgeai-2.7.11/autoforge/contracts/paper_repro_contract.schema.json +128 -0
- autoforgeai-2.7.11/autoforge/data/constitution/CONSTITUTION.md +61 -0
- autoforgeai-2.7.11/autoforge/data/constitution/agents/architect.md +92 -0
- autoforgeai-2.7.11/autoforge/data/constitution/agents/builder.md +58 -0
- autoforgeai-2.7.11/autoforge/data/constitution/agents/director.md +134 -0
- autoforgeai-2.7.11/autoforge/data/constitution/agents/gardener.md +57 -0
- autoforgeai-2.7.11/autoforge/data/constitution/agents/reviewer.md +69 -0
- autoforgeai-2.7.11/autoforge/data/constitution/agents/scanner.md +79 -0
- autoforgeai-2.7.11/autoforge/data/constitution/agents/tester.md +68 -0
- autoforgeai-2.7.11/autoforge/data/constitution/quality_gates.md +80 -0
- autoforgeai-2.7.11/autoforge/data/constitution/workflows/build.md +29 -0
- autoforgeai-2.7.11/autoforge/data/constitution/workflows/deliver.md +40 -0
- autoforgeai-2.7.11/autoforge/data/constitution/workflows/import.md +51 -0
- autoforgeai-2.7.11/autoforge/data/constitution/workflows/refactor.md +20 -0
- autoforgeai-2.7.11/autoforge/data/constitution/workflows/review.md +42 -0
- autoforgeai-2.7.11/autoforge/data/constitution/workflows/spec.md +25 -0
- autoforgeai-2.7.11/autoforge/data/constitution/workflows/verify.md +21 -0
- autoforgeai-2.7.11/autoforge/engine/__init__.py +1 -0
- autoforgeai-2.7.11/autoforge/engine/adaptive_compute.py +723 -0
- autoforgeai-2.7.11/autoforge/engine/agent_base.py +463 -0
- autoforgeai-2.7.11/autoforge/engine/agent_debate.py +549 -0
- autoforgeai-2.7.11/autoforge/engine/agents/__init__.py +32 -0
- autoforgeai-2.7.11/autoforge/engine/agents/architect.py +238 -0
- autoforgeai-2.7.11/autoforge/engine/agents/builder.py +210 -0
- autoforgeai-2.7.11/autoforge/engine/agents/director.py +178 -0
- autoforgeai-2.7.11/autoforge/engine/agents/gardener.py +156 -0
- autoforgeai-2.7.11/autoforge/engine/agents/reviewer.py +139 -0
- autoforgeai-2.7.11/autoforge/engine/agents/scanner.py +257 -0
- autoforgeai-2.7.11/autoforge/engine/agents/tester.py +154 -0
- autoforgeai-2.7.11/autoforge/engine/article_reasoning.py +989 -0
- autoforgeai-2.7.11/autoforge/engine/article_verifier.py +1135 -0
- autoforgeai-2.7.11/autoforge/engine/auth.py +774 -0
- autoforgeai-2.7.11/autoforge/engine/autonomous_discovery.py +1618 -0
- autoforgeai-2.7.11/autoforge/engine/benchmark_eval.py +1027 -0
- autoforgeai-2.7.11/autoforge/engine/capability_dag.py +1431 -0
- autoforgeai-2.7.11/autoforge/engine/channels/__init__.py +1 -0
- autoforgeai-2.7.11/autoforge/engine/channels/telegram_bot.py +339 -0
- autoforgeai-2.7.11/autoforge/engine/channels/webhook.py +221 -0
- autoforgeai-2.7.11/autoforge/engine/checkpoints.py +277 -0
- autoforgeai-2.7.11/autoforge/engine/cloud_prover.py +625 -0
- autoforgeai-2.7.11/autoforge/engine/config.py +683 -0
- autoforgeai-2.7.11/autoforge/engine/curriculum_learning.py +851 -0
- autoforgeai-2.7.11/autoforge/engine/daemon.py +259 -0
- autoforgeai-2.7.11/autoforge/engine/dense_retrieval.py +888 -0
- autoforgeai-2.7.11/autoforge/engine/deploy_guide.py +242 -0
- autoforgeai-2.7.11/autoforge/engine/dynamic_constitution.py +344 -0
- autoforgeai-2.7.11/autoforge/engine/evolution.py +915 -0
- autoforgeai-2.7.11/autoforge/engine/evomac.py +541 -0
- autoforgeai-2.7.11/autoforge/engine/experiment_loop.py +1102 -0
- autoforgeai-2.7.11/autoforge/engine/formal_verify.py +550 -0
- autoforgeai-2.7.11/autoforge/engine/git_manager.py +181 -0
- autoforgeai-2.7.11/autoforge/engine/hierarchical_decomp.py +451 -0
- autoforgeai-2.7.11/autoforge/engine/ldb_debugger.py +713 -0
- autoforgeai-2.7.11/autoforge/engine/lean_prover.py +13 -0
- autoforgeai-2.7.11/autoforge/engine/literature_search.py +1680 -0
- autoforgeai-2.7.11/autoforge/engine/llm_router.py +821 -0
- autoforgeai-2.7.11/autoforge/engine/lock_manager.py +240 -0
- autoforgeai-2.7.11/autoforge/engine/multi_prover.py +6 -0
- autoforgeai-2.7.11/autoforge/engine/orchestrator.py +3084 -0
- autoforgeai-2.7.11/autoforge/engine/paper_formalizer.py +872 -0
- autoforgeai-2.7.11/autoforge/engine/paper_repro.py +1570 -0
- autoforgeai-2.7.11/autoforge/engine/paper_writer.py +1327 -0
- autoforgeai-2.7.11/autoforge/engine/peer_review.py +1047 -0
- autoforgeai-2.7.11/autoforge/engine/process_reward.py +582 -0
- autoforgeai-2.7.11/autoforge/engine/project_registry.py +431 -0
- autoforgeai-2.7.11/autoforge/engine/prompt_optimizer.py +649 -0
- autoforgeai-2.7.11/autoforge/engine/proof_embedding.py +1371 -0
- autoforgeai-2.7.11/autoforge/engine/provers/__init__.py +13 -0
- autoforgeai-2.7.11/autoforge/engine/provers/lean_core.py +702 -0
- autoforgeai-2.7.11/autoforge/engine/provers/lean_lake.py +859 -0
- autoforgeai-2.7.11/autoforge/engine/provers/multi_prover.py +1233 -0
- autoforgeai-2.7.11/autoforge/engine/provers/pantograph_repl.py +879 -0
- autoforgeai-2.7.11/autoforge/engine/provers/proof_library.py +1189 -0
- autoforgeai-2.7.11/autoforge/engine/provers/proof_search.py +1147 -0
- autoforgeai-2.7.11/autoforge/engine/rag_retrieval.py +656 -0
- autoforgeai-2.7.11/autoforge/engine/reasoning_extension.py +1344 -0
- autoforgeai-2.7.11/autoforge/engine/recursive_decomp_prover.py +1019 -0
- autoforgeai-2.7.11/autoforge/engine/reflexion.py +374 -0
- autoforgeai-2.7.11/autoforge/engine/repro_contract.py +419 -0
- autoforgeai-2.7.11/autoforge/engine/request_intake.py +171 -0
- autoforgeai-2.7.11/autoforge/engine/rl_proof_search.py +1974 -0
- autoforgeai-2.7.11/autoforge/engine/sandbox.py +374 -0
- autoforgeai-2.7.11/autoforge/engine/search_tree.py +1073 -0
- autoforgeai-2.7.11/autoforge/engine/security_scan.py +588 -0
- autoforgeai-2.7.11/autoforge/engine/self_play_conjecture.py +681 -0
- autoforgeai-2.7.11/autoforge/engine/sica.py +1368 -0
- autoforgeai-2.7.11/autoforge/engine/speculative_pipeline.py +527 -0
- autoforgeai-2.7.11/autoforge/engine/symbolic_compute.py +1010 -0
- autoforgeai-2.7.11/autoforge/engine/task_dag.py +291 -0
- autoforgeai-2.7.11/autoforge/engine/theoretical_reasoning.py +2480 -0
- autoforgeai-2.7.11/autoforge/engine/tools/__init__.py +182 -0
- autoforgeai-2.7.11/autoforge/engine/tools/github_search.py +392 -0
- autoforgeai-2.7.11/autoforge/engine/tools/search.py +265 -0
- autoforgeai-2.7.11/autoforge/engine/tools/web.py +255 -0
- autoforgeai-2.7.11/autoforge/engine/utils.py +124 -0
- autoforgeai-2.7.11/autoforge/engine/vlm_figure.py +1101 -0
- autoforgeai-2.7.11/autoforge/engine/world_model.py +390 -0
- autoforgeai-2.7.11/autoforgeai.egg-info/PKG-INFO +420 -0
- autoforgeai-2.7.11/autoforgeai.egg-info/SOURCES.txt +118 -0
- autoforgeai-2.7.11/autoforgeai.egg-info/dependency_links.txt +1 -0
- autoforgeai-2.7.11/autoforgeai.egg-info/entry_points.txt +2 -0
- autoforgeai-2.7.11/autoforgeai.egg-info/requires.txt +34 -0
- autoforgeai-2.7.11/autoforgeai.egg-info/top_level.txt +1 -0
- autoforgeai-2.7.11/pyproject.toml +126 -0
- autoforgeai-2.7.11/setup.cfg +4 -0
- autoforgeai-2.7.11/tests/test_academic.py +566 -0
- autoforgeai-2.7.11/tests/test_academic_hardening.py +176 -0
- autoforgeai-2.7.11/tests/test_academic_p0_p2_fixes.py +185 -0
- autoforgeai-2.7.11/tests/test_engines.py +1246 -0
- autoforgeai-2.7.11/tests/test_repro_contract.py +332 -0
|
@@ -0,0 +1,21 @@
|
|
|
1
|
+
MIT License
|
|
2
|
+
|
|
3
|
+
Copyright (c) 2026
|
|
4
|
+
|
|
5
|
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
6
|
+
of this software and associated documentation files (the "Software"), to deal
|
|
7
|
+
in the Software without restriction, including without limitation the rights
|
|
8
|
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
9
|
+
copies of the Software, and to permit persons to whom the Software is
|
|
10
|
+
furnished to do so, subject to the following conditions:
|
|
11
|
+
|
|
12
|
+
The above copyright notice and this permission notice shall be included in all
|
|
13
|
+
copies or substantial portions of the Software.
|
|
14
|
+
|
|
15
|
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
16
|
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
17
|
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
18
|
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
19
|
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
20
|
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
21
|
+
SOFTWARE.
|
|
@@ -0,0 +1,420 @@
|
|
|
1
|
+
Metadata-Version: 2.4
|
|
2
|
+
Name: autoforgeai
|
|
3
|
+
Version: 2.7.11
|
|
4
|
+
Summary: AutoForge AI-powered multi-agent development platform
|
|
5
|
+
Author: AlyciaBHZ
|
|
6
|
+
License-Expression: MIT
|
|
7
|
+
Project-URL: Homepage, https://github.com/AlyciaBHZ/autoforge
|
|
8
|
+
Project-URL: Repository, https://github.com/AlyciaBHZ/autoforge
|
|
9
|
+
Project-URL: Issues, https://github.com/AlyciaBHZ/autoforge/issues
|
|
10
|
+
Keywords: ai,agents,code-generation,multi-agent,llm,automation
|
|
11
|
+
Classifier: Development Status :: 4 - Beta
|
|
12
|
+
Classifier: Intended Audience :: Developers
|
|
13
|
+
Classifier: Programming Language :: Python :: 3
|
|
14
|
+
Classifier: Programming Language :: Python :: 3.11
|
|
15
|
+
Classifier: Programming Language :: Python :: 3.12
|
|
16
|
+
Classifier: Programming Language :: Python :: 3.13
|
|
17
|
+
Classifier: Topic :: Software Development :: Code Generators
|
|
18
|
+
Requires-Python: >=3.11
|
|
19
|
+
Description-Content-Type: text/markdown
|
|
20
|
+
License-File: LICENSE
|
|
21
|
+
Requires-Dist: anthropic>=0.84.0
|
|
22
|
+
Requires-Dist: python-dotenv>=1.0.0
|
|
23
|
+
Requires-Dist: rich>=13.0
|
|
24
|
+
Requires-Dist: pyyaml>=6.0
|
|
25
|
+
Requires-Dist: InquirerPy>=0.3.4
|
|
26
|
+
Requires-Dist: tomli-w>=1.0
|
|
27
|
+
Requires-Dist: aiosqlite>=0.20.0
|
|
28
|
+
Requires-Dist: httpx>=0.27
|
|
29
|
+
Provides-Extra: openai
|
|
30
|
+
Requires-Dist: openai>=1.0; extra == "openai"
|
|
31
|
+
Provides-Extra: google
|
|
32
|
+
Requires-Dist: google-genai>=1.0; extra == "google"
|
|
33
|
+
Requires-Dist: google-auth>=2.0; extra == "google"
|
|
34
|
+
Provides-Extra: search
|
|
35
|
+
Requires-Dist: duckduckgo-search<9.0,>=7.0; extra == "search"
|
|
36
|
+
Requires-Dist: html2text>=2024.2; extra == "search"
|
|
37
|
+
Provides-Extra: channels
|
|
38
|
+
Requires-Dist: fastapi>=0.115.0; extra == "channels"
|
|
39
|
+
Requires-Dist: uvicorn>=0.32.0; extra == "channels"
|
|
40
|
+
Requires-Dist: python-telegram-bot>=21.0; extra == "channels"
|
|
41
|
+
Provides-Extra: all
|
|
42
|
+
Requires-Dist: openai>=1.0; extra == "all"
|
|
43
|
+
Requires-Dist: google-genai>=1.0; extra == "all"
|
|
44
|
+
Requires-Dist: google-auth>=2.0; extra == "all"
|
|
45
|
+
Requires-Dist: duckduckgo-search<9.0,>=7.0; extra == "all"
|
|
46
|
+
Requires-Dist: html2text>=2024.2; extra == "all"
|
|
47
|
+
Requires-Dist: fastapi>=0.115.0; extra == "all"
|
|
48
|
+
Requires-Dist: uvicorn>=0.32.0; extra == "all"
|
|
49
|
+
Requires-Dist: python-telegram-bot>=21.0; extra == "all"
|
|
50
|
+
Dynamic: license-file
|
|
51
|
+
|
|
52
|
+
```
|
|
53
|
+
_ _ _____
|
|
54
|
+
/ \ _ _| |_ ___ | ___|__ _ __ __ _ ___
|
|
55
|
+
/ _ \| | | | __/ _ \| |_ / _ \| '__/ _` |/ _ \
|
|
56
|
+
/ ___ \ |_| | || (_) | _| (_) | | | (_| | __/
|
|
57
|
+
/_/ \_\__,_|\__\___/|_| \___/|_| \__, |\___|
|
|
58
|
+
|___/
|
|
59
|
+
```
|
|
60
|
+
|
|
61
|
+
**AI 多智能体框架 — 自主科研推理 · 形式化证明 · 全栈项目生成**
|
|
62
|
+
|
|
63
|
+
[Python 3.11+](https://python.org)
|
|
64
|
+
[MIT License](LICENSE)
|
|
65
|
+
[Tests](tests/)
|
|
66
|
+
[Engines](autoforge/engine/)
|
|
67
|
+
|
|
68
|
+
[English](docs/README_EN.md) | [开发者文档](CLAUDE.md)
|
|
69
|
+
|
|
70
|
+
---
|
|
71
|
+
|
|
72
|
+
## 目录
|
|
73
|
+
|
|
74
|
+
- [安装与配置](#安装与配置)
|
|
75
|
+
- [安装](#安装)
|
|
76
|
+
- [首次运行引导](#首次运行引导)
|
|
77
|
+
- [支持的 LLM 提供商](#支持的-llm-提供商)
|
|
78
|
+
- [系统要求](#系统要求)
|
|
79
|
+
- [三种工作模式](#三种工作模式)
|
|
80
|
+
- [学术与科研能力](#学术与科研能力)
|
|
81
|
+
- [端到端文章推理](#端到端文章推理)
|
|
82
|
+
- [形式化验证与定理证明](#形式化验证与定理证明)
|
|
83
|
+
- [自主科研发现](#自主科研发现)
|
|
84
|
+
- [论文全流程](#论文全流程)
|
|
85
|
+
- [论文复现管线](#论文复现管线)
|
|
86
|
+
- [核心技术来源](#核心技术来源)
|
|
87
|
+
- [工程能力](#工程能力)
|
|
88
|
+
- [5 阶段流水线](#5-阶段流水线)
|
|
89
|
+
- [6 智能体协作](#6-智能体协作)
|
|
90
|
+
- [智能引擎](#智能引擎)
|
|
91
|
+
- [CLI 命令参考](#cli-命令参考)
|
|
92
|
+
- [守护进程模式](#守护进程模式)
|
|
93
|
+
|
|
94
|
+
---
|
|
95
|
+
|
|
96
|
+
## 安装与配置
|
|
97
|
+
|
|
98
|
+
### 安装
|
|
99
|
+
|
|
100
|
+
```bash
|
|
101
|
+
pip install autoforgeai # 从 PyPI 安装
|
|
102
|
+
forgeai # 启动(首次运行自动进入配置引导)
|
|
103
|
+
```
|
|
104
|
+
|
|
105
|
+
<details>
|
|
106
|
+
<summary>可选依赖</summary>
|
|
107
|
+
|
|
108
|
+
```bash
|
|
109
|
+
pip install "autoforgeai[openai]" # OpenAI 支持
|
|
110
|
+
pip install "autoforgeai[google]" # Google Gemini 支持
|
|
111
|
+
pip install "autoforgeai[search]" # Web 搜索能力
|
|
112
|
+
pip install "autoforgeai[channels]" # Telegram / Webhook 频道
|
|
113
|
+
pip install "autoforgeai[all]" # 全部安装
|
|
114
|
+
```
|
|
115
|
+
|
|
116
|
+
</details>
|
|
117
|
+
|
|
118
|
+
<details>
|
|
119
|
+
<summary>从源码安装</summary>
|
|
120
|
+
|
|
121
|
+
```bash
|
|
122
|
+
git clone https://github.com/AlyciaBHZ/autoforge.git
|
|
123
|
+
cd autoforge
|
|
124
|
+
pip install -e ".[all]"
|
|
125
|
+
```
|
|
126
|
+
|
|
127
|
+
</details>
|
|
128
|
+
|
|
129
|
+
### 首次运行引导
|
|
130
|
+
|
|
131
|
+
首次运行 `forgeai` 会自动进入交互式配置向导,全部步骤均可跳过(Ctrl+C),之后随时用 `forgeai setup` 重新配置:
|
|
132
|
+
|
|
133
|
+
```
|
|
134
|
+
步骤 1 │ 配置 LLM 提供商(可选)
|
|
135
|
+
│ 选择 Anthropic / OpenAI / Google(可多选)
|
|
136
|
+
│ 每个提供商支持多种认证方式(API Key、OAuth、Bedrock、Vertex AI 等)
|
|
137
|
+
│ 选择强模型(Director/Architect 使用)和快模型(Builder/Tester 使用)
|
|
138
|
+
│
|
|
139
|
+
步骤 2 │ 预算上限(默认 $10)
|
|
140
|
+
│
|
|
141
|
+
步骤 3 │ 并行 Builder 数量(默认 3,最多 8)
|
|
142
|
+
│
|
|
143
|
+
步骤 4 │ Docker 沙盒(可选,用于隔离构建环境)
|
|
144
|
+
│
|
|
145
|
+
步骤 5 │ GitHub 环境
|
|
146
|
+
│ 自动检测 git 和 gh CLI
|
|
147
|
+
│ 可选配置自动推送到 GitHub
|
|
148
|
+
```
|
|
149
|
+
|
|
150
|
+
配置保存在 `~/.autoforge/config.toml`,也可以通过环境变量覆盖。
|
|
151
|
+
|
|
152
|
+
### 支持的 LLM 提供商
|
|
153
|
+
|
|
154
|
+
| 提供商 | 环境变量 | 强模型 | 快模型 |
|
|
155
|
+
|--------|----------|--------|--------|
|
|
156
|
+
| **Anthropic** | `ANTHROPIC_API_KEY` | Claude Opus 4.6 | Claude Sonnet 4.5 |
|
|
157
|
+
| **OpenAI** | `OPENAI_API_KEY` | Codex 5.3、o3、GPT-4o | o4-mini、GPT-4o-mini |
|
|
158
|
+
| **Google** | `GOOGLE_API_KEY` | Gemini 2.5 Pro | Gemini 2.5 Flash、Gemini 2.0 Flash |
|
|
159
|
+
|
|
160
|
+
**支持的认证方式:**
|
|
161
|
+
|
|
162
|
+
| 认证方式 | 适用提供商 | 说明 |
|
|
163
|
+
|----------|-----------|------|
|
|
164
|
+
| API Key | 全部 | 最简单,推荐入门使用 |
|
|
165
|
+
| Codex OAuth | OpenAI | 浏览器登录,使用 ChatGPT 订阅额度 |
|
|
166
|
+
| Device Code | OpenAI | 无头/SSH 环境 |
|
|
167
|
+
| OAuth2 Client Credentials | Anthropic、OpenAI | 企业级 |
|
|
168
|
+
| Bearer Token + Custom URL | Anthropic、OpenAI | Azure、LiteLLM 等代理 |
|
|
169
|
+
| Amazon Bedrock | Anthropic | AWS Profile / Access Key / Instance Role |
|
|
170
|
+
| Google Vertex AI | Anthropic | GCP Project + ADC |
|
|
171
|
+
| ADC / Service Account | Google | Google Cloud 原生认证 |
|
|
172
|
+
|
|
173
|
+
支持跨厂商混搭模型:
|
|
174
|
+
|
|
175
|
+
```bash
|
|
176
|
+
export FORGE_MODEL_STRONG=o3 # 强模型用 OpenAI
|
|
177
|
+
export FORGE_MODEL_FAST=gemini-2.5-flash # 快模型用 Google
|
|
178
|
+
```
|
|
179
|
+
|
|
180
|
+
### 系统要求
|
|
181
|
+
|
|
182
|
+
- **Python 3.11+** — [python.org](https://python.org)
|
|
183
|
+
- **至少一个 LLM API Key** — [Anthropic](https://console.anthropic.com/) / [OpenAI](https://platform.openai.com/api-keys) / [Google](https://aistudio.google.com/apikey)
|
|
184
|
+
- **Git**(推荐)— 用于 Worktree 隔离并行构建
|
|
185
|
+
- **Docker**(可选)— 用于沙盒执行
|
|
186
|
+
- **Lean 4**(可选)— 用于形式化定理证明
|
|
187
|
+
|
|
188
|
+
---
|
|
189
|
+
|
|
190
|
+
## 三种工作模式
|
|
191
|
+
|
|
192
|
+
配置完成后,`forgeai` 进入交互式会话,第一步选择工作模式:
|
|
193
|
+
|
|
194
|
+
```
|
|
195
|
+
? Select mode:
|
|
196
|
+
❯ Development — generate complete runnable projects
|
|
197
|
+
Academic — scientific reasoning, theorem proving, theory evolution
|
|
198
|
+
Verification — review & verify existing codebases
|
|
199
|
+
```
|
|
200
|
+
|
|
201
|
+
| 模式 | 用途 | 支持的操作 |
|
|
202
|
+
|------|------|-----------|
|
|
203
|
+
| **Development** | 全栈项目生成 | 生成新项目、导入并增强已有项目 |
|
|
204
|
+
| **Academic** | 科研推理与定理证明 | 生成研究项目、分析已有代码库 |
|
|
205
|
+
| **Verification** | 代码审查与验证 | 审查项目质量、安全性、架构 |
|
|
206
|
+
|
|
207
|
+
每种模式下可进一步设置预算和并行度,然后用自然语言描述任务即开始。
|
|
208
|
+
|
|
209
|
+
---
|
|
210
|
+
|
|
211
|
+
## 学术与科研能力
|
|
212
|
+
|
|
213
|
+
AutoForge 内置完整的学术科研流水线,可作为 AI 驱动的自主科研助手使用——从输入一篇论文到输出一篇新论文,全部自动化。
|
|
214
|
+
|
|
215
|
+
### 端到端文章推理
|
|
216
|
+
|
|
217
|
+
> 输入任意一篇论文,自动完成:**解析 → 理论图谱构建 → 声明验证 → 形式-非形式交错推理 → Lean 4 形式化 → 自主发现 → Elo 假说排序 → 推理扩展 → 同行评审 → 输出新论文**
|
|
218
|
+
|
|
219
|
+
核心编排模块:[`article_reasoning.py`](autoforge/engine/article_reasoning.py) — 统一 8 阶段管线
|
|
220
|
+
|
|
221
|
+
### 形式化验证与定理证明
|
|
222
|
+
|
|
223
|
+
| 模块 | 功能 | 技术方法 |
|
|
224
|
+
|------|------|----------|
|
|
225
|
+
| [Lean 4 MCTS 证明搜索](autoforge/engine/provers/proof_search.py) | 策略空间蒙特卡洛树搜索 | HILBERT 递归分解 + COPRA + STP |
|
|
226
|
+
| [Lean Lake 集成](autoforge/engine/provers/lean_lake.py) | 真实 Lean 4 编译与 Mathlib 项目管理 | Lake 构建系统,32 组概念→import 映射 |
|
|
227
|
+
| [Pantograph REPL](autoforge/engine/provers/pantograph_repl.py) | 增量策略应用,无需全量编译 | TACAS 2025,机器-机器 Lean 4 交互,BFS/DFS 搜索 |
|
|
228
|
+
| [GRPO 可验证奖励训练](autoforge/engine/rl_proof_search.py) | 组相对策略优化 + 脚手架渐进 RL | DeepSeek-Prover-V2 (88.9% miniF2F) + Scaf-GRPO |
|
|
229
|
+
| [Kimina 交错推理](autoforge/engine/recursive_decomp_prover.py) | 非形式-形式交错单次生成证明 | Kimina-Prover (80.7% miniF2F) |
|
|
230
|
+
| [DPO 策略优化](autoforge/engine/proof_embedding.py) | 直接偏好优化,免奖励模型 | BFS-Prover-V2 state-tactic DPO |
|
|
231
|
+
| [多证明器交叉验证](autoforge/engine/provers/multi_prover.py) | Coq、Isabelle、TLA+、Z3/SMT、Dafny | 6 后端并行验证 |
|
|
232
|
+
| [密集嵌入检索](autoforge/engine/dense_retrieval.py) | 前提选择替代 Jaccard | ReProver/LeanDojo 风格 + FAISS |
|
|
233
|
+
| [证明嵌入迁移](autoforge/engine/proof_embedding.py) | 跨领域策略迁移学习 | 向量记忆库 + FAISS + 经验追踪 |
|
|
234
|
+
| [标准基准评测](autoforge/engine/benchmark_eval.py) | miniF2F / PutnamBench / LeanWorkbook / ProofNet | Pass@k 无偏估计 |
|
|
235
|
+
|
|
236
|
+
### 自主科研发现
|
|
237
|
+
|
|
238
|
+
| 模块 | 功能 | 技术方法 |
|
|
239
|
+
|------|------|----------|
|
|
240
|
+
| [自主定理发现](autoforge/engine/autonomous_discovery.py) | 从论文提取核心 → 生成猜想 → 过滤新颖性 → 评估深度 | DomainContext 模板 + Thompson 采样策略选择 |
|
|
241
|
+
| [Elo 假说锦标赛](autoforge/engine/autonomous_discovery.py) | 假说两两对决 → Elo 排序 → 筛选最优 | Google AI Co-Scientist (2025) 风格 |
|
|
242
|
+
| [自对弈猜想生成](autoforge/engine/self_play_conjecture.py) | 双智能体 Conjecturer/Prover 对弈 | STP (ICML 2025) + 贝叶斯难度校准 |
|
|
243
|
+
| [推理核心自增长](autoforge/engine/reasoning_extension.py) | 从最小公理核心出发,迭代生成深层结论 | Thompson 采样 + 出版级质量门控 |
|
|
244
|
+
| [跨领域科学推理](autoforge/engine/theoretical_reasoning.py) | TheoryGraph + 超图 n 元关系 + 12 种推理策略 | SciAgents HyperEdge + 10 种验证模式融合 |
|
|
245
|
+
| [结构化世界模型](autoforge/engine/world_model.py) | TheoryGraph 时序查询层 + 跨会话持久化 | Kosmos (2025) |
|
|
246
|
+
| [课程学习](autoforge/engine/curriculum_learning.py) | 复杂度排序 + 正迁移追踪 | LeanAgent (ICLR 2025) |
|
|
247
|
+
|
|
248
|
+
### 论文全流程
|
|
249
|
+
|
|
250
|
+
| 模块 | 功能 | 技术方法 |
|
|
251
|
+
|------|------|----------|
|
|
252
|
+
| [闭环实验管线](autoforge/engine/experiment_loop.py) | 假设 → 代码 → 运行 → 分析 → 消融实验 → 迭代 | AI Scientist v2 |
|
|
253
|
+
| [自动论文撰写](autoforge/engine/paper_writer.py) | LaTeX 生成 + BibTeX + 图表 + 模板 | NeurIPS/ICML/ICLR/ArXiv 模板 |
|
|
254
|
+
| [文献检索与分析](autoforge/engine/literature_search.py) | 引用图谱遍历 + SPECTER2 语义搜索 + 全文分析 + 研究空白检测 | Semantic Scholar API + arXiv |
|
|
255
|
+
| [VLM 图表分析](autoforge/engine/vlm_figure.py) | 图表提取 → 视觉分析 → 数据提取 → 复现 → 验证 | 视觉语言模型 |
|
|
256
|
+
| [符号计算后端](autoforge/engine/symbolic_compute.py) | SymPy/SageMath 集成,LaTeX↔SymPy 双向转换 | 代数恒等式验证 + 极限/级数检查 |
|
|
257
|
+
| [同行评审模拟](autoforge/engine/peer_review.py) | 多审稿人 + 作者反驳 + 元审稿 + 迭代修改 | 6 种审稿角色 |
|
|
258
|
+
|
|
259
|
+
### 论文复现管线
|
|
260
|
+
|
|
261
|
+
AutoForge 支持从高层研究目标出发,自动推断相关论文并构建复现方案:
|
|
262
|
+
|
|
263
|
+
```bash
|
|
264
|
+
forgeai paper infer "improve sample efficiency in offline RL" # 推断相关 ICLR 论文
|
|
265
|
+
forgeai paper benchmark # 评估推断质量
|
|
266
|
+
forgeai paper reproduce "goal" --with-pdf --run-generate # 端到端复现
|
|
267
|
+
```
|
|
268
|
+
|
|
269
|
+
管线流程:研究目标 → OpenReview 论文检索 → TF-IDF 排序匹配 → 信号提取 → 复现方案生成 → 可选自动执行
|
|
270
|
+
|
|
271
|
+
### 核心技术来源
|
|
272
|
+
|
|
273
|
+
| 技术 | 来源 | 关键创新 |
|
|
274
|
+
|------|------|----------|
|
|
275
|
+
| **GRPO 可验证奖励** | DeepSeek-Prover-V2 (2025, 88.9% miniF2F) | 组相对优势取代 PPO critic |
|
|
276
|
+
| **交错推理模式** | Kimina-Prover (2025, 80.7% miniF2F) | 非形式+形式交错单次生成 |
|
|
277
|
+
| **Pantograph REPL** | TACAS 2025 | 增量策略应用,10x+ 编译加速 |
|
|
278
|
+
| **DPO 策略偏好** | BFS-Prover-V2 (72.95% miniF2F) | 直接偏好优化免奖励模型 |
|
|
279
|
+
| **Elo 假说排序** | Google AI Co-Scientist (2025) | 两两对决动态排序 |
|
|
280
|
+
| **超图知识表示** | SciAgents + Hypergraph KG (2025) | n 元关系取代二元关系 |
|
|
281
|
+
| **达尔文自改写** | Darwin Gödel Machine (2025) | 演化自重写智能体宪法 |
|
|
282
|
+
| **脚手架渐进 RL** | Scaf-GRPO (2025, 44.3%↑ AIME) | 分层提示 + 渐进撤除 |
|
|
283
|
+
| **PUCT-MCTS** | AlphaProof (DeepMind, 2024) | AlphaZero 适配策略空间 |
|
|
284
|
+
| **递归分解** | HILBERT (NeurIPS 2025) | informal reasoner + prover + verifier + retriever |
|
|
285
|
+
| **自对弈猜想** | STP (ICML 2025, 28.5% LeanWorkbook) | 贝叶斯难度校准 50% 甜区 |
|
|
286
|
+
| **密集前提检索** | ReProver / LeanDojo (NeurIPS 2023) | FAISS 索引替代 Jaccard |
|
|
287
|
+
| **课程学习** | LeanAgent (ICLR 2025) | 复杂度排序 + 正迁移终身学习 |
|
|
288
|
+
| **闭环实验** | AI Scientist v2 (2025) | 假设→代码→执行→分析→消融→迭代 |
|
|
289
|
+
| **过程奖励模型** | CodePRM (2024) | 步级质量评估 |
|
|
290
|
+
| **语言强化学习** | Reflexion (NeurIPS 2023) | 语言化记忆 + 失败模式避免 |
|
|
291
|
+
|
|
292
|
+
---
|
|
293
|
+
|
|
294
|
+
## 工程能力
|
|
295
|
+
|
|
296
|
+
AutoForge 同时也是一个全栈代码生成引擎——6 个 AI 智能体协作,将自然语言描述转化为完整可运行的代码项目。
|
|
297
|
+
|
|
298
|
+
### 5 阶段流水线
|
|
299
|
+
|
|
300
|
+
```
|
|
301
|
+
"做一个带登录的 Todo App"
|
|
302
|
+
│
|
|
303
|
+
▼
|
|
304
|
+
┌────────────────────────────────────────────────┐
|
|
305
|
+
│ SPEC Director 分析需求、拆解模块 │
|
|
306
|
+
├────────────────────────────────────────────────┤
|
|
307
|
+
│ BUILD Architect 设计架构 │
|
|
308
|
+
│ Builder 并行写代码,Reviewer 审查 │
|
|
309
|
+
├────────────────────────────────────────────────┤
|
|
310
|
+
│ VERIFY Tester 安装依赖、构建、运行测试 │
|
|
311
|
+
│ 失败自动生成修复任务 │
|
|
312
|
+
├────────────────────────────────────────────────┤
|
|
313
|
+
│ REFACTOR Gardener 优化代码质量 │
|
|
314
|
+
├────────────────────────────────────────────────┤
|
|
315
|
+
│ DELIVER 生成 README、整理结构、成本报告 │
|
|
316
|
+
└────────────────────────────────────────────────┘
|
|
317
|
+
│
|
|
318
|
+
▼
|
|
319
|
+
workspace/my-todo-app/
|
|
320
|
+
```
|
|
321
|
+
|
|
322
|
+
另有两条专用管线:
|
|
323
|
+
- **Review 管线:** SCAN → REVIEW → REFACTOR → REPORT
|
|
324
|
+
- **Import 管线:** SCAN → REVIEW → ENHANCE → VERIFY → REFACTOR → DELIVER
|
|
325
|
+
|
|
326
|
+
### 6 智能体协作
|
|
327
|
+
|
|
328
|
+
| 智能体 | 角色 | 模型层级 |
|
|
329
|
+
|--------|------|----------|
|
|
330
|
+
| **Director** | 需求分析与范围界定 | Strong(强模型) |
|
|
331
|
+
| **Architect** | 系统设计与任务依赖图 | Strong(强模型) |
|
|
332
|
+
| **Builder** | 代码生成(可并行,最多 8 个) | Fast(快模型) |
|
|
333
|
+
| **Reviewer** | 代码审查与评分 | Fast(快模型) |
|
|
334
|
+
| **Tester** | 构建、测试、自动修复循环 | Fast(快模型) |
|
|
335
|
+
| **Gardener** | 重构与安全修复 | Fast(快模型) |
|
|
336
|
+
|
|
337
|
+
### 智能引擎
|
|
338
|
+
|
|
339
|
+
47 个内置引擎在构建全流程中自动协作:
|
|
340
|
+
|
|
341
|
+
- **MCTS 搜索树** — 架构方案探索与择优,基于执行反馈动态修正
|
|
342
|
+
- **自然语言梯度反馈 (EvoMAC)** — Agent 间通过文本反向传播互相优化
|
|
343
|
+
- **过程奖励模型 (CodePRM)** — 逐步评估代码质量,而非仅看最终结果
|
|
344
|
+
- **自适应算力分配** — 根据任务难度动态调整推理深度
|
|
345
|
+
- **语言强化学习 (Reflexion)** — 从失败中提取经验,重试时自动规避
|
|
346
|
+
- **块级故障定位 (LDB)** — 精确定位缺陷到代码块级别
|
|
347
|
+
- **函数级任务分解** — 复杂需求拆解为可独立验证的子任务
|
|
348
|
+
- **阶段预执行** — 流水线各阶段重叠并行,加速构建
|
|
349
|
+
- **达尔文自改写 (SICA)** — 演化式自重写智能体宪法与工作流
|
|
350
|
+
- **安全扫描 (RedCode)** — 模式匹配 + LLM 深度漏洞分析
|
|
351
|
+
- **跨项目 RAG** — BM25+TF-IDF 混合跨项目代码检索
|
|
352
|
+
- **知识图谱自增长 (CapabilityDAG)** — 跨项目能力积累,社区可合并
|
|
353
|
+
|
|
354
|
+
<details>
|
|
355
|
+
<summary>成本估算</summary>
|
|
356
|
+
|
|
357
|
+
| 复杂度 | 示例 | 预估成本 |
|
|
358
|
+
|--------|------|:--------:|
|
|
359
|
+
| 简单 | Todo App、落地页 | $2–3 |
|
|
360
|
+
| 中等 | 博客系统、预约平台 | $4–6 |
|
|
361
|
+
| 复杂 | 电商 MVP、多角色平台 | $7–10 |
|
|
362
|
+
|
|
363
|
+
默认预算上限 $10,可通过 `--budget` 覆盖。
|
|
364
|
+
|
|
365
|
+
</details>
|
|
366
|
+
|
|
367
|
+
---
|
|
368
|
+
|
|
369
|
+
## CLI 命令参考
|
|
370
|
+
|
|
371
|
+
```bash
|
|
372
|
+
# 交互式(推荐)
|
|
373
|
+
forgeai # 引导式会话
|
|
374
|
+
|
|
375
|
+
# 项目生成
|
|
376
|
+
forgeai generate "用 Flask + Vue 做书店管理系统"
|
|
377
|
+
forgeai generate "SaaS 落地页" --budget 3.00
|
|
378
|
+
|
|
379
|
+
# 代码审查
|
|
380
|
+
forgeai review ./my-project
|
|
381
|
+
|
|
382
|
+
# 导入增强
|
|
383
|
+
forgeai import ./my-project --enhance "加上暗色模式"
|
|
384
|
+
|
|
385
|
+
# 运行管理
|
|
386
|
+
forgeai status # 查看所有项目
|
|
387
|
+
forgeai resume # 恢复中断的任务
|
|
388
|
+
forgeai setup # 重新配置
|
|
389
|
+
|
|
390
|
+
# 论文复现
|
|
391
|
+
forgeai paper infer "research goal" # 推断相关论文
|
|
392
|
+
forgeai paper benchmark # 评估推断质量
|
|
393
|
+
forgeai paper reproduce "goal" --run-generate # 端到端复现
|
|
394
|
+
```
|
|
395
|
+
|
|
396
|
+
全局可选参数:`--budget`、`--agents`、`--model`、`--mode`、`--mobile`、`--tdd`、`--verbose`
|
|
397
|
+
|
|
398
|
+
---
|
|
399
|
+
|
|
400
|
+
## 守护进程模式
|
|
401
|
+
|
|
402
|
+
AutoForge 可作为 24/7 后台服务运行,通过 CLI、Telegram 或 Webhook 接收构建请求:
|
|
403
|
+
|
|
404
|
+
```bash
|
|
405
|
+
forgeai daemon start # 启动守护进程
|
|
406
|
+
forgeai daemon status # 查看状态
|
|
407
|
+
forgeai daemon stop # 停止
|
|
408
|
+
|
|
409
|
+
forgeai queue "支持 Markdown 的博客系统" # 排队构建
|
|
410
|
+
forgeai projects # 查看所有项目
|
|
411
|
+
forgeai deploy <project_id> # 显示部署指南
|
|
412
|
+
```
|
|
413
|
+
|
|
414
|
+
支持 systemd (Linux) 和 launchd (macOS) 系统服务安装,详见 `services/` 目录。
|
|
415
|
+
|
|
416
|
+
---
|
|
417
|
+
|
|
418
|
+
## 许可证
|
|
419
|
+
|
|
420
|
+
MIT
|