ai-atlasforge 1.2.3__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- ai_atlasforge-1.2.3/LICENSE +21 -0
- ai_atlasforge-1.2.3/PKG-INFO +324 -0
- ai_atlasforge-1.2.3/README.md +280 -0
- ai_atlasforge-1.2.3/adversarial_testing/__init__.py +243 -0
- ai_atlasforge-1.2.3/adversarial_testing/adversarial_runner.py +591 -0
- ai_atlasforge-1.2.3/adversarial_testing/blind_validator.py +494 -0
- ai_atlasforge-1.2.3/adversarial_testing/content_preservation.py +965 -0
- ai_atlasforge-1.2.3/adversarial_testing/cost_estimator.py +545 -0
- ai_atlasforge-1.2.3/adversarial_testing/enhanced_runner.py +547 -0
- ai_atlasforge-1.2.3/adversarial_testing/epistemic_metrics.py +553 -0
- ai_atlasforge-1.2.3/adversarial_testing/mission_drift_validator.py +870 -0
- ai_atlasforge-1.2.3/adversarial_testing/mutation_testing.py +584 -0
- ai_atlasforge-1.2.3/adversarial_testing/phase_aware_drift.py +1199 -0
- ai_atlasforge-1.2.3/adversarial_testing/phase_aware_validator.py +813 -0
- ai_atlasforge-1.2.3/adversarial_testing/property_testing.py +608 -0
- ai_atlasforge-1.2.3/adversarial_testing/red_team_agent.py +410 -0
- ai_atlasforge-1.2.3/adversarial_testing/resilience.py +570 -0
- ai_atlasforge-1.2.3/adversarial_testing/vulnerability_database.py +511 -0
- ai_atlasforge-1.2.3/ai_atlasforge.egg-info/PKG-INFO +324 -0
- ai_atlasforge-1.2.3/ai_atlasforge.egg-info/SOURCES.txt +46 -0
- ai_atlasforge-1.2.3/ai_atlasforge.egg-info/dependency_links.txt +1 -0
- ai_atlasforge-1.2.3/ai_atlasforge.egg-info/entry_points.txt +3 -0
- ai_atlasforge-1.2.3/ai_atlasforge.egg-info/requires.txt +21 -0
- ai_atlasforge-1.2.3/ai_atlasforge.egg-info/top_level.txt +3 -0
- ai_atlasforge-1.2.3/atlasforge_enhancements/__init__.py +146 -0
- ai_atlasforge-1.2.3/atlasforge_enhancements/atlasforge_enhancer.py +998 -0
- ai_atlasforge-1.2.3/atlasforge_enhancements/bias_detector.py +426 -0
- ai_atlasforge-1.2.3/atlasforge_enhancements/context_healing.py +461 -0
- ai_atlasforge-1.2.3/atlasforge_enhancements/exploration_graph.py +2161 -0
- ai_atlasforge-1.2.3/atlasforge_enhancements/fingerprint_extractor.py +549 -0
- ai_atlasforge-1.2.3/atlasforge_enhancements/insight_extractor.py +811 -0
- ai_atlasforge-1.2.3/atlasforge_enhancements/knowledge_transfer.py +677 -0
- ai_atlasforge-1.2.3/atlasforge_enhancements/mission_continuity_tracker.py +584 -0
- ai_atlasforge-1.2.3/atlasforge_enhancements/scaffold_calibrator.py +636 -0
- ai_atlasforge-1.2.3/atlasforge_enhancements/scaffold_library.py +448 -0
- ai_atlasforge-1.2.3/dashboard_modules/__init__.py +90 -0
- ai_atlasforge-1.2.3/dashboard_modules/analytics.py +190 -0
- ai_atlasforge-1.2.3/dashboard_modules/atlasforge.py +225 -0
- ai_atlasforge-1.2.3/dashboard_modules/cache.py +98 -0
- ai_atlasforge-1.2.3/dashboard_modules/core.py +1269 -0
- ai_atlasforge-1.2.3/dashboard_modules/investigation.py +1357 -0
- ai_atlasforge-1.2.3/dashboard_modules/knowledge_base.py +1021 -0
- ai_atlasforge-1.2.3/dashboard_modules/queue_scheduler.py +1303 -0
- ai_atlasforge-1.2.3/dashboard_modules/recovery.py +483 -0
- ai_atlasforge-1.2.3/dashboard_modules/services.py +184 -0
- ai_atlasforge-1.2.3/dashboard_modules/url_handlers.py +119 -0
- ai_atlasforge-1.2.3/pyproject.toml +99 -0
- ai_atlasforge-1.2.3/setup.cfg +4 -0
|
@@ -0,0 +1,21 @@
|
|
|
1
|
+
MIT License
|
|
2
|
+
|
|
3
|
+
Copyright (c) 2024-2026 AI-AtlasForge Contributors
|
|
4
|
+
|
|
5
|
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
6
|
+
of this software and associated documentation files (the "Software"), to deal
|
|
7
|
+
in the Software without restriction, including without limitation the rights
|
|
8
|
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
9
|
+
copies of the Software, and to permit persons to whom the Software is
|
|
10
|
+
furnished to do so, subject to the following conditions:
|
|
11
|
+
|
|
12
|
+
The above copyright notice and this permission notice shall be included in all
|
|
13
|
+
copies or substantial portions of the Software.
|
|
14
|
+
|
|
15
|
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
16
|
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
17
|
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
18
|
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
19
|
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
20
|
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
21
|
+
SOFTWARE.
|
|
@@ -0,0 +1,324 @@
|
|
|
1
|
+
Metadata-Version: 2.2
|
|
2
|
+
Name: ai-atlasforge
|
|
3
|
+
Version: 1.2.3
|
|
4
|
+
Summary: Autonomous AI research and development platform powered by Claude
|
|
5
|
+
License: MIT
|
|
6
|
+
Project-URL: Homepage, https://github.com/DragonShadows1978/AI-AtlasForge
|
|
7
|
+
Project-URL: Documentation, https://github.com/DragonShadows1978/AI-AtlasForge#readme
|
|
8
|
+
Project-URL: Repository, https://github.com/DragonShadows1978/AI-AtlasForge.git
|
|
9
|
+
Project-URL: Issues, https://github.com/DragonShadows1978/AI-AtlasForge/issues
|
|
10
|
+
Keywords: ai,claude,autonomous,research,development
|
|
11
|
+
Classifier: Development Status :: 4 - Beta
|
|
12
|
+
Classifier: Environment :: Console
|
|
13
|
+
Classifier: Environment :: Web Environment
|
|
14
|
+
Classifier: Intended Audience :: Developers
|
|
15
|
+
Classifier: License :: OSI Approved :: MIT License
|
|
16
|
+
Classifier: Operating System :: POSIX :: Linux
|
|
17
|
+
Classifier: Programming Language :: Python :: 3
|
|
18
|
+
Classifier: Programming Language :: Python :: 3.10
|
|
19
|
+
Classifier: Programming Language :: Python :: 3.11
|
|
20
|
+
Classifier: Programming Language :: Python :: 3.12
|
|
21
|
+
Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
|
|
22
|
+
Classifier: Topic :: Software Development :: Code Generators
|
|
23
|
+
Requires-Python: >=3.10
|
|
24
|
+
Description-Content-Type: text/markdown
|
|
25
|
+
License-File: LICENSE
|
|
26
|
+
Requires-Dist: flask>=2.0.0
|
|
27
|
+
Requires-Dist: flask-socketio>=5.0.0
|
|
28
|
+
Requires-Dist: simple-websocket>=0.5.0
|
|
29
|
+
Requires-Dist: anthropic>=0.18.0
|
|
30
|
+
Requires-Dist: watchdog>=3.0.0
|
|
31
|
+
Requires-Dist: psutil>=5.9.0
|
|
32
|
+
Requires-Dist: numpy>=1.21.0
|
|
33
|
+
Requires-Dist: scikit-learn>=1.0.0
|
|
34
|
+
Provides-Extra: dev
|
|
35
|
+
Requires-Dist: pytest>=7.0.0; extra == "dev"
|
|
36
|
+
Requires-Dist: pytest-cov>=4.0.0; extra == "dev"
|
|
37
|
+
Requires-Dist: black>=23.0.0; extra == "dev"
|
|
38
|
+
Requires-Dist: flake8>=6.0.0; extra == "dev"
|
|
39
|
+
Requires-Dist: mypy>=1.0.0; extra == "dev"
|
|
40
|
+
Provides-Extra: tray
|
|
41
|
+
Requires-Dist: PyGObject>=3.42.0; extra == "tray"
|
|
42
|
+
Provides-Extra: all
|
|
43
|
+
Requires-Dist: ai-atlasforge[dev,tray]; extra == "all"
|
|
44
|
+
|
|
45
|
+
# AI-AtlasForge
|
|
46
|
+
|
|
47
|
+
An autonomous AI research and development platform powered by Claude. Run long-duration missions, accumulate cross-session knowledge, and build software autonomously.
|
|
48
|
+
|
|
49
|
+
## What is AI-AtlasForge?
|
|
50
|
+
|
|
51
|
+
AI-AtlasForge is not a chatbot wrapper. It's an **autonomous research engine** that:
|
|
52
|
+
|
|
53
|
+
- Runs multi-day missions without human intervention
|
|
54
|
+
- Maintains mission continuity across context windows
|
|
55
|
+
- Accumulates knowledge that persists across sessions
|
|
56
|
+
- Self-corrects when drifting from objectives
|
|
57
|
+
- Adversarially tests its own outputs
|
|
58
|
+
|
|
59
|
+
## Quick Start
|
|
60
|
+
|
|
61
|
+
### Prerequisites
|
|
62
|
+
|
|
63
|
+
- Python 3.10+
|
|
64
|
+
- Anthropic API key (get one at https://console.anthropic.com/)
|
|
65
|
+
- Linux environment (tested on Ubuntu 22.04+, Debian 12+)
|
|
66
|
+
|
|
67
|
+
> **Platform Notes:**
|
|
68
|
+
> - **Windows:** Use WSL2 (Windows Subsystem for Linux)
|
|
69
|
+
> - **macOS:** Should work but is untested. Please report issues.
|
|
70
|
+
|
|
71
|
+
### Option 1: Standard Installation
|
|
72
|
+
|
|
73
|
+
```bash
|
|
74
|
+
# Clone the repository
|
|
75
|
+
git clone https://github.com/DragonShadows1978/AI-AtlasForge.git
|
|
76
|
+
cd AI-AtlasForge
|
|
77
|
+
|
|
78
|
+
# Run the installer
|
|
79
|
+
./install.sh
|
|
80
|
+
|
|
81
|
+
# Configure your API key
|
|
82
|
+
export ANTHROPIC_API_KEY='your-key-here'
|
|
83
|
+
# Or edit config.yaml / .env
|
|
84
|
+
|
|
85
|
+
# Verify installation
|
|
86
|
+
./verify.sh
|
|
87
|
+
```
|
|
88
|
+
|
|
89
|
+
### Option 2: One-Liner Install
|
|
90
|
+
|
|
91
|
+
```bash
|
|
92
|
+
curl -sSL https://raw.githubusercontent.com/DragonShadows1978/AI-AtlasForge/main/quick_install.sh | bash
|
|
93
|
+
```
|
|
94
|
+
|
|
95
|
+
### Option 3: Docker Installation
|
|
96
|
+
|
|
97
|
+
```bash
|
|
98
|
+
git clone https://github.com/DragonShadows1978/AI-AtlasForge.git
|
|
99
|
+
cd AI-AtlasForge
|
|
100
|
+
docker compose up -d
|
|
101
|
+
# Dashboard at http://localhost:5050
|
|
102
|
+
```
|
|
103
|
+
|
|
104
|
+
For detailed installation options, see [INSTALL.md](INSTALL.md) or [QUICKSTART.md](QUICKSTART.md).
|
|
105
|
+
|
|
106
|
+
### Running Your First Mission
|
|
107
|
+
|
|
108
|
+
1. **Start the Dashboard** (optional, for monitoring):
|
|
109
|
+
```bash
|
|
110
|
+
make dashboard
|
|
111
|
+
# Or: python3 dashboard_v2.py
|
|
112
|
+
# Access at http://localhost:5050
|
|
113
|
+
```
|
|
114
|
+
|
|
115
|
+
2. **Create a Mission**:
|
|
116
|
+
- Via Dashboard: Click "Create Mission" and enter your objectives
|
|
117
|
+
- Via Sample: Run `make sample-mission` to load a hello-world mission
|
|
118
|
+
- Via JSON: Create `state/mission.json` manually
|
|
119
|
+
|
|
120
|
+
3. **Start the Engine**:
|
|
121
|
+
```bash
|
|
122
|
+
make run
|
|
123
|
+
# Or: python3 claude_autonomous.py --mode=rd
|
|
124
|
+
```
|
|
125
|
+
|
|
126
|
+
### Development Commands
|
|
127
|
+
|
|
128
|
+
Run `make help` to see all available commands:
|
|
129
|
+
|
|
130
|
+
```bash
|
|
131
|
+
make install # Full installation
|
|
132
|
+
make verify # Verify installation
|
|
133
|
+
make dashboard # Start dashboard
|
|
134
|
+
make run # Start autonomous agent
|
|
135
|
+
make docker # Start with Docker
|
|
136
|
+
make sample-mission # Load sample mission
|
|
137
|
+
```
|
|
138
|
+
|
|
139
|
+
## Architecture
|
|
140
|
+
|
|
141
|
+
```
|
|
142
|
+
+-------------------+
|
|
143
|
+
| Mission State |
|
|
144
|
+
| (mission.json) |
|
|
145
|
+
+--------+----------+
|
|
146
|
+
|
|
|
147
|
+
+--------------+--------------+
|
|
148
|
+
| |
|
|
149
|
+
+---------v---------+ +--------v--------+
|
|
150
|
+
| AtlasForge | | Dashboard |
|
|
151
|
+
| (Execution Engine)| | (Monitoring) |
|
|
152
|
+
+---------+---------+ +-----------------+
|
|
153
|
+
|
|
|
154
|
+
+---------v---------+
|
|
155
|
+
| R&D Engine |
|
|
156
|
+
| (State Machine) |
|
|
157
|
+
+---------+---------+
|
|
158
|
+
|
|
|
159
|
+
+---------v-------------------+
|
|
160
|
+
| Stage Pipeline |
|
|
161
|
+
| |
|
|
162
|
+
| PLANNING -> BUILDING -> |
|
|
163
|
+
| TESTING -> ANALYZING -> |
|
|
164
|
+
| CYCLE_END -> COMPLETE |
|
|
165
|
+
+-----------------------------+
|
|
166
|
+
```
|
|
167
|
+
|
|
168
|
+
## Mission Lifecycle
|
|
169
|
+
|
|
170
|
+
1. **PLANNING** - Understand objectives, research codebase, create implementation plan
|
|
171
|
+
2. **BUILDING** - Implement the solution
|
|
172
|
+
3. **TESTING** - Validate implementation
|
|
173
|
+
4. **ANALYZING** - Evaluate results, identify issues
|
|
174
|
+
5. **CYCLE_END** - Generate reports, prepare continuation
|
|
175
|
+
6. **COMPLETE** - Mission finished
|
|
176
|
+
|
|
177
|
+
Missions can iterate through multiple cycles until success criteria are met.
|
|
178
|
+
|
|
179
|
+
## Core Components
|
|
180
|
+
|
|
181
|
+
### atlasforge.py
|
|
182
|
+
Main execution loop. Spawns Claude instances, manages state, handles graceful shutdown.
|
|
183
|
+
|
|
184
|
+
### af_engine.py
|
|
185
|
+
State machine for mission execution. Manages stages, enforces constraints, tracks progress.
|
|
186
|
+
|
|
187
|
+
### dashboard_v2.py
|
|
188
|
+
Web-based monitoring interface showing mission status, knowledge base, and analytics.
|
|
189
|
+
|
|
190
|
+
### Knowledge Base
|
|
191
|
+
SQLite database accumulating learnings across all missions:
|
|
192
|
+
- Techniques discovered
|
|
193
|
+
- Insights gained
|
|
194
|
+
- Gotchas encountered
|
|
195
|
+
- Reusable code patterns
|
|
196
|
+
|
|
197
|
+
### Adversarial Testing
|
|
198
|
+
Separate Claude instances that test implementations:
|
|
199
|
+
- RedTeam agents with no implementation knowledge
|
|
200
|
+
- Mutation testing
|
|
201
|
+
- Property-based testing
|
|
202
|
+
|
|
203
|
+
### GlassBox
|
|
204
|
+
Post-mission introspection system:
|
|
205
|
+
- Transcript parsing
|
|
206
|
+
- Agent hierarchy reconstruction
|
|
207
|
+
- Stage timeline visualization
|
|
208
|
+
|
|
209
|
+
## Key Features
|
|
210
|
+
|
|
211
|
+
### Display Layer (Windows)
|
|
212
|
+
Visual environment for graphical application testing:
|
|
213
|
+
- Screenshot capture from virtual display
|
|
214
|
+
- Web-accessible display via noVNC (localhost:6080)
|
|
215
|
+
- Web terminal via ttyd (localhost:7681)
|
|
216
|
+
- Browser support for OAuth flows and web testing
|
|
217
|
+
- Automatic GPU detection with software fallback
|
|
218
|
+
|
|
219
|
+
See [DISPLAY_LAYER.md](workspace/docs/DISPLAY_LAYER.md) for the user guide.
|
|
220
|
+
|
|
221
|
+
### Mission Continuity
|
|
222
|
+
Missions survive context window limits through:
|
|
223
|
+
- Persistent mission.json state
|
|
224
|
+
- Cycle-based iteration
|
|
225
|
+
- Continuation prompts that preserve context
|
|
226
|
+
|
|
227
|
+
### Knowledge Accumulation
|
|
228
|
+
Every mission adds to the knowledge base. The system improves over time as it learns patterns, gotchas, and techniques.
|
|
229
|
+
|
|
230
|
+
### Autonomous Operation
|
|
231
|
+
Designed for unattended execution:
|
|
232
|
+
- Graceful crash recovery
|
|
233
|
+
- Stage checkpointing
|
|
234
|
+
- Automatic cycle progression
|
|
235
|
+
|
|
236
|
+
## Directory Structure
|
|
237
|
+
|
|
238
|
+
```
|
|
239
|
+
AI-AtlasForge/
|
|
240
|
+
+-- atlasforge.py # Main entry point
|
|
241
|
+
+-- af_engine.py # Stage state machine
|
|
242
|
+
+-- dashboard_v2.py # Web dashboard
|
|
243
|
+
+-- adversarial_testing/ # Testing framework
|
|
244
|
+
+-- atlasforge_enhancements/ # Enhancement modules
|
|
245
|
+
+-- workspace/ # Active workspace
|
|
246
|
+
| +-- glassbox/ # Introspection tools
|
|
247
|
+
| +-- artifacts/ # Plans, reports
|
|
248
|
+
| +-- research/ # Notes, findings
|
|
249
|
+
| +-- tests/ # Test scripts
|
|
250
|
+
+-- state/ # Runtime state
|
|
251
|
+
| +-- mission.json # Current mission
|
|
252
|
+
| +-- claude_state.json # Execution state
|
|
253
|
+
+-- missions/ # Mission workspaces
|
|
254
|
+
+-- atlasforge_data/
|
|
255
|
+
| +-- knowledge_base/ # Accumulated learnings
|
|
256
|
+
+-- logs/ # Execution logs
|
|
257
|
+
```
|
|
258
|
+
|
|
259
|
+
## Configuration
|
|
260
|
+
|
|
261
|
+
AI-AtlasForge uses environment variables for configuration:
|
|
262
|
+
|
|
263
|
+
| Variable | Default | Description |
|
|
264
|
+
|----------|---------|-------------|
|
|
265
|
+
| `ATLASFORGE_PORT` | `5050` | Dashboard port |
|
|
266
|
+
| `ATLASFORGE_ROOT` | (script directory) | Base directory |
|
|
267
|
+
| `ATLASFORGE_DEBUG` | `false` | Enable debug logging |
|
|
268
|
+
|
|
269
|
+
## Dashboard Features
|
|
270
|
+
|
|
271
|
+
The web dashboard provides real-time monitoring:
|
|
272
|
+
|
|
273
|
+
- **Mission Status** - Current stage, progress, timing
|
|
274
|
+
- **Activity Feed** - Live log of agent actions
|
|
275
|
+
- **Knowledge Base** - Search and browse learnings
|
|
276
|
+
- **Analytics** - Token usage, cost tracking
|
|
277
|
+
- **Mission Queue** - Queue and schedule missions
|
|
278
|
+
- **GlassBox** - Post-mission analysis
|
|
279
|
+
|
|
280
|
+
## Philosophy
|
|
281
|
+
|
|
282
|
+
**First principles only.** No frameworks hiding integration failures. Every component built from scratch for full visibility.
|
|
283
|
+
|
|
284
|
+
**Speed of machine, not human.** Designed for autonomous operation. Check in when convenient, not when required.
|
|
285
|
+
|
|
286
|
+
**Knowledge accumulates.** Every mission adds to the knowledge base. The system gets better over time.
|
|
287
|
+
|
|
288
|
+
**Trust but verify.** Adversarial testing catches what regular testing misses. The agent that writes the code is never the one that validates it.
|
|
289
|
+
|
|
290
|
+
## Requirements
|
|
291
|
+
|
|
292
|
+
- Python 3.10+
|
|
293
|
+
- Node.js 18+ (optional, for dashboard JS modifications)
|
|
294
|
+
- Anthropic API key
|
|
295
|
+
- Linux environment (Ubuntu 22.04+, Debian 12+)
|
|
296
|
+
|
|
297
|
+
### Python Dependencies
|
|
298
|
+
|
|
299
|
+
See `requirements.txt` or `pyproject.toml` for the full list.
|
|
300
|
+
|
|
301
|
+
## Documentation
|
|
302
|
+
|
|
303
|
+
- [QUICKSTART.md](QUICKSTART.md) - Get started in 5 minutes
|
|
304
|
+
- [INSTALL.md](INSTALL.md) - Detailed installation guide
|
|
305
|
+
- [USAGE.md](USAGE.md) - How to use AI-AtlasForge
|
|
306
|
+
- [ARCHITECTURE.md](ARCHITECTURE.md) - System architecture
|
|
307
|
+
- [DISPLAY_LAYER.md](workspace/docs/DISPLAY_LAYER.md) - Display Layer user guide (Windows)
|
|
308
|
+
- [TROUBLESHOOTING.md](workspace/docs/TROUBLESHOOTING.md) - Display Layer troubleshooting
|
|
309
|
+
|
|
310
|
+
## License
|
|
311
|
+
|
|
312
|
+
MIT License - see [LICENSE](LICENSE) for details.
|
|
313
|
+
|
|
314
|
+
## Contributing
|
|
315
|
+
|
|
316
|
+
Contributions are welcome! Please feel free to submit issues and pull requests.
|
|
317
|
+
|
|
318
|
+
## Related Projects
|
|
319
|
+
|
|
320
|
+
- **[AI-AfterImage](https://github.com/DragonShadows1978/AI-AfterImage)** - Episodic memory for AI coding agents. Gives Claude Code persistent memory of code it has written across sessions. Works great with AtlasForge for cross-mission code recall.
|
|
321
|
+
|
|
322
|
+
## Acknowledgments
|
|
323
|
+
|
|
324
|
+
Built on Claude by Anthropic. Special thanks to the Claude Code team for making autonomous AI development possible.
|
|
@@ -0,0 +1,280 @@
|
|
|
1
|
+
# AI-AtlasForge
|
|
2
|
+
|
|
3
|
+
An autonomous AI research and development platform powered by Claude. Run long-duration missions, accumulate cross-session knowledge, and build software autonomously.
|
|
4
|
+
|
|
5
|
+
## What is AI-AtlasForge?
|
|
6
|
+
|
|
7
|
+
AI-AtlasForge is not a chatbot wrapper. It's an **autonomous research engine** that:
|
|
8
|
+
|
|
9
|
+
- Runs multi-day missions without human intervention
|
|
10
|
+
- Maintains mission continuity across context windows
|
|
11
|
+
- Accumulates knowledge that persists across sessions
|
|
12
|
+
- Self-corrects when drifting from objectives
|
|
13
|
+
- Adversarially tests its own outputs
|
|
14
|
+
|
|
15
|
+
## Quick Start
|
|
16
|
+
|
|
17
|
+
### Prerequisites
|
|
18
|
+
|
|
19
|
+
- Python 3.10+
|
|
20
|
+
- Anthropic API key (get one at https://console.anthropic.com/)
|
|
21
|
+
- Linux environment (tested on Ubuntu 22.04+, Debian 12+)
|
|
22
|
+
|
|
23
|
+
> **Platform Notes:**
|
|
24
|
+
> - **Windows:** Use WSL2 (Windows Subsystem for Linux)
|
|
25
|
+
> - **macOS:** Should work but is untested. Please report issues.
|
|
26
|
+
|
|
27
|
+
### Option 1: Standard Installation
|
|
28
|
+
|
|
29
|
+
```bash
|
|
30
|
+
# Clone the repository
|
|
31
|
+
git clone https://github.com/DragonShadows1978/AI-AtlasForge.git
|
|
32
|
+
cd AI-AtlasForge
|
|
33
|
+
|
|
34
|
+
# Run the installer
|
|
35
|
+
./install.sh
|
|
36
|
+
|
|
37
|
+
# Configure your API key
|
|
38
|
+
export ANTHROPIC_API_KEY='your-key-here'
|
|
39
|
+
# Or edit config.yaml / .env
|
|
40
|
+
|
|
41
|
+
# Verify installation
|
|
42
|
+
./verify.sh
|
|
43
|
+
```
|
|
44
|
+
|
|
45
|
+
### Option 2: One-Liner Install
|
|
46
|
+
|
|
47
|
+
```bash
|
|
48
|
+
curl -sSL https://raw.githubusercontent.com/DragonShadows1978/AI-AtlasForge/main/quick_install.sh | bash
|
|
49
|
+
```
|
|
50
|
+
|
|
51
|
+
### Option 3: Docker Installation
|
|
52
|
+
|
|
53
|
+
```bash
|
|
54
|
+
git clone https://github.com/DragonShadows1978/AI-AtlasForge.git
|
|
55
|
+
cd AI-AtlasForge
|
|
56
|
+
docker compose up -d
|
|
57
|
+
# Dashboard at http://localhost:5050
|
|
58
|
+
```
|
|
59
|
+
|
|
60
|
+
For detailed installation options, see [INSTALL.md](INSTALL.md) or [QUICKSTART.md](QUICKSTART.md).
|
|
61
|
+
|
|
62
|
+
### Running Your First Mission
|
|
63
|
+
|
|
64
|
+
1. **Start the Dashboard** (optional, for monitoring):
|
|
65
|
+
```bash
|
|
66
|
+
make dashboard
|
|
67
|
+
# Or: python3 dashboard_v2.py
|
|
68
|
+
# Access at http://localhost:5050
|
|
69
|
+
```
|
|
70
|
+
|
|
71
|
+
2. **Create a Mission**:
|
|
72
|
+
- Via Dashboard: Click "Create Mission" and enter your objectives
|
|
73
|
+
- Via Sample: Run `make sample-mission` to load a hello-world mission
|
|
74
|
+
- Via JSON: Create `state/mission.json` manually
|
|
75
|
+
|
|
76
|
+
3. **Start the Engine**:
|
|
77
|
+
```bash
|
|
78
|
+
make run
|
|
79
|
+
# Or: python3 claude_autonomous.py --mode=rd
|
|
80
|
+
```
|
|
81
|
+
|
|
82
|
+
### Development Commands
|
|
83
|
+
|
|
84
|
+
Run `make help` to see all available commands:
|
|
85
|
+
|
|
86
|
+
```bash
|
|
87
|
+
make install # Full installation
|
|
88
|
+
make verify # Verify installation
|
|
89
|
+
make dashboard # Start dashboard
|
|
90
|
+
make run # Start autonomous agent
|
|
91
|
+
make docker # Start with Docker
|
|
92
|
+
make sample-mission # Load sample mission
|
|
93
|
+
```
|
|
94
|
+
|
|
95
|
+
## Architecture
|
|
96
|
+
|
|
97
|
+
```
|
|
98
|
+
+-------------------+
|
|
99
|
+
| Mission State |
|
|
100
|
+
| (mission.json) |
|
|
101
|
+
+--------+----------+
|
|
102
|
+
|
|
|
103
|
+
+--------------+--------------+
|
|
104
|
+
| |
|
|
105
|
+
+---------v---------+ +--------v--------+
|
|
106
|
+
| AtlasForge | | Dashboard |
|
|
107
|
+
| (Execution Engine)| | (Monitoring) |
|
|
108
|
+
+---------+---------+ +-----------------+
|
|
109
|
+
|
|
|
110
|
+
+---------v---------+
|
|
111
|
+
| R&D Engine |
|
|
112
|
+
| (State Machine) |
|
|
113
|
+
+---------+---------+
|
|
114
|
+
|
|
|
115
|
+
+---------v-------------------+
|
|
116
|
+
| Stage Pipeline |
|
|
117
|
+
| |
|
|
118
|
+
| PLANNING -> BUILDING -> |
|
|
119
|
+
| TESTING -> ANALYZING -> |
|
|
120
|
+
| CYCLE_END -> COMPLETE |
|
|
121
|
+
+-----------------------------+
|
|
122
|
+
```
|
|
123
|
+
|
|
124
|
+
## Mission Lifecycle
|
|
125
|
+
|
|
126
|
+
1. **PLANNING** - Understand objectives, research codebase, create implementation plan
|
|
127
|
+
2. **BUILDING** - Implement the solution
|
|
128
|
+
3. **TESTING** - Validate implementation
|
|
129
|
+
4. **ANALYZING** - Evaluate results, identify issues
|
|
130
|
+
5. **CYCLE_END** - Generate reports, prepare continuation
|
|
131
|
+
6. **COMPLETE** - Mission finished
|
|
132
|
+
|
|
133
|
+
Missions can iterate through multiple cycles until success criteria are met.
|
|
134
|
+
|
|
135
|
+
## Core Components
|
|
136
|
+
|
|
137
|
+
### atlasforge.py
|
|
138
|
+
Main execution loop. Spawns Claude instances, manages state, handles graceful shutdown.
|
|
139
|
+
|
|
140
|
+
### af_engine.py
|
|
141
|
+
State machine for mission execution. Manages stages, enforces constraints, tracks progress.
|
|
142
|
+
|
|
143
|
+
### dashboard_v2.py
|
|
144
|
+
Web-based monitoring interface showing mission status, knowledge base, and analytics.
|
|
145
|
+
|
|
146
|
+
### Knowledge Base
|
|
147
|
+
SQLite database accumulating learnings across all missions:
|
|
148
|
+
- Techniques discovered
|
|
149
|
+
- Insights gained
|
|
150
|
+
- Gotchas encountered
|
|
151
|
+
- Reusable code patterns
|
|
152
|
+
|
|
153
|
+
### Adversarial Testing
|
|
154
|
+
Separate Claude instances that test implementations:
|
|
155
|
+
- RedTeam agents with no implementation knowledge
|
|
156
|
+
- Mutation testing
|
|
157
|
+
- Property-based testing
|
|
158
|
+
|
|
159
|
+
### GlassBox
|
|
160
|
+
Post-mission introspection system:
|
|
161
|
+
- Transcript parsing
|
|
162
|
+
- Agent hierarchy reconstruction
|
|
163
|
+
- Stage timeline visualization
|
|
164
|
+
|
|
165
|
+
## Key Features
|
|
166
|
+
|
|
167
|
+
### Display Layer (Windows)
|
|
168
|
+
Visual environment for graphical application testing:
|
|
169
|
+
- Screenshot capture from virtual display
|
|
170
|
+
- Web-accessible display via noVNC (localhost:6080)
|
|
171
|
+
- Web terminal via ttyd (localhost:7681)
|
|
172
|
+
- Browser support for OAuth flows and web testing
|
|
173
|
+
- Automatic GPU detection with software fallback
|
|
174
|
+
|
|
175
|
+
See [DISPLAY_LAYER.md](workspace/docs/DISPLAY_LAYER.md) for the user guide.
|
|
176
|
+
|
|
177
|
+
### Mission Continuity
|
|
178
|
+
Missions survive context window limits through:
|
|
179
|
+
- Persistent mission.json state
|
|
180
|
+
- Cycle-based iteration
|
|
181
|
+
- Continuation prompts that preserve context
|
|
182
|
+
|
|
183
|
+
### Knowledge Accumulation
|
|
184
|
+
Every mission adds to the knowledge base. The system improves over time as it learns patterns, gotchas, and techniques.
|
|
185
|
+
|
|
186
|
+
### Autonomous Operation
|
|
187
|
+
Designed for unattended execution:
|
|
188
|
+
- Graceful crash recovery
|
|
189
|
+
- Stage checkpointing
|
|
190
|
+
- Automatic cycle progression
|
|
191
|
+
|
|
192
|
+
## Directory Structure
|
|
193
|
+
|
|
194
|
+
```
|
|
195
|
+
AI-AtlasForge/
|
|
196
|
+
+-- atlasforge.py # Main entry point
|
|
197
|
+
+-- af_engine.py # Stage state machine
|
|
198
|
+
+-- dashboard_v2.py # Web dashboard
|
|
199
|
+
+-- adversarial_testing/ # Testing framework
|
|
200
|
+
+-- atlasforge_enhancements/ # Enhancement modules
|
|
201
|
+
+-- workspace/ # Active workspace
|
|
202
|
+
| +-- glassbox/ # Introspection tools
|
|
203
|
+
| +-- artifacts/ # Plans, reports
|
|
204
|
+
| +-- research/ # Notes, findings
|
|
205
|
+
| +-- tests/ # Test scripts
|
|
206
|
+
+-- state/ # Runtime state
|
|
207
|
+
| +-- mission.json # Current mission
|
|
208
|
+
| +-- claude_state.json # Execution state
|
|
209
|
+
+-- missions/ # Mission workspaces
|
|
210
|
+
+-- atlasforge_data/
|
|
211
|
+
| +-- knowledge_base/ # Accumulated learnings
|
|
212
|
+
+-- logs/ # Execution logs
|
|
213
|
+
```
|
|
214
|
+
|
|
215
|
+
## Configuration
|
|
216
|
+
|
|
217
|
+
AI-AtlasForge uses environment variables for configuration:
|
|
218
|
+
|
|
219
|
+
| Variable | Default | Description |
|
|
220
|
+
|----------|---------|-------------|
|
|
221
|
+
| `ATLASFORGE_PORT` | `5050` | Dashboard port |
|
|
222
|
+
| `ATLASFORGE_ROOT` | (script directory) | Base directory |
|
|
223
|
+
| `ATLASFORGE_DEBUG` | `false` | Enable debug logging |
|
|
224
|
+
|
|
225
|
+
## Dashboard Features
|
|
226
|
+
|
|
227
|
+
The web dashboard provides real-time monitoring:
|
|
228
|
+
|
|
229
|
+
- **Mission Status** - Current stage, progress, timing
|
|
230
|
+
- **Activity Feed** - Live log of agent actions
|
|
231
|
+
- **Knowledge Base** - Search and browse learnings
|
|
232
|
+
- **Analytics** - Token usage, cost tracking
|
|
233
|
+
- **Mission Queue** - Queue and schedule missions
|
|
234
|
+
- **GlassBox** - Post-mission analysis
|
|
235
|
+
|
|
236
|
+
## Philosophy
|
|
237
|
+
|
|
238
|
+
**First principles only.** No frameworks hiding integration failures. Every component built from scratch for full visibility.
|
|
239
|
+
|
|
240
|
+
**Speed of machine, not human.** Designed for autonomous operation. Check in when convenient, not when required.
|
|
241
|
+
|
|
242
|
+
**Knowledge accumulates.** Every mission adds to the knowledge base. The system gets better over time.
|
|
243
|
+
|
|
244
|
+
**Trust but verify.** Adversarial testing catches what regular testing misses. The agent that writes the code is never the one that validates it.
|
|
245
|
+
|
|
246
|
+
## Requirements
|
|
247
|
+
|
|
248
|
+
- Python 3.10+
|
|
249
|
+
- Node.js 18+ (optional, for dashboard JS modifications)
|
|
250
|
+
- Anthropic API key
|
|
251
|
+
- Linux environment (Ubuntu 22.04+, Debian 12+)
|
|
252
|
+
|
|
253
|
+
### Python Dependencies
|
|
254
|
+
|
|
255
|
+
See `requirements.txt` or `pyproject.toml` for the full list.
|
|
256
|
+
|
|
257
|
+
## Documentation
|
|
258
|
+
|
|
259
|
+
- [QUICKSTART.md](QUICKSTART.md) - Get started in 5 minutes
|
|
260
|
+
- [INSTALL.md](INSTALL.md) - Detailed installation guide
|
|
261
|
+
- [USAGE.md](USAGE.md) - How to use AI-AtlasForge
|
|
262
|
+
- [ARCHITECTURE.md](ARCHITECTURE.md) - System architecture
|
|
263
|
+
- [DISPLAY_LAYER.md](workspace/docs/DISPLAY_LAYER.md) - Display Layer user guide (Windows)
|
|
264
|
+
- [TROUBLESHOOTING.md](workspace/docs/TROUBLESHOOTING.md) - Display Layer troubleshooting
|
|
265
|
+
|
|
266
|
+
## License
|
|
267
|
+
|
|
268
|
+
MIT License - see [LICENSE](LICENSE) for details.
|
|
269
|
+
|
|
270
|
+
## Contributing
|
|
271
|
+
|
|
272
|
+
Contributions are welcome! Please feel free to submit issues and pull requests.
|
|
273
|
+
|
|
274
|
+
## Related Projects
|
|
275
|
+
|
|
276
|
+
- **[AI-AfterImage](https://github.com/DragonShadows1978/AI-AfterImage)** - Episodic memory for AI coding agents. Gives Claude Code persistent memory of code it has written across sessions. Works great with AtlasForge for cross-mission code recall.
|
|
277
|
+
|
|
278
|
+
## Acknowledgments
|
|
279
|
+
|
|
280
|
+
Built on Claude by Anthropic. Special thanks to the Claude Code team for making autonomous AI development possible.
|