@covibes/zeroshot 4.2.0 → 5.0.0
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +14 -0
- package/README.md +31 -29
- package/cli/index.js +9 -5
- package/lib/settings.js +1 -3
- package/package.json +1 -1
package/CHANGELOG.md
CHANGED
|
@@ -1,3 +1,17 @@
|
|
|
1
|
+
# [5.0.0](https://github.com/covibes/zeroshot/compare/v4.2.0...v5.0.0) (2026-01-07)
|
|
2
|
+
|
|
3
|
+
|
|
4
|
+
* feat!: remove interactive setup wizard ([5438953](https://github.com/covibes/zeroshot/commit/54389536e478be1dce0ab707ac7ef8e4ef6ce26d))
|
|
5
|
+
|
|
6
|
+
|
|
7
|
+
### BREAKING CHANGES
|
|
8
|
+
|
|
9
|
+
* Interactive setup wizard removed. Configure via:
|
|
10
|
+
zeroshot settings set maxModel opus
|
|
11
|
+
zeroshot settings set dockerMounts '["gh","git","ssh"]'
|
|
12
|
+
|
|
13
|
+
Closes: Setup wizard blocking non-interactive usage
|
|
14
|
+
|
|
1
15
|
# [4.2.0](https://github.com/covibes/zeroshot/compare/v4.1.4...v4.2.0) (2026-01-06)
|
|
2
16
|
|
|
3
17
|
|
package/README.md
CHANGED
|
@@ -8,7 +8,24 @@
|
|
|
8
8
|
|
|
9
9
|
> **2024** was the year of LLMs. **2025** was the year of agents. **2026** is the year of agent clusters.
|
|
10
10
|
|
|
11
|
-
**
|
|
11
|
+
**Autonomous engineering teams for Claude Code.**
|
|
12
|
+
|
|
13
|
+
## Install
|
|
14
|
+
|
|
15
|
+
**Platforms**: Linux, macOS
|
|
16
|
+
|
|
17
|
+
```bash
|
|
18
|
+
npm install -g @covibes/zeroshot
|
|
19
|
+
```
|
|
20
|
+
|
|
21
|
+
**Requires**: Node 18+, [Claude Code CLI](https://claude.com/product/claude-code), [GitHub CLI](https://cli.github.com/)
|
|
22
|
+
|
|
23
|
+
```bash
|
|
24
|
+
npm i -g @anthropic-ai/claude-code && claude auth login
|
|
25
|
+
gh auth login
|
|
26
|
+
```
|
|
27
|
+
|
|
28
|
+
---
|
|
12
29
|
|
|
13
30
|
You know the problem. Your AI agent:
|
|
14
31
|
|
|
@@ -44,7 +61,7 @@ with details of what conflicted. Handle the ABA problem where version goes A->B-
|
|
|
44
61
|
<p align="center">
|
|
45
62
|
<img src="./docs/assets/zeroshot-demo.gif" alt="Demo" width="700">
|
|
46
63
|
<br>
|
|
47
|
-
<em>Sped up 100x — 90 minutes,
|
|
64
|
+
<em>Sped up 100x — 90 minutes, 5 iterations until validators approved</em>
|
|
48
65
|
</p>
|
|
49
66
|
|
|
50
67
|
**The full fix cycle.** Initial implementation passed basic tests but validators caught edge cases: race conditions in concurrent updates, ABA problem not fully handled, retry backoff timing issues. Each rejection triggered fixes until all 48 tests passed with 91%+ coverage.
|
|
@@ -59,15 +76,15 @@ A single agent would say "done!" after the first implementation. Here, the adver
|
|
|
59
76
|
|
|
60
77
|
**Zeroshot requires well-defined tasks with clear acceptance criteria.**
|
|
61
78
|
|
|
62
|
-
| Scenario |
|
|
63
|
-
|
|
64
|
-
|
|
|
65
|
-
|
|
|
66
|
-
|
|
|
67
|
-
|
|
|
68
|
-
|
|
|
69
|
-
|
|
|
70
|
-
|
|
|
79
|
+
| Scenario | Use? | Why |
|
|
80
|
+
|----------|:----:|-----|
|
|
81
|
+
| Add rate limiting (sliding window, per-IP, 429) | ✅ | Clear requirements |
|
|
82
|
+
| Refactor auth to JWT | ✅ | Defined end state |
|
|
83
|
+
| Fix login bug | ✅ | Success is measurable |
|
|
84
|
+
| Fix 2410 lint violations | ✅ | Clear completion criteria |
|
|
85
|
+
| Make the app faster | ❌ | Needs exploration first |
|
|
86
|
+
| Improve the codebase | ❌ | No acceptance criteria |
|
|
87
|
+
| Figure out flaky tests | ❌ | Exploratory |
|
|
71
88
|
|
|
72
89
|
**Known unknowns** (implementation details unclear) → Zeroshot handles this. The planner figures it out.
|
|
73
90
|
|
|
@@ -84,23 +101,6 @@ Crash recovery (`zeroshot resume`) means multi-hour tasks survive interruptions.
|
|
|
84
101
|
|
|
85
102
|
---
|
|
86
103
|
|
|
87
|
-
## Install
|
|
88
|
-
|
|
89
|
-
**Platforms**: Linux, macOS
|
|
90
|
-
|
|
91
|
-
```bash
|
|
92
|
-
npm install -g @covibes/zeroshot
|
|
93
|
-
```
|
|
94
|
-
|
|
95
|
-
**Requires**: Node 18+, [Claude Code CLI](https://claude.com/product/claude-code), [GitHub CLI](https://cli.github.com/)
|
|
96
|
-
|
|
97
|
-
```bash
|
|
98
|
-
npm i -g @anthropic-ai/claude-code && claude auth login
|
|
99
|
-
gh auth login
|
|
100
|
-
```
|
|
101
|
-
|
|
102
|
-
---
|
|
103
|
-
|
|
104
104
|
## Commands
|
|
105
105
|
|
|
106
106
|
```bash
|
|
@@ -344,12 +344,14 @@ Full isolation in a fresh container. Your workspace stays untouched. Good for ri
|
|
|
344
344
|
|
|
345
345
|
| Scenario | Recommended |
|
|
346
346
|
| -------- | ----------- |
|
|
347
|
-
| Quick
|
|
347
|
+
| Quick task, review changes yourself | No isolation (default) |
|
|
348
348
|
| PR workflow, code review | `--worktree` or `--pr` |
|
|
349
349
|
| Risky experiment, might break things | `--docker` |
|
|
350
350
|
| Running multiple tasks in parallel | `--docker` |
|
|
351
351
|
| Full automation, no review needed | `--ship` |
|
|
352
352
|
|
|
353
|
+
**Default mode:** Agents are instructed to only modify files (no git commit/push). You review and commit yourself.
|
|
354
|
+
|
|
353
355
|
<details>
|
|
354
356
|
<summary><strong>Docker Credential Mounts</strong></summary>
|
|
355
357
|
|
package/cli/index.js
CHANGED
|
@@ -48,7 +48,7 @@ const {
|
|
|
48
48
|
} = require('../lib/settings');
|
|
49
49
|
const { MOUNT_PRESETS, resolveEnvs } = require('../lib/docker-config');
|
|
50
50
|
const { requirePreflight } = require('../src/preflight');
|
|
51
|
-
|
|
51
|
+
// Setup wizard removed - use: zeroshot settings set <key> <value>
|
|
52
52
|
const { checkForUpdates } = require('./lib/update-checker');
|
|
53
53
|
const { StatusFooter, AGENT_STATE, ACTIVE_STATES } = require('../src/status-footer');
|
|
54
54
|
|
|
@@ -2771,7 +2771,7 @@ const settingsCmd = program.command('settings').description('Manage zeroshot set
|
|
|
2771
2771
|
function formatSettingsList(settings, showUsage = false) {
|
|
2772
2772
|
const DOCKER_KEYS = ['dockerMounts', 'dockerEnvPassthrough', 'dockerContainerHome'];
|
|
2773
2773
|
|
|
2774
|
-
console.log(chalk.bold('\
|
|
2774
|
+
console.log(chalk.bold('\nSettings:\n'));
|
|
2775
2775
|
|
|
2776
2776
|
// Non-docker settings first
|
|
2777
2777
|
for (const [key, value] of Object.entries(settings)) {
|
|
@@ -2861,6 +2861,13 @@ function formatSettingsList(settings, showUsage = false) {
|
|
|
2861
2861
|
console.log(chalk.dim(' zeroshot settings get <key>'));
|
|
2862
2862
|
console.log(chalk.dim(' zeroshot settings reset'));
|
|
2863
2863
|
console.log('');
|
|
2864
|
+
console.log(chalk.dim('Examples:'));
|
|
2865
|
+
console.log(chalk.dim(' zeroshot settings set maxModel opus'));
|
|
2866
|
+
console.log(chalk.dim(' zeroshot settings set dockerMounts \'["gh","git","ssh","aws"]\''));
|
|
2867
|
+
console.log(chalk.dim(' zeroshot settings set dockerEnvPassthrough \'["AWS_*","TF_VAR_*"]\''));
|
|
2868
|
+
console.log('');
|
|
2869
|
+
console.log(chalk.dim('Available mount presets: gh, git, ssh, aws, azure, kube, terraform, gcloud'));
|
|
2870
|
+
console.log('');
|
|
2864
2871
|
}
|
|
2865
2872
|
}
|
|
2866
2873
|
|
|
@@ -4480,10 +4487,7 @@ function printMessage(msg, showClusterId = false, watchMode = false, isActive =
|
|
|
4480
4487
|
|
|
4481
4488
|
// Main async entry point
|
|
4482
4489
|
async function main() {
|
|
4483
|
-
// First-run setup wizard (blocks on first use only)
|
|
4484
|
-
// CRITICAL: Auto-enable quiet mode in test environment to prevent stdin hangs
|
|
4485
4490
|
const isQuiet = process.argv.includes('-q') || process.argv.includes('--quiet') || process.env.NODE_ENV === 'test';
|
|
4486
|
-
await checkFirstRun({ quiet: isQuiet });
|
|
4487
4491
|
|
|
4488
4492
|
// Check for updates (non-blocking if offline)
|
|
4489
4493
|
await checkForUpdates({ quiet: isQuiet });
|
package/lib/settings.js
CHANGED
|
@@ -57,7 +57,7 @@ function validateModelAgainstMax(requestedModel, maxModel) {
|
|
|
57
57
|
|
|
58
58
|
// Default settings
|
|
59
59
|
const DEFAULT_SETTINGS = {
|
|
60
|
-
maxModel: '
|
|
60
|
+
maxModel: 'opus', // Cost ceiling - agents cannot use models above this
|
|
61
61
|
defaultConfig: 'conductor-bootstrap',
|
|
62
62
|
defaultDocker: false,
|
|
63
63
|
strictSchema: true, // true = reliable json output (default), false = live streaming (may crash - see bold-meadow-11)
|
|
@@ -66,8 +66,6 @@ const DEFAULT_SETTINGS = {
|
|
|
66
66
|
autoCheckUpdates: true, // Check npm registry for newer versions
|
|
67
67
|
lastUpdateCheckAt: null, // Unix timestamp of last check (null = never checked)
|
|
68
68
|
lastSeenVersion: null, // Don't re-prompt for same version
|
|
69
|
-
// First-run wizard
|
|
70
|
-
firstRunComplete: false, // Has user completed first-run setup?
|
|
71
69
|
// Docker isolation mounts - preset names or {host, container, readonly?} objects
|
|
72
70
|
// Valid presets: gh, git, ssh, aws, azure, kube, terraform, gcloud
|
|
73
71
|
dockerMounts: ['gh', 'git', 'ssh'],
|