@diegopetrucci/pi-extensions 0.1.14 → 0.1.15
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/README.md
CHANGED
|
@@ -4,6 +4,7 @@ A collection of [pi](https://github.com/earendil-works/pi-mono) agent extensions
|
|
|
4
4
|
|
|
5
5
|
- [`minimal-footer`](./extensions/minimal-footer): Replaces pi's built-in footer with a minimal configurable two-line layout: branch/repo on the first line, context/model on the second, optional `DUMB ZONE`, plus OpenAI Codex 5-hour and 7-day usage when available.
|
|
6
6
|
- [`oracle`](./extensions/oracle): Adds an Amp-style read-only oracle tool that auto-selects the strongest reasoning model on the current provider/subscription, covers pi’s built-in providers with hardcoded rankings, sets reasoning to xhigh by default, and shows live status while running.
|
|
7
|
+
- [`context-cap`](./extensions/context-cap): Caps effective model context windows at 200k tokens by default so pi auto-compacts earlier; toggle temporarily with `/context-cap`.
|
|
7
8
|
- [`permission-gate`](./extensions/permission-gate): Prompts for confirmation before dangerous bash commands like `rm -rf`, `sudo`, and `chmod 777`.
|
|
8
9
|
- [`confirm-destructive`](./extensions/confirm-destructive): Confirms before destructive session actions like clear, switch, and fork.
|
|
9
10
|
- [`notify`](./extensions/notify): Sends configurable terminal, desktop, bell, and sound notifications when pi finishes and is ready for input.
|
|
@@ -21,13 +22,15 @@ pi install npm:@diegopetrucci/pi-extensions
|
|
|
21
22
|
Or pin the GitHub package to this release:
|
|
22
23
|
|
|
23
24
|
```bash
|
|
24
|
-
pi install git:github.com/diegopetrucci/pi-extensions@v0.1.14
|
|
25
|
+
pi install git:github.com/diegopetrucci/pi-extensions@v0.1.15
|
|
25
26
|
```
|
|
26
27
|
|
|
27
28
|
Or a specific extension:
|
|
28
29
|
|
|
29
30
|
```bash
|
|
30
31
|
pi install npm:@diegopetrucci/pi-oracle
|
|
32
|
+
# or
|
|
33
|
+
pi install npm:@diegopetrucci/pi-context-cap
|
|
31
34
|
```
|
|
32
35
|
|
|
33
36
|
Then reload pi:
|
|
@@ -0,0 +1,60 @@
|
|
|
1
|
+
# context-cap
|
|
2
|
+
|
|
3
|
+
A pi extension that treats large-context models as having an effective 200k-token context window, so pi's built-in auto-compaction starts earlier.
|
|
4
|
+
|
|
5
|
+
By default, pi auto-compacts when:
|
|
6
|
+
|
|
7
|
+
```text
|
|
8
|
+
contextTokens > model.contextWindow - reserveTokens
|
|
9
|
+
```
|
|
10
|
+
|
|
11
|
+
This extension changes the active model's in-memory `contextWindow` to:
|
|
12
|
+
|
|
13
|
+
```text
|
|
14
|
+
min(originalContextWindow, 200000)
|
|
15
|
+
```
|
|
16
|
+
|
|
17
|
+
With pi's default `reserveTokens` of 16,384, models larger than 200k will proactively compact around 183,616 tokens.
|
|
18
|
+
|
|
19
|
+
## Commands
|
|
20
|
+
|
|
21
|
+
```text
|
|
22
|
+
/context-cap status
|
|
23
|
+
/context-cap off
|
|
24
|
+
/context-cap on
|
|
25
|
+
/context-cap toggle
|
|
26
|
+
```
|
|
27
|
+
|
|
28
|
+
The extension starts enabled by default. Disabling is temporary for the current extension runtime/session; after `/reload`, `/new`, `/resume`, or `/fork`, the extension starts enabled again.
|
|
29
|
+
|
|
30
|
+
## Install
|
|
31
|
+
|
|
32
|
+
### Standalone npm package
|
|
33
|
+
|
|
34
|
+
```bash
|
|
35
|
+
pi install npm:@diegopetrucci/pi-context-cap
|
|
36
|
+
```
|
|
37
|
+
|
|
38
|
+
### Collection package
|
|
39
|
+
|
|
40
|
+
```bash
|
|
41
|
+
pi install npm:@diegopetrucci/pi-extensions
|
|
42
|
+
```
|
|
43
|
+
|
|
44
|
+
### GitHub package
|
|
45
|
+
|
|
46
|
+
```bash
|
|
47
|
+
pi install git:github.com/diegopetrucci/pi-extensions
|
|
48
|
+
```
|
|
49
|
+
|
|
50
|
+
Then reload pi:
|
|
51
|
+
|
|
52
|
+
```text
|
|
53
|
+
/reload
|
|
54
|
+
```
|
|
55
|
+
|
|
56
|
+
## Notes
|
|
57
|
+
|
|
58
|
+
- This extension mutates pi's in-memory model metadata only. It does not edit `models.json`.
|
|
59
|
+
- The cap affects pi logic that reads `model.contextWindow`, including auto-compaction thresholding and UI context-window display.
|
|
60
|
+
- Because pi also uses `model.contextWindow` for some overflow detection, a request that succeeds above 200k tokens on a larger model may be treated as overflow and retried after compaction. Use `/context-cap off` if you need the full model window temporarily.
|
|
@@ -0,0 +1,179 @@
|
|
|
1
|
+
import type { ExtensionAPI, ExtensionContext } from "@earendil-works/pi-coding-agent";
|
|
2
|
+
import type { Model, Api } from "@earendil-works/pi-ai";
|
|
3
|
+
|
|
4
|
+
/** Upper bound, in tokens, applied to a model's `contextWindow` while the cap is active. */
const DEFAULT_MAX_CONTEXT_WINDOW = 200_000;
|
|
5
|
+
/** Any model object this extension may mutate, regardless of its API type parameter. */
type AnyModel = Model<Api> | Model<any>;
|
|
6
|
+
|
|
7
|
+
/** Remembers, per model object, the `contextWindow` value seen before this module first changed it. */
const originalContextWindows = new WeakMap<AnyModel, number>();
|
|
8
|
+
/** Every model whose original window has been recorded; iterated on session shutdown to restore them. */
const touchedModels = new Set<AnyModel>();
|
|
9
|
+
|
|
10
|
+
/** Outcome of applying the cap to a single model. */
type ApplyResult = {
|
|
11
|
+
// True when the model's `contextWindow` differed from the capped value before it was written.
changed: boolean;
|
|
12
|
+
// `provider/id` label of the model.
key: string;
|
|
13
|
+
// The recorded pre-cap context window.
original: number;
|
|
14
|
+
// The smaller of `original` and the cap; the value written to the model.
effective: number;
|
|
15
|
+
};
|
|
16
|
+
|
|
17
|
+
/**
 * Builds the `provider/id` label that identifies a model in messages.
 *
 * @param model - The model to label.
 * @returns The provider and id joined by a slash.
 */
function modelKey(model: AnyModel): string {
  const { provider, id } = model;
  return `${provider}/${id}`;
}
|
|
20
|
+
|
|
21
|
+
/**
 * Returns the context window a model had before this module changed it.
 *
 * The first call for a given model object records its current
 * `contextWindow` and adds the model to `touchedModels`; later calls return
 * the recorded value even if the live property has been changed since.
 *
 * @param model - The model to look up.
 * @returns The recorded original context window.
 */
function getOriginalContextWindow(model: AnyModel): number {
  const recorded = originalContextWindows.get(model);
  if (typeof recorded !== "number") {
    // First sighting: snapshot the live value before anything overwrites it.
    originalContextWindows.set(model, model.contextWindow);
    touchedModels.add(model);
    return model.contextWindow;
  }

  return recorded;
}
|
|
29
|
+
|
|
30
|
+
/**
 * Computes the context window a model would have with the cap applied.
 *
 * Does not write to `model.contextWindow`; it may record the model's
 * original window as a side effect of looking it up.
 *
 * @param model - The model to evaluate.
 * @returns The smaller of the original window and the cap.
 */
function getEffectiveContextWindow(model: AnyModel): number {
  const uncapped = getOriginalContextWindow(model);
  return Math.min(uncapped, DEFAULT_MAX_CONTEXT_WINDOW);
}
|
|
33
|
+
|
|
34
|
+
/**
 * Caps a model's in-memory `contextWindow` at `DEFAULT_MAX_CONTEXT_WINDOW`.
 *
 * @param model - The model to cap; `undefined` is accepted and ignored.
 * @returns Details of the applied cap, or `undefined` when there is no model
 *   or the model has no finite numeric context window to cap.
 */
function applyContextCap(model: AnyModel | undefined): ApplyResult | undefined {
  if (!model) return undefined;

  const original = getOriginalContextWindow(model);

  // A missing or non-finite window would make Math.min() yield NaN, which
  // would then be written onto the model. Leave such models untouched.
  if (!Number.isFinite(original)) return undefined;

  const effective = Math.min(original, DEFAULT_MAX_CONTEXT_WINDOW);
  const changed = model.contextWindow !== effective;
  model.contextWindow = effective;

  return { changed, key: modelKey(model), original, effective };
}
|
|
45
|
+
|
|
46
|
+
/**
 * Puts a model's `contextWindow` back to its recorded original value.
 *
 * @param model - The model to restore; `undefined` is accepted and ignored.
 * @returns `true` only when the property was actually rewritten; `false` if
 *   there is no model, no recorded original, or the value already matches.
 */
function restoreContextWindow(model: AnyModel | undefined): boolean {
  if (!model) return false;

  const recorded = originalContextWindows.get(model);
  if (typeof recorded === "number" && model.contextWindow !== recorded) {
    model.contextWindow = recorded;
    return true;
  }

  return false;
}
|
|
55
|
+
|
|
56
|
+
/**
 * Invokes `callback` for each model returned by `ctx.modelRegistry.getAll()`.
 *
 * Any exception, whether from the registry or from the callback, is
 * swallowed and ends the iteration early.
 *
 * @param ctx - Extension context providing the model registry.
 * @param callback - Called once per registry model, in registry order.
 */
function forEachRegistryModel(ctx: ExtensionContext, callback: (model: AnyModel) => void): void {
  try {
    const registered = ctx.modelRegistry.getAll();
    for (const entry of registered) callback(entry);
  } catch {
    // Best effort only. The active ctx.model is handled separately by callers.
  }
}
|
|
65
|
+
|
|
66
|
+
/**
 * Applies the cap to every registry model and to the context's active model.
 *
 * @param ctx - Extension context supplying the registry and the active model.
 * @returns How many `applyContextCap` calls reported a changed window.
 */
function applyContextCapToSession(ctx: ExtensionContext): number {
  let cappedCount = 0;

  const capAndTally = (model: AnyModel | undefined): void => {
    if (applyContextCap(model)?.changed) cappedCount += 1;
  };

  forEachRegistryModel(ctx, capAndTally);
  // The active model is handled explicitly as well as via the registry pass.
  capAndTally(ctx.model);

  return cappedCount;
}
|
|
76
|
+
|
|
77
|
+
/**
 * Restores the original window on every registry model and on the context's
 * active model.
 *
 * @param ctx - Extension context supplying the registry and the active model.
 * @returns How many `restoreContextWindow` calls rewrote a window.
 */
function restoreContextCapForSession(ctx: ExtensionContext): number {
  let restoredCount = 0;

  const restoreAndTally = (model: AnyModel | undefined): void => {
    if (restoreContextWindow(model)) restoredCount += 1;
  };

  forEachRegistryModel(ctx, restoreAndTally);
  // The active model is handled explicitly as well as via the registry pass.
  restoreAndTally(ctx.model);

  return restoredCount;
}
|
|
87
|
+
|
|
88
|
+
/**
 * Formats a token count for display.
 *
 * @param tokens - The token count.
 * @returns Counts of 1000 or more as whole thousands with a `k` suffix
 *   (rounded to nearest); smaller counts as the plain number.
 */
function formatTokens(tokens: number): string {
  if (tokens >= 1000) {
    const thousands = Math.round(tokens / 1000);
    return `${thousands}k`;
  }

  return String(tokens);
}
|
|
91
|
+
|
|
92
|
+
/**
 * Extension entry point: caps model context windows while enabled and
 * registers the `/context-cap` command.
 *
 * The enabled flag lives in this function's closure and starts as `true` on
 * every invocation.
 *
 * Event handling:
 * - `session_start`: applies the cap to known models when enabled.
 * - `model_select`: caps the selected model when enabled; with a UI, shows a
 *   status entry if the model's original window exceeds the cap and clears it
 *   otherwise.
 * - `session_shutdown`: restores every window this module changed.
 *
 * @param pi - The extension API used to subscribe to events and register the command.
 */
export default function contextCapExtension(pi: ExtensionAPI) {
  let enabled = true;

  // Turns the cap on, applies it, and reports how many windows changed.
  const enableCap = (ctx: ExtensionContext): void => {
    enabled = true;
    const changed = applyContextCapToSession(ctx);
    ctx.ui.setStatus("context-cap", `ctx cap ${formatTokens(DEFAULT_MAX_CONTEXT_WINDOW)}`);
    ctx.ui.notify(`Context cap enabled (${changed} model window(s) capped/restored).`, "info");
  };

  // Turns the cap off, restores original windows, and clears the status entry.
  const disableCap = (ctx: ExtensionContext): void => {
    enabled = false;
    const changed = restoreContextCapForSession(ctx);
    ctx.ui.setStatus("context-cap", undefined);
    ctx.ui.notify(`Context cap disabled for this extension session (${changed} model window(s) restored).`, "info");
  };

  // Reports whether the cap is enabled and the active model's effective/original windows.
  const reportStatus = (ctx: ExtensionContext): void => {
    const model = ctx.model;
    const status = enabled ? "enabled" : "disabled";
    if (!model) {
      ctx.ui.notify(`Context cap is ${status}. No model selected.`, "info");
      return;
    }

    const original = getOriginalContextWindow(model);
    // While disabled, show whatever the model currently carries rather than the capped value.
    const effective = enabled ? getEffectiveContextWindow(model) : model.contextWindow;
    ctx.ui.notify(
      `Context cap is ${status}. Current model: ${modelKey(model)} (${formatTokens(effective)}/${formatTokens(original)} effective/original).`,
      "info",
    );
  };

  pi.on("session_start", async (_event, ctx) => {
    if (enabled) applyContextCapToSession(ctx);
  });

  pi.on("model_select", async (event, ctx) => {
    if (!enabled) return;

    const result = applyContextCap(event.model);
    if (!result || !ctx.hasUI) return;

    ctx.ui.setStatus(
      "context-cap",
      result.original > DEFAULT_MAX_CONTEXT_WINDOW
        ? `ctx cap ${formatTokens(result.effective)}/${formatTokens(result.original)}`
        : undefined,
    );
  });

  pi.on("session_shutdown", async (_event, ctx) => {
    restoreContextCapForSession(ctx);
    // Also restore models that were touched but are not reachable through this context.
    for (const model of touchedModels) restoreContextWindow(model);
  });

  pi.registerCommand("context-cap", {
    description: "Toggle the 200k effective context-window cap for auto-compaction",
    getArgumentCompletions: (prefix) => {
      const typed = prefix.trim();
      const matches = ["on", "off", "toggle", "status"].filter((command) => command.startsWith(typed));
      return matches.length > 0 ? matches.map((value) => ({ value, label: value })) : null;
    },
    handler: async (args, ctx) => {
      // An empty argument means "toggle".
      const action = args.trim().toLowerCase() || "toggle";

      switch (action) {
        case "on":
        case "enable":
          enableCap(ctx);
          return;
        case "off":
        case "disable":
          disableCap(ctx);
          return;
        case "toggle":
          if (enabled) disableCap(ctx);
          else enableCap(ctx);
          return;
        case "status":
          reportStatus(ctx);
          return;
        default:
          ctx.ui.notify("Usage: /context-cap on | off | toggle | status", "warning");
      }
    },
  });
}
|
|
@@ -0,0 +1,28 @@
|
|
|
1
|
+
{
|
|
2
|
+
"name": "@diegopetrucci/pi-context-cap",
|
|
3
|
+
"version": "0.1.0",
|
|
4
|
+
"description": "A pi extension that caps effective model context windows at 200k tokens for earlier auto-compaction.",
|
|
5
|
+
"keywords": ["pi-package", "pi", "context", "compaction"],
|
|
6
|
+
"license": "MIT",
|
|
7
|
+
"repository": {
|
|
8
|
+
"type": "git",
|
|
9
|
+
"url": "git+https://github.com/diegopetrucci/pi-extensions.git",
|
|
10
|
+
"directory": "extensions/context-cap"
|
|
11
|
+
},
|
|
12
|
+
"files": [
|
|
13
|
+
"index.ts",
|
|
14
|
+
"README.md"
|
|
15
|
+
],
|
|
16
|
+
"publishConfig": {
|
|
17
|
+
"access": "public"
|
|
18
|
+
},
|
|
19
|
+
"pi": {
|
|
20
|
+
"extensions": [
|
|
21
|
+
"index.ts"
|
|
22
|
+
]
|
|
23
|
+
},
|
|
24
|
+
"peerDependencies": {
|
|
25
|
+
"@earendil-works/pi-ai": "*",
|
|
26
|
+
"@earendil-works/pi-coding-agent": "*"
|
|
27
|
+
}
|
|
28
|
+
}
|
package/package.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@diegopetrucci/pi-extensions",
|
|
3
|
-
"version": "0.1.14",
|
|
4
|
-
"description": "A collection of pi extensions, including a minimal custom footer, an Amp-style oracle, a permission gate for dangerous bash commands, confirm-before-destructive session actions, and terminal notifications when pi is ready for input.",
|
|
3
|
+
"version": "0.1.15",
|
|
4
|
+
"description": "A collection of pi extensions, including a minimal custom footer, an Amp-style oracle, a 200k context cap for auto-compaction, a permission gate for dangerous bash commands, confirm-before-destructive session actions, and terminal notifications when pi is ready for input.",
|
|
5
5
|
"keywords": ["pi-package", "pi", "terminal", "agent"],
|
|
6
6
|
"license": "MIT",
|
|
7
7
|
"repository": {
|
|
@@ -30,6 +30,7 @@
|
|
|
30
30
|
"extensions": [
|
|
31
31
|
"./extensions/minimal-footer/index.ts",
|
|
32
32
|
"./extensions/oracle/index.ts",
|
|
33
|
+
"./extensions/context-cap/index.ts",
|
|
33
34
|
"./extensions/permission-gate/index.ts",
|
|
34
35
|
"./extensions/confirm-destructive/index.ts",
|
|
35
36
|
"./extensions/notify/index.ts"
|