npm - pi-cache-optimizer - Versions diffs - 2.2.1 → 2.3.0 - Mend

pi-cache-optimizer 2.2.1 → 2.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (2) hide show

package/index.ts +34 -0
package/package.json +1 -1

package/index.ts CHANGED Viewed

@@ -1433,6 +1433,40 @@ export default function (pi: ExtensionAPI) {
   });
   pi.on("before_agent_start", async (event, _ctx) => {
+    // ────────────────────────────────────────────────────────────────
+    // OpenAI Responses API bypass (codex-responses + responses)
+    //
+    // OpenAI's Responses API endpoints — both the Codex backend
+    // (openai-codex-responses, chatgpt.com) and the public
+    // Responses API (openai-responses, api.openai.com / Copilot) —
+    // have two properties that make client-side prompt reordering
+    // unnecessary and potentially harmful:
+    //
+    //  1. Server-managed caching: requests to both APIs carry
+    //     `prompt_cache_key` (= Pi session id) in the body, so the
+    //     server already maintains a stable cache without prefix
+    //     ordering. Client-side reordering adds no cache benefit.
+    //
+    //  2. Stricter content-safety filtering: the Codex backend in
+    //     particular has a product-level safety filter that flags
+    //     reordered prompts (tool snippets / guidelines lifted above
+    //     the assistant role) as potential prompt-injection, returning
+    //     `content_filter` and blocking tool calls (notably
+    //     `subagent`). The public Responses API shares the same
+    //     filter framework and could behave similarly.
+    //
+    // We therefore skip ALL prompt modifications (churn strip, skill
+    // compression, reorder) for these APIs. Third-party providers
+    // that use openai-completions are unaffected.
+    // ────────────────────────────────────────────────────────────────
+    const model = _ctx.model;
+    if (model) {
+      const api = lower(model.api);
+      if (api === "openai-codex-responses" || api === "openai-responses") {
+        return {};
+      }
+    }
     // Step 1: strip per-turn churn from <session-overview>.
     // Removing RECENT COMMITS, Working directory status, and
     // Journal line count makes more of the session-overview stable

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "pi-cache-optimizer",
-  "version": "2.2.1",
+  "version": "2.3.0",
   "description": "Pi extension that improves provider-side KV/prompt cache hit rates (DeepSeek, OpenAI, Claude, Gemini) by reordering the system prompt, requesting long retention, and showing footer cache stats. Renamed from pi-deepseek-cache-optimizer.",
   "keywords": [
     "pi-package",