@agentic-patterns/runtime 0.1.7 → 0.1.9
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.
- package/dist/index.cjs +4 -7
- package/dist/index.cjs.map +1 -1
- package/dist/index.d.cts +13 -8
- package/dist/index.d.ts +13 -8
- package/dist/index.js +4 -7
- package/dist/index.js.map +1 -1
- package/package.json +4 -14
package/dist/index.d.cts
CHANGED
|
@@ -1148,16 +1148,21 @@ declare const openrouterProvider: ProviderProtocol;
|
|
|
1148
1148
|
/**
|
|
1149
1149
|
* Ollama — local-only OSS models via HTTP.
|
|
1150
1150
|
*
|
|
1151
|
-
* Default tier map uses the
|
|
1152
|
-
* prioritizes tool-calling and keeps the same grammar across
|
|
1153
|
-
* agents scale between haiku↔sonnet↔opus without prompt
|
|
1151
|
+
* Default tier map uses the qwen3.5/3.6 families because Qwen's team
|
|
1152
|
+
* explicitly prioritizes tool-calling and keeps the same grammar across
|
|
1153
|
+
* sizes — so agents scale between haiku↔sonnet↔opus without prompt
|
|
1154
|
+
* changes. Three sizes selected from a single bench pass on a 4080 Super-
|
|
1155
|
+
* class box:
|
|
1154
1156
|
*
|
|
1155
|
-
*
|
|
1156
|
-
*
|
|
1157
|
-
*
|
|
1158
|
-
* haiku (4B dense) — ~3 GB VRAM, 100+ tok/s
|
|
1157
|
+
* opus (35B MoE, activates 3B/token) — 15.1 GB VRAM + 10.5 GB RAM spill, ~15 tok/s
|
|
1158
|
+
* sonnet (9B dense) — 8.2 GB VRAM, 0 spill, ~98 tok/s
|
|
1159
|
+
* haiku (4B dense) — 3.4 GB VRAM, 0 spill, ~145 tok/s
|
|
1159
1160
|
*
|
|
1160
|
-
*
|
|
1161
|
+
* The earlier qwen3:14b is in the same speed class as qwen3.5:9b and worse at most
|
|
1162
|
+
* tool-calling tasks; 3.5:9b is preferred for the sonnet slot.
|
|
1163
|
+
*
|
|
1164
|
+
* Override with `options.modelId` (or `AGENT_MODEL` env) for any other
|
|
1165
|
+
* family — the tier map is just the default when nothing is pinned.
|
|
1161
1166
|
*/
|
|
1162
1167
|
declare const ollamaProvider: ProviderProtocol;
|
|
1163
1168
|
|
package/dist/index.d.ts
CHANGED
|
@@ -1148,16 +1148,21 @@ declare const openrouterProvider: ProviderProtocol;
|
|
|
1148
1148
|
/**
|
|
1149
1149
|
* Ollama — local-only OSS models via HTTP.
|
|
1150
1150
|
*
|
|
1151
|
-
* Default tier map uses the
|
|
1152
|
-
* prioritizes tool-calling and keeps the same grammar across
|
|
1153
|
-
* agents scale between haiku↔sonnet↔opus without prompt
|
|
1151
|
+
* Default tier map uses the qwen3.5/3.6 families because Qwen's team
|
|
1152
|
+
* explicitly prioritizes tool-calling and keeps the same grammar across
|
|
1153
|
+
* sizes — so agents scale between haiku↔sonnet↔opus without prompt
|
|
1154
|
+
* changes. Three sizes selected from a single bench pass on a 4080 Super-
|
|
1155
|
+
* class box:
|
|
1154
1156
|
*
|
|
1155
|
-
*
|
|
1156
|
-
*
|
|
1157
|
-
*
|
|
1158
|
-
* haiku (4B dense) — ~3 GB VRAM, 100+ tok/s
|
|
1157
|
+
* opus (35B MoE, activates 3B/token) — 15.1 GB VRAM + 10.5 GB RAM spill, ~15 tok/s
|
|
1158
|
+
* sonnet (9B dense) — 8.2 GB VRAM, 0 spill, ~98 tok/s
|
|
1159
|
+
* haiku (4B dense) — 3.4 GB VRAM, 0 spill, ~145 tok/s
|
|
1159
1160
|
*
|
|
1160
|
-
*
|
|
1161
|
+
* The earlier qwen3:14b is in the same speed class as qwen3.5:9b and worse at most
|
|
1162
|
+
* tool-calling tasks; 3.5:9b is preferred for the sonnet slot.
|
|
1163
|
+
*
|
|
1164
|
+
* Override with `options.modelId` (or `AGENT_MODEL` env) for any other
|
|
1165
|
+
* family — the tier map is just the default when nothing is pinned.
|
|
1161
1166
|
*/
|
|
1162
1167
|
declare const ollamaProvider: ProviderProtocol;
|
|
1163
1168
|
|
package/dist/index.js
CHANGED
|
@@ -2149,10 +2149,7 @@ var ClaudeCodeAPIRunner = class extends ClaudeCodeRunner {
|
|
|
2149
2149
|
const sdkOpts = super._buildOptions(agent, options, context);
|
|
2150
2150
|
sdkOpts.tools = [];
|
|
2151
2151
|
if (this._extraDisallowed.length > 0) {
|
|
2152
|
-
sdkOpts.disallowedTools = [
|
|
2153
|
-
...sdkOpts.disallowedTools ?? [],
|
|
2154
|
-
...this._extraDisallowed
|
|
2155
|
-
];
|
|
2152
|
+
sdkOpts.disallowedTools = [...sdkOpts.disallowedTools ?? [], ...this._extraDisallowed];
|
|
2156
2153
|
}
|
|
2157
2154
|
if (!this._disableSandbox && this._isolatedConfigDir) {
|
|
2158
2155
|
const oauth = loadMaxSubOAuth();
|
|
@@ -2506,9 +2503,9 @@ var openrouterProvider = {
|
|
|
2506
2503
|
var ollamaProvider = {
|
|
2507
2504
|
name: "ollama",
|
|
2508
2505
|
tiers: {
|
|
2509
|
-
opus: "qwen3:
|
|
2510
|
-
sonnet: "qwen3:
|
|
2511
|
-
haiku: "qwen3:4b"
|
|
2506
|
+
opus: "qwen3.6:35b-a3b",
|
|
2507
|
+
sonnet: "qwen3.5:9b",
|
|
2508
|
+
haiku: "qwen3.5:4b"
|
|
2512
2509
|
},
|
|
2513
2510
|
envVars: ["OLLAMA_HOST"],
|
|
2514
2511
|
async load(modelId) {
|