@omnicross/core 0.1.0 → 0.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/ApiConverter.cjs +799 -0
- package/dist/ApiConverter.d.cts +82 -0
- package/dist/ApiConverter.d.ts +82 -0
- package/dist/ApiConverter.js +763 -0
- package/dist/BuiltinToolExecutor-BluWyeob.d.ts +81 -0
- package/dist/BuiltinToolExecutor-CS2WpXhM.d.cts +81 -0
- package/dist/CompletionService-7fCmKAP3.d.ts +212 -0
- package/dist/CompletionService-DtOF_War.d.cts +212 -0
- package/dist/{ProviderProxy-f_8ziIhW.d.cts → ProviderProxy-C-xqrkKi.d.ts} +7 -2
- package/dist/{ProviderProxy-vjt8sQQk.d.ts → ProviderProxy-CnMQYN59.d.cts} +7 -2
- package/dist/completion/BuiltinToolExecutor.cjs +327 -0
- package/dist/completion/BuiltinToolExecutor.d.cts +4 -0
- package/dist/completion/BuiltinToolExecutor.d.ts +4 -0
- package/dist/completion/BuiltinToolExecutor.js +296 -0
- package/dist/completion/CompletionService.cjs +3487 -0
- package/dist/completion/CompletionService.d.cts +21 -0
- package/dist/completion/CompletionService.d.ts +21 -0
- package/dist/completion/CompletionService.js +3461 -0
- package/dist/completion/NativeSearchInjector.cjs +196 -0
- package/dist/completion/NativeSearchInjector.d.cts +42 -0
- package/dist/completion/NativeSearchInjector.d.ts +42 -0
- package/dist/completion/NativeSearchInjector.js +167 -0
- package/dist/completion/ProviderSearchInjector.cjs +87 -0
- package/dist/completion/ProviderSearchInjector.d.cts +47 -0
- package/dist/completion/ProviderSearchInjector.d.ts +47 -0
- package/dist/completion/ProviderSearchInjector.js +60 -0
- package/dist/completion/native-search-types.cjs +67 -0
- package/dist/completion/native-search-types.d.cts +3 -0
- package/dist/completion/native-search-types.d.ts +3 -0
- package/dist/completion/native-search-types.js +38 -0
- package/dist/completion/openrouter-headers.cjs +72 -0
- package/dist/completion/openrouter-headers.d.cts +44 -0
- package/dist/completion/openrouter-headers.d.ts +44 -0
- package/dist/completion/openrouter-headers.js +42 -0
- package/dist/completion/openrouter-models.cjs +86 -0
- package/dist/completion/openrouter-models.d.cts +27 -0
- package/dist/completion/openrouter-models.d.ts +27 -0
- package/dist/completion/openrouter-models.js +59 -0
- package/dist/completion/types.cjs +18 -0
- package/dist/completion/types.d.cts +3 -0
- package/dist/completion/types.d.ts +3 -0
- package/dist/completion/types.js +0 -0
- package/dist/completion/url-builder.cjs +138 -0
- package/dist/completion/url-builder.d.cts +87 -0
- package/dist/completion/url-builder.d.ts +87 -0
- package/dist/completion/url-builder.js +104 -0
- package/dist/completion.d.cts +148 -7
- package/dist/completion.d.ts +148 -7
- package/dist/index.cjs +1 -0
- package/dist/index.d.cts +27 -90
- package/dist/index.d.ts +27 -90
- package/dist/index.js +1 -0
- package/dist/outbound-api/routeResolver.cjs +221 -0
- package/dist/outbound-api/routeResolver.d.cts +18 -0
- package/dist/outbound-api/routeResolver.d.ts +18 -0
- package/dist/outbound-api/routeResolver.js +192 -0
- package/dist/outbound-api/subscriptionRegistryPort.d.cts +5 -2
- package/dist/outbound-api/subscriptionRegistryPort.d.ts +5 -2
- package/dist/outbound-api/types.cjs +18 -0
- package/dist/{types-CbCN2NQP.d.ts → outbound-api/types.d.cts} +17 -3
- package/dist/{types-CGGrKqC_.d.cts → outbound-api/types.d.ts} +17 -3
- package/dist/outbound-api/types.js +0 -0
- package/dist/outbound-api.cjs +1 -0
- package/dist/outbound-api.d.cts +14 -87
- package/dist/outbound-api.d.ts +14 -87
- package/dist/outbound-api.js +1 -0
- package/dist/pipeline/AuthSource.cjs +18 -0
- package/dist/pipeline/AuthSource.d.cts +101 -0
- package/dist/pipeline/AuthSource.d.ts +101 -0
- package/dist/pipeline/AuthSource.js +0 -0
- package/dist/pipeline/LlmConfigProviderAuth.cjs +169 -0
- package/dist/pipeline/LlmConfigProviderAuth.d.cts +86 -0
- package/dist/pipeline/LlmConfigProviderAuth.d.ts +86 -0
- package/dist/pipeline/LlmConfigProviderAuth.js +142 -0
- package/dist/pipeline/SubscriptionAuthSource.d.cts +165 -3
- package/dist/pipeline/SubscriptionAuthSource.d.ts +165 -3
- package/dist/pipeline/executeProviderCall.cjs +70 -0
- package/dist/pipeline/executeProviderCall.d.cts +149 -0
- package/dist/pipeline/executeProviderCall.d.ts +149 -0
- package/dist/pipeline/executeProviderCall.js +45 -0
- package/dist/pipeline/resolveProviderChain.cjs +47 -0
- package/dist/pipeline/resolveProviderChain.d.cts +58 -0
- package/dist/pipeline/resolveProviderChain.d.ts +58 -0
- package/dist/pipeline/resolveProviderChain.js +22 -0
- package/dist/pipeline/resolveSubscriptionChain.cjs +68 -0
- package/dist/pipeline/resolveSubscriptionChain.d.cts +68 -0
- package/dist/pipeline/resolveSubscriptionChain.d.ts +68 -0
- package/dist/pipeline/resolveSubscriptionChain.js +43 -0
- package/dist/ports/provider-config-source.cjs +18 -0
- package/dist/ports/provider-config-source.d.cts +51 -0
- package/dist/ports/provider-config-source.d.ts +51 -0
- package/dist/ports/provider-config-source.js +0 -0
- package/dist/ports/web-search-backend.cjs +18 -0
- package/dist/ports/web-search-backend.d.cts +29 -0
- package/dist/ports/web-search-backend.d.ts +29 -0
- package/dist/ports/web-search-backend.js +0 -0
- package/dist/ports.d.cts +10 -7
- package/dist/ports.d.ts +10 -7
- package/dist/provider-proxy/ProviderProxy.cjs +4643 -0
- package/dist/provider-proxy/ProviderProxy.d.cts +16 -0
- package/dist/provider-proxy/ProviderProxy.d.ts +16 -0
- package/dist/provider-proxy/ProviderProxy.js +4618 -0
- package/dist/provider-proxy/ingress/providerProxyShared.d.cts +5 -2
- package/dist/provider-proxy/ingress/providerProxyShared.d.ts +5 -2
- package/dist/provider-proxy/types.d.cts +406 -8
- package/dist/provider-proxy/types.d.ts +406 -8
- package/dist/provider-proxy.cjs +1 -0
- package/dist/provider-proxy.d.cts +8 -5
- package/dist/provider-proxy.d.ts +8 -5
- package/dist/provider-proxy.js +1 -0
- package/dist/routeResolver-BrbK6ja9.d.cts +88 -0
- package/dist/routeResolver-HE-ZO0fO.d.ts +88 -0
- package/dist/transformer/anthropicBetaInject.cjs +51 -0
- package/dist/transformer/anthropicBetaInject.d.cts +20 -0
- package/dist/transformer/anthropicBetaInject.d.ts +20 -0
- package/dist/transformer/anthropicBetaInject.js +25 -0
- package/dist/transformer/transformers/AnthropicTransformer.cjs +1017 -0
- package/dist/transformer/transformers/AnthropicTransformer.d.cts +148 -0
- package/dist/transformer/transformers/AnthropicTransformer.d.ts +148 -0
- package/dist/transformer/transformers/AnthropicTransformer.js +990 -0
- package/dist/transformer/transformers/ReasoningTransformer.cjs +273 -0
- package/dist/transformer/transformers/ReasoningTransformer.d.cts +47 -0
- package/dist/transformer/transformers/ReasoningTransformer.d.ts +47 -0
- package/dist/transformer/transformers/ReasoningTransformer.js +253 -0
- package/dist/transformer/transformers.cjs +3206 -0
- package/dist/transformer/transformers.d.cts +100 -0
- package/dist/transformer/transformers.d.ts +100 -0
- package/dist/transformer/transformers.js +3174 -0
- package/dist/transformer.d.cts +8 -31
- package/dist/transformer.d.ts +8 -31
- package/dist/types-BScIHmPr.d.cts +153 -0
- package/dist/types-BScIHmPr.d.ts +153 -0
- package/package.json +3 -3
- package/dist/SubscriptionAuthSource-Cr4fVEYY.d.cts +0 -264
- package/dist/SubscriptionAuthSource-D89zmiSS.d.ts +0 -264
- package/dist/index-BTSmc9Sm.d.ts +0 -645
- package/dist/index-DXazdTzZ.d.cts +0 -645
- package/dist/types-DCzHkhJt.d.ts +0 -467
- package/dist/types-DZIQbgp0.d.cts +0 -467
|
@@ -0,0 +1,273 @@
|
|
|
1
|
+
"use strict";
|
|
2
|
+
var __defProp = Object.defineProperty;
|
|
3
|
+
var __getOwnPropDesc = Object.getOwnPropertyDescriptor;
|
|
4
|
+
var __getOwnPropNames = Object.getOwnPropertyNames;
|
|
5
|
+
var __hasOwnProp = Object.prototype.hasOwnProperty;
|
|
6
|
+
var __export = (target, all) => {
|
|
7
|
+
for (var name in all)
|
|
8
|
+
__defProp(target, name, { get: all[name], enumerable: true });
|
|
9
|
+
};
|
|
10
|
+
var __copyProps = (to, from, except, desc) => {
|
|
11
|
+
if (from && typeof from === "object" || typeof from === "function") {
|
|
12
|
+
for (let key of __getOwnPropNames(from))
|
|
13
|
+
if (!__hasOwnProp.call(to, key) && key !== except)
|
|
14
|
+
__defProp(to, key, { get: () => from[key], enumerable: !(desc = __getOwnPropDesc(from, key)) || desc.enumerable });
|
|
15
|
+
}
|
|
16
|
+
return to;
|
|
17
|
+
};
|
|
18
|
+
var __toCommonJS = (mod) => __copyProps(__defProp({}, "__esModule", { value: true }), mod);
|
|
19
|
+
|
|
20
|
+
// src/transformer/transformers/ReasoningTransformer.ts
|
|
21
|
+
var ReasoningTransformer_exports = {};
|
|
22
|
+
__export(ReasoningTransformer_exports, {
|
|
23
|
+
ReasoningTransformer: () => ReasoningTransformer
|
|
24
|
+
});
|
|
25
|
+
module.exports = __toCommonJS(ReasoningTransformer_exports);
|
|
26
|
+
var import_thinking_config = require("@omnicross/contracts/thinking-config");
|
|
27
|
+
var ReasoningTransformer = class {
|
|
28
|
+
static TransformerName = "reasoning";
|
|
29
|
+
name = "reasoning";
|
|
30
|
+
logger;
|
|
31
|
+
enabled;
|
|
32
|
+
constructor(options) {
|
|
33
|
+
this.enabled = options?.enable !== false;
|
|
34
|
+
}
|
|
35
|
+
/**
|
|
36
|
+
* Transform request: convert reasoning config to thinking parameters
|
|
37
|
+
* Uses model-specific budget calculation based on effort level
|
|
38
|
+
*/
|
|
39
|
+
async transformRequestIn(request, provider, _context) {
|
|
40
|
+
const extendedRequest = request;
|
|
41
|
+
const modelId = request.model;
|
|
42
|
+
if (!this.enabled) {
|
|
43
|
+
extendedRequest.thinking = {
|
|
44
|
+
type: "disabled",
|
|
45
|
+
budget_tokens: -1
|
|
46
|
+
};
|
|
47
|
+
extendedRequest.enable_thinking = false;
|
|
48
|
+
return extendedRequest;
|
|
49
|
+
}
|
|
50
|
+
if (request.reasoning) {
|
|
51
|
+
const effortLevel = request.reasoning.effort || "none";
|
|
52
|
+
const userMaxTokens = request.reasoning.max_tokens || request.max_tokens;
|
|
53
|
+
const calculatedBudget = (0, import_thinking_config.calculateThinkingBudget)(modelId, effortLevel, userMaxTokens);
|
|
54
|
+
const providerName = provider.name?.toLowerCase() || "";
|
|
55
|
+
if (providerName === "anthropic" || providerName.includes("claude")) {
|
|
56
|
+
const thinkingConfig = (0, import_thinking_config.buildAnthropicThinking)(modelId, effortLevel, userMaxTokens);
|
|
57
|
+
if (thinkingConfig) {
|
|
58
|
+
extendedRequest.thinking = thinkingConfig;
|
|
59
|
+
} else {
|
|
60
|
+
extendedRequest.thinking = {
|
|
61
|
+
type: "disabled"
|
|
62
|
+
};
|
|
63
|
+
}
|
|
64
|
+
} else if (providerName === "openai" || modelId.match(/^o[134]/i)) {
|
|
65
|
+
const reasoningEffort = (0, import_thinking_config.getOpenAIReasoningEffort)(effortLevel);
|
|
66
|
+
if (reasoningEffort) {
|
|
67
|
+
extendedRequest.reasoning_effort = reasoningEffort;
|
|
68
|
+
}
|
|
69
|
+
extendedRequest.thinking = {
|
|
70
|
+
type: effortLevel === "none" ? "disabled" : "enabled",
|
|
71
|
+
budget_tokens: calculatedBudget
|
|
72
|
+
};
|
|
73
|
+
} else if (providerName === "deepseek" && modelId?.startsWith("deepseek-v4")) {
|
|
74
|
+
extendedRequest.thinking = {
|
|
75
|
+
type: effortLevel === "none" ? "disabled" : "enabled",
|
|
76
|
+
budget_tokens: calculatedBudget
|
|
77
|
+
};
|
|
78
|
+
if (effortLevel !== "none") {
|
|
79
|
+
extendedRequest.reasoning_effort = effortLevel === "high" ? "max" : "high";
|
|
80
|
+
}
|
|
81
|
+
} else if (providerName === "deepseek" || providerName === "qwen" || providerName === "alibaba") {
|
|
82
|
+
const qwenConfig = (0, import_thinking_config.buildQwenThinkingConfig)(effortLevel, userMaxTokens);
|
|
83
|
+
extendedRequest.enable_thinking = qwenConfig.enable_thinking;
|
|
84
|
+
if (qwenConfig.thinking_budget) {
|
|
85
|
+
extendedRequest.thinking_budget = qwenConfig.thinking_budget;
|
|
86
|
+
}
|
|
87
|
+
extendedRequest.thinking = {
|
|
88
|
+
type: qwenConfig.enable_thinking ? "enabled" : "disabled",
|
|
89
|
+
budget_tokens: calculatedBudget
|
|
90
|
+
};
|
|
91
|
+
} else {
|
|
92
|
+
extendedRequest.thinking = {
|
|
93
|
+
type: effortLevel === "none" ? "disabled" : "enabled",
|
|
94
|
+
budget_tokens: calculatedBudget
|
|
95
|
+
};
|
|
96
|
+
extendedRequest.enable_thinking = effortLevel !== "none";
|
|
97
|
+
}
|
|
98
|
+
this.logger?.debug(`[ReasoningTransformer] Model: ${modelId}, Effort: ${effortLevel}, Budget: ${calculatedBudget}`);
|
|
99
|
+
}
|
|
100
|
+
return extendedRequest;
|
|
101
|
+
}
|
|
102
|
+
/**
|
|
103
|
+
* Transform response: convert reasoning_content to thinking blocks
|
|
104
|
+
*/
|
|
105
|
+
async transformResponseOut(response, _context) {
|
|
106
|
+
if (!this.enabled) return response;
|
|
107
|
+
const contentType = response.headers.get("Content-Type") ?? "";
|
|
108
|
+
if (contentType.includes("application/json")) {
|
|
109
|
+
return this.handleJsonResponse(response);
|
|
110
|
+
} else if (contentType.includes("stream") || contentType.includes("text/event-stream")) {
|
|
111
|
+
return this.handleStreamResponse(response);
|
|
112
|
+
}
|
|
113
|
+
return response;
|
|
114
|
+
}
|
|
115
|
+
/**
|
|
116
|
+
* Handle JSON (non-streaming) response
|
|
117
|
+
*/
|
|
118
|
+
async handleJsonResponse(response) {
|
|
119
|
+
const jsonResponse = await response.json();
|
|
120
|
+
if (jsonResponse.choices?.[0]?.message?.reasoning_content) {
|
|
121
|
+
jsonResponse.thinking = {
|
|
122
|
+
content: jsonResponse.choices[0].message.reasoning_content
|
|
123
|
+
};
|
|
124
|
+
delete jsonResponse.choices[0].message.reasoning_content;
|
|
125
|
+
}
|
|
126
|
+
return new Response(JSON.stringify(jsonResponse), {
|
|
127
|
+
status: response.status,
|
|
128
|
+
statusText: response.statusText,
|
|
129
|
+
headers: response.headers
|
|
130
|
+
});
|
|
131
|
+
}
|
|
132
|
+
/**
|
|
133
|
+
* Handle streaming response - convert reasoning_content to thinking blocks
|
|
134
|
+
*/
|
|
135
|
+
handleStreamResponse(response) {
|
|
136
|
+
if (!response.body) {
|
|
137
|
+
return response;
|
|
138
|
+
}
|
|
139
|
+
const decoder = new TextDecoder();
|
|
140
|
+
const encoder = new TextEncoder();
|
|
141
|
+
let reasoningContent = "";
|
|
142
|
+
let isReasoningComplete = false;
|
|
143
|
+
let buffer = "";
|
|
144
|
+
const stream = new ReadableStream({
|
|
145
|
+
start: async (controller) => {
|
|
146
|
+
const reader = response.body.getReader();
|
|
147
|
+
const processLine = (line) => {
|
|
148
|
+
this.logger?.debug("Processing reasoning line:", line);
|
|
149
|
+
if (line.startsWith("data: ") && line.trim() !== "data: [DONE]") {
|
|
150
|
+
try {
|
|
151
|
+
const data = JSON.parse(line.slice(6));
|
|
152
|
+
if (data.choices?.[0]?.delta?.reasoning_content) {
|
|
153
|
+
reasoningContent += data.choices[0].delta.reasoning_content;
|
|
154
|
+
const thinkingChunk = {
|
|
155
|
+
...data,
|
|
156
|
+
choices: [
|
|
157
|
+
{
|
|
158
|
+
...data.choices[0],
|
|
159
|
+
delta: {
|
|
160
|
+
...data.choices[0].delta,
|
|
161
|
+
thinking: {
|
|
162
|
+
content: data.choices[0].delta.reasoning_content
|
|
163
|
+
}
|
|
164
|
+
}
|
|
165
|
+
}
|
|
166
|
+
]
|
|
167
|
+
};
|
|
168
|
+
delete thinkingChunk.choices[0].delta.reasoning_content;
|
|
169
|
+
const thinkingLine = `data: ${JSON.stringify(thinkingChunk)}
|
|
170
|
+
|
|
171
|
+
`;
|
|
172
|
+
controller.enqueue(encoder.encode(thinkingLine));
|
|
173
|
+
return;
|
|
174
|
+
}
|
|
175
|
+
if ((data.choices?.[0]?.delta?.content || data.choices?.[0]?.delta?.tool_calls) && reasoningContent && !isReasoningComplete) {
|
|
176
|
+
isReasoningComplete = true;
|
|
177
|
+
const signature = Date.now().toString();
|
|
178
|
+
const thinkingChunk = {
|
|
179
|
+
...data,
|
|
180
|
+
choices: [
|
|
181
|
+
{
|
|
182
|
+
...data.choices[0],
|
|
183
|
+
delta: {
|
|
184
|
+
...data.choices[0].delta,
|
|
185
|
+
content: null,
|
|
186
|
+
thinking: {
|
|
187
|
+
signature
|
|
188
|
+
}
|
|
189
|
+
}
|
|
190
|
+
}
|
|
191
|
+
]
|
|
192
|
+
};
|
|
193
|
+
delete thinkingChunk.choices[0].delta.reasoning_content;
|
|
194
|
+
const thinkingLine = `data: ${JSON.stringify(thinkingChunk)}
|
|
195
|
+
|
|
196
|
+
`;
|
|
197
|
+
controller.enqueue(encoder.encode(thinkingLine));
|
|
198
|
+
}
|
|
199
|
+
if (data.choices?.[0]?.delta?.reasoning_content) {
|
|
200
|
+
delete data.choices[0].delta.reasoning_content;
|
|
201
|
+
}
|
|
202
|
+
if (data.choices?.[0]?.delta && Object.keys(data.choices[0].delta).length > 0) {
|
|
203
|
+
if (isReasoningComplete) {
|
|
204
|
+
data.choices[0].index++;
|
|
205
|
+
}
|
|
206
|
+
const modifiedLine = `data: ${JSON.stringify(data)}
|
|
207
|
+
|
|
208
|
+
`;
|
|
209
|
+
controller.enqueue(encoder.encode(modifiedLine));
|
|
210
|
+
}
|
|
211
|
+
} catch (_e) {
|
|
212
|
+
controller.enqueue(encoder.encode(line + "\n"));
|
|
213
|
+
}
|
|
214
|
+
} else {
|
|
215
|
+
controller.enqueue(encoder.encode(line + "\n"));
|
|
216
|
+
}
|
|
217
|
+
};
|
|
218
|
+
try {
|
|
219
|
+
while (true) {
|
|
220
|
+
const { done, value } = await reader.read();
|
|
221
|
+
if (done) {
|
|
222
|
+
if (buffer.trim()) {
|
|
223
|
+
const lines2 = buffer.split("\n");
|
|
224
|
+
for (const line of lines2) {
|
|
225
|
+
if (line.trim()) {
|
|
226
|
+
controller.enqueue(encoder.encode(line + "\n"));
|
|
227
|
+
}
|
|
228
|
+
}
|
|
229
|
+
}
|
|
230
|
+
break;
|
|
231
|
+
}
|
|
232
|
+
const chunk = decoder.decode(value, { stream: true });
|
|
233
|
+
buffer += chunk;
|
|
234
|
+
const lines = buffer.split("\n");
|
|
235
|
+
buffer = lines.pop() || "";
|
|
236
|
+
for (const line of lines) {
|
|
237
|
+
if (!line.trim()) continue;
|
|
238
|
+
try {
|
|
239
|
+
processLine(line);
|
|
240
|
+
} catch (error) {
|
|
241
|
+
this.logger?.error("Error processing reasoning stream line:", error);
|
|
242
|
+
controller.enqueue(encoder.encode(line + "\n"));
|
|
243
|
+
}
|
|
244
|
+
}
|
|
245
|
+
}
|
|
246
|
+
} catch (error) {
|
|
247
|
+
this.logger?.error("Reasoning stream error:", error);
|
|
248
|
+
controller.error(error);
|
|
249
|
+
} finally {
|
|
250
|
+
try {
|
|
251
|
+
reader.releaseLock();
|
|
252
|
+
} catch (e) {
|
|
253
|
+
this.logger?.error("Error releasing reader lock:", e);
|
|
254
|
+
}
|
|
255
|
+
controller.close();
|
|
256
|
+
}
|
|
257
|
+
}
|
|
258
|
+
});
|
|
259
|
+
return new Response(stream, {
|
|
260
|
+
status: response.status,
|
|
261
|
+
statusText: response.statusText,
|
|
262
|
+
headers: new Headers({
|
|
263
|
+
"Content-Type": "text/event-stream",
|
|
264
|
+
"Cache-Control": "no-cache",
|
|
265
|
+
Connection: "keep-alive"
|
|
266
|
+
})
|
|
267
|
+
});
|
|
268
|
+
}
|
|
269
|
+
};
|
|
270
|
+
// Annotate the CommonJS export names for ESM import in node:
|
|
271
|
+
0 && (module.exports = {
|
|
272
|
+
ReasoningTransformer
|
|
273
|
+
});
|
|
@@ -0,0 +1,47 @@
|
|
|
1
|
+
import { Transformer, TransformerLogger, TransformerOptions, UnifiedChatRequest, LLMProvider, TransformerContext } from '../types.cjs';
|
|
2
|
+
|
|
3
|
+
/**
|
|
4
|
+
* ReasoningTransformer - Transformer for reasoning/thinking mode support
|
|
5
|
+
*
|
|
6
|
+
* Handles:
|
|
7
|
+
* - Converting reasoning config to thinking API parameters
|
|
8
|
+
* - Converting reasoning_content in responses to thinking blocks
|
|
9
|
+
* - Calculating thinking budget based on model and effort level
|
|
10
|
+
*
|
|
11
|
+
* @module transformer/transformers/ReasoningTransformer
|
|
12
|
+
*/
|
|
13
|
+
|
|
14
|
+
/**
|
|
15
|
+
* ReasoningTransformer handles reasoning/thinking mode for compatible models
|
|
16
|
+
*
|
|
17
|
+
* Features:
|
|
18
|
+
* - Converts reasoning config to thinking API parameters
|
|
19
|
+
* - Can be enabled/disabled via options
|
|
20
|
+
* - Converts reasoning_content in stream responses to thinking blocks
|
|
21
|
+
*/
|
|
22
|
+
declare class ReasoningTransformer implements Transformer {
|
|
23
|
+
static TransformerName: string;
|
|
24
|
+
name: string;
|
|
25
|
+
logger?: TransformerLogger;
|
|
26
|
+
private enabled;
|
|
27
|
+
constructor(options?: TransformerOptions);
|
|
28
|
+
/**
|
|
29
|
+
* Transform request: convert reasoning config to thinking parameters
|
|
30
|
+
* Uses model-specific budget calculation based on effort level
|
|
31
|
+
*/
|
|
32
|
+
transformRequestIn(request: UnifiedChatRequest, provider: LLMProvider, _context: TransformerContext): Promise<Record<string, unknown>>;
|
|
33
|
+
/**
|
|
34
|
+
* Transform response: convert reasoning_content to thinking blocks
|
|
35
|
+
*/
|
|
36
|
+
transformResponseOut(response: Response, _context: TransformerContext): Promise<Response>;
|
|
37
|
+
/**
|
|
38
|
+
* Handle JSON (non-streaming) response
|
|
39
|
+
*/
|
|
40
|
+
private handleJsonResponse;
|
|
41
|
+
/**
|
|
42
|
+
* Handle streaming response - convert reasoning_content to thinking blocks
|
|
43
|
+
*/
|
|
44
|
+
private handleStreamResponse;
|
|
45
|
+
}
|
|
46
|
+
|
|
47
|
+
export { ReasoningTransformer };
|
|
@@ -0,0 +1,47 @@
|
|
|
1
|
+
import { Transformer, TransformerLogger, TransformerOptions, UnifiedChatRequest, LLMProvider, TransformerContext } from '../types.js';
|
|
2
|
+
|
|
3
|
+
/**
|
|
4
|
+
* ReasoningTransformer - Transformer for reasoning/thinking mode support
|
|
5
|
+
*
|
|
6
|
+
* Handles:
|
|
7
|
+
* - Converting reasoning config to thinking API parameters
|
|
8
|
+
* - Converting reasoning_content in responses to thinking blocks
|
|
9
|
+
* - Calculating thinking budget based on model and effort level
|
|
10
|
+
*
|
|
11
|
+
* @module transformer/transformers/ReasoningTransformer
|
|
12
|
+
*/
|
|
13
|
+
|
|
14
|
+
/**
|
|
15
|
+
* ReasoningTransformer handles reasoning/thinking mode for compatible models
|
|
16
|
+
*
|
|
17
|
+
* Features:
|
|
18
|
+
* - Converts reasoning config to thinking API parameters
|
|
19
|
+
* - Can be enabled/disabled via options
|
|
20
|
+
* - Converts reasoning_content in stream responses to thinking blocks
|
|
21
|
+
*/
|
|
22
|
+
declare class ReasoningTransformer implements Transformer {
|
|
23
|
+
static TransformerName: string;
|
|
24
|
+
name: string;
|
|
25
|
+
logger?: TransformerLogger;
|
|
26
|
+
private enabled;
|
|
27
|
+
constructor(options?: TransformerOptions);
|
|
28
|
+
/**
|
|
29
|
+
* Transform request: convert reasoning config to thinking parameters
|
|
30
|
+
* Uses model-specific budget calculation based on effort level
|
|
31
|
+
*/
|
|
32
|
+
transformRequestIn(request: UnifiedChatRequest, provider: LLMProvider, _context: TransformerContext): Promise<Record<string, unknown>>;
|
|
33
|
+
/**
|
|
34
|
+
* Transform response: convert reasoning_content to thinking blocks
|
|
35
|
+
*/
|
|
36
|
+
transformResponseOut(response: Response, _context: TransformerContext): Promise<Response>;
|
|
37
|
+
/**
|
|
38
|
+
* Handle JSON (non-streaming) response
|
|
39
|
+
*/
|
|
40
|
+
private handleJsonResponse;
|
|
41
|
+
/**
|
|
42
|
+
* Handle streaming response - convert reasoning_content to thinking blocks
|
|
43
|
+
*/
|
|
44
|
+
private handleStreamResponse;
|
|
45
|
+
}
|
|
46
|
+
|
|
47
|
+
export { ReasoningTransformer };
|
|
@@ -0,0 +1,253 @@
|
|
|
1
|
+
// src/transformer/transformers/ReasoningTransformer.ts
|
|
2
|
+
import {
|
|
3
|
+
buildAnthropicThinking,
|
|
4
|
+
buildQwenThinkingConfig,
|
|
5
|
+
calculateThinkingBudget,
|
|
6
|
+
getOpenAIReasoningEffort
|
|
7
|
+
} from "@omnicross/contracts/thinking-config";
|
|
8
|
+
var ReasoningTransformer = class {
|
|
9
|
+
static TransformerName = "reasoning";
|
|
10
|
+
name = "reasoning";
|
|
11
|
+
logger;
|
|
12
|
+
enabled;
|
|
13
|
+
constructor(options) {
|
|
14
|
+
this.enabled = options?.enable !== false;
|
|
15
|
+
}
|
|
16
|
+
/**
|
|
17
|
+
* Transform request: convert reasoning config to thinking parameters
|
|
18
|
+
* Uses model-specific budget calculation based on effort level
|
|
19
|
+
*/
|
|
20
|
+
async transformRequestIn(request, provider, _context) {
|
|
21
|
+
const extendedRequest = request;
|
|
22
|
+
const modelId = request.model;
|
|
23
|
+
if (!this.enabled) {
|
|
24
|
+
extendedRequest.thinking = {
|
|
25
|
+
type: "disabled",
|
|
26
|
+
budget_tokens: -1
|
|
27
|
+
};
|
|
28
|
+
extendedRequest.enable_thinking = false;
|
|
29
|
+
return extendedRequest;
|
|
30
|
+
}
|
|
31
|
+
if (request.reasoning) {
|
|
32
|
+
const effortLevel = request.reasoning.effort || "none";
|
|
33
|
+
const userMaxTokens = request.reasoning.max_tokens || request.max_tokens;
|
|
34
|
+
const calculatedBudget = calculateThinkingBudget(modelId, effortLevel, userMaxTokens);
|
|
35
|
+
const providerName = provider.name?.toLowerCase() || "";
|
|
36
|
+
if (providerName === "anthropic" || providerName.includes("claude")) {
|
|
37
|
+
const thinkingConfig = buildAnthropicThinking(modelId, effortLevel, userMaxTokens);
|
|
38
|
+
if (thinkingConfig) {
|
|
39
|
+
extendedRequest.thinking = thinkingConfig;
|
|
40
|
+
} else {
|
|
41
|
+
extendedRequest.thinking = {
|
|
42
|
+
type: "disabled"
|
|
43
|
+
};
|
|
44
|
+
}
|
|
45
|
+
} else if (providerName === "openai" || modelId.match(/^o[134]/i)) {
|
|
46
|
+
const reasoningEffort = getOpenAIReasoningEffort(effortLevel);
|
|
47
|
+
if (reasoningEffort) {
|
|
48
|
+
extendedRequest.reasoning_effort = reasoningEffort;
|
|
49
|
+
}
|
|
50
|
+
extendedRequest.thinking = {
|
|
51
|
+
type: effortLevel === "none" ? "disabled" : "enabled",
|
|
52
|
+
budget_tokens: calculatedBudget
|
|
53
|
+
};
|
|
54
|
+
} else if (providerName === "deepseek" && modelId?.startsWith("deepseek-v4")) {
|
|
55
|
+
extendedRequest.thinking = {
|
|
56
|
+
type: effortLevel === "none" ? "disabled" : "enabled",
|
|
57
|
+
budget_tokens: calculatedBudget
|
|
58
|
+
};
|
|
59
|
+
if (effortLevel !== "none") {
|
|
60
|
+
extendedRequest.reasoning_effort = effortLevel === "high" ? "max" : "high";
|
|
61
|
+
}
|
|
62
|
+
} else if (providerName === "deepseek" || providerName === "qwen" || providerName === "alibaba") {
|
|
63
|
+
const qwenConfig = buildQwenThinkingConfig(effortLevel, userMaxTokens);
|
|
64
|
+
extendedRequest.enable_thinking = qwenConfig.enable_thinking;
|
|
65
|
+
if (qwenConfig.thinking_budget) {
|
|
66
|
+
extendedRequest.thinking_budget = qwenConfig.thinking_budget;
|
|
67
|
+
}
|
|
68
|
+
extendedRequest.thinking = {
|
|
69
|
+
type: qwenConfig.enable_thinking ? "enabled" : "disabled",
|
|
70
|
+
budget_tokens: calculatedBudget
|
|
71
|
+
};
|
|
72
|
+
} else {
|
|
73
|
+
extendedRequest.thinking = {
|
|
74
|
+
type: effortLevel === "none" ? "disabled" : "enabled",
|
|
75
|
+
budget_tokens: calculatedBudget
|
|
76
|
+
};
|
|
77
|
+
extendedRequest.enable_thinking = effortLevel !== "none";
|
|
78
|
+
}
|
|
79
|
+
this.logger?.debug(`[ReasoningTransformer] Model: ${modelId}, Effort: ${effortLevel}, Budget: ${calculatedBudget}`);
|
|
80
|
+
}
|
|
81
|
+
return extendedRequest;
|
|
82
|
+
}
|
|
83
|
+
/**
|
|
84
|
+
* Transform response: convert reasoning_content to thinking blocks
|
|
85
|
+
*/
|
|
86
|
+
async transformResponseOut(response, _context) {
|
|
87
|
+
if (!this.enabled) return response;
|
|
88
|
+
const contentType = response.headers.get("Content-Type") ?? "";
|
|
89
|
+
if (contentType.includes("application/json")) {
|
|
90
|
+
return this.handleJsonResponse(response);
|
|
91
|
+
} else if (contentType.includes("stream") || contentType.includes("text/event-stream")) {
|
|
92
|
+
return this.handleStreamResponse(response);
|
|
93
|
+
}
|
|
94
|
+
return response;
|
|
95
|
+
}
|
|
96
|
+
/**
|
|
97
|
+
* Handle JSON (non-streaming) response
|
|
98
|
+
*/
|
|
99
|
+
async handleJsonResponse(response) {
|
|
100
|
+
const jsonResponse = await response.json();
|
|
101
|
+
if (jsonResponse.choices?.[0]?.message?.reasoning_content) {
|
|
102
|
+
jsonResponse.thinking = {
|
|
103
|
+
content: jsonResponse.choices[0].message.reasoning_content
|
|
104
|
+
};
|
|
105
|
+
delete jsonResponse.choices[0].message.reasoning_content;
|
|
106
|
+
}
|
|
107
|
+
return new Response(JSON.stringify(jsonResponse), {
|
|
108
|
+
status: response.status,
|
|
109
|
+
statusText: response.statusText,
|
|
110
|
+
headers: response.headers
|
|
111
|
+
});
|
|
112
|
+
}
|
|
113
|
+
/**
|
|
114
|
+
* Handle streaming response - convert reasoning_content to thinking blocks
|
|
115
|
+
*/
|
|
116
|
+
handleStreamResponse(response) {
|
|
117
|
+
if (!response.body) {
|
|
118
|
+
return response;
|
|
119
|
+
}
|
|
120
|
+
const decoder = new TextDecoder();
|
|
121
|
+
const encoder = new TextEncoder();
|
|
122
|
+
let reasoningContent = "";
|
|
123
|
+
let isReasoningComplete = false;
|
|
124
|
+
let buffer = "";
|
|
125
|
+
const stream = new ReadableStream({
|
|
126
|
+
start: async (controller) => {
|
|
127
|
+
const reader = response.body.getReader();
|
|
128
|
+
const processLine = (line) => {
|
|
129
|
+
this.logger?.debug("Processing reasoning line:", line);
|
|
130
|
+
if (line.startsWith("data: ") && line.trim() !== "data: [DONE]") {
|
|
131
|
+
try {
|
|
132
|
+
const data = JSON.parse(line.slice(6));
|
|
133
|
+
if (data.choices?.[0]?.delta?.reasoning_content) {
|
|
134
|
+
reasoningContent += data.choices[0].delta.reasoning_content;
|
|
135
|
+
const thinkingChunk = {
|
|
136
|
+
...data,
|
|
137
|
+
choices: [
|
|
138
|
+
{
|
|
139
|
+
...data.choices[0],
|
|
140
|
+
delta: {
|
|
141
|
+
...data.choices[0].delta,
|
|
142
|
+
thinking: {
|
|
143
|
+
content: data.choices[0].delta.reasoning_content
|
|
144
|
+
}
|
|
145
|
+
}
|
|
146
|
+
}
|
|
147
|
+
]
|
|
148
|
+
};
|
|
149
|
+
delete thinkingChunk.choices[0].delta.reasoning_content;
|
|
150
|
+
const thinkingLine = `data: ${JSON.stringify(thinkingChunk)}
|
|
151
|
+
|
|
152
|
+
`;
|
|
153
|
+
controller.enqueue(encoder.encode(thinkingLine));
|
|
154
|
+
return;
|
|
155
|
+
}
|
|
156
|
+
if ((data.choices?.[0]?.delta?.content || data.choices?.[0]?.delta?.tool_calls) && reasoningContent && !isReasoningComplete) {
|
|
157
|
+
isReasoningComplete = true;
|
|
158
|
+
const signature = Date.now().toString();
|
|
159
|
+
const thinkingChunk = {
|
|
160
|
+
...data,
|
|
161
|
+
choices: [
|
|
162
|
+
{
|
|
163
|
+
...data.choices[0],
|
|
164
|
+
delta: {
|
|
165
|
+
...data.choices[0].delta,
|
|
166
|
+
content: null,
|
|
167
|
+
thinking: {
|
|
168
|
+
signature
|
|
169
|
+
}
|
|
170
|
+
}
|
|
171
|
+
}
|
|
172
|
+
]
|
|
173
|
+
};
|
|
174
|
+
delete thinkingChunk.choices[0].delta.reasoning_content;
|
|
175
|
+
const thinkingLine = `data: ${JSON.stringify(thinkingChunk)}
|
|
176
|
+
|
|
177
|
+
`;
|
|
178
|
+
controller.enqueue(encoder.encode(thinkingLine));
|
|
179
|
+
}
|
|
180
|
+
if (data.choices?.[0]?.delta?.reasoning_content) {
|
|
181
|
+
delete data.choices[0].delta.reasoning_content;
|
|
182
|
+
}
|
|
183
|
+
if (data.choices?.[0]?.delta && Object.keys(data.choices[0].delta).length > 0) {
|
|
184
|
+
if (isReasoningComplete) {
|
|
185
|
+
data.choices[0].index++;
|
|
186
|
+
}
|
|
187
|
+
const modifiedLine = `data: ${JSON.stringify(data)}
|
|
188
|
+
|
|
189
|
+
`;
|
|
190
|
+
controller.enqueue(encoder.encode(modifiedLine));
|
|
191
|
+
}
|
|
192
|
+
} catch (_e) {
|
|
193
|
+
controller.enqueue(encoder.encode(line + "\n"));
|
|
194
|
+
}
|
|
195
|
+
} else {
|
|
196
|
+
controller.enqueue(encoder.encode(line + "\n"));
|
|
197
|
+
}
|
|
198
|
+
};
|
|
199
|
+
try {
|
|
200
|
+
while (true) {
|
|
201
|
+
const { done, value } = await reader.read();
|
|
202
|
+
if (done) {
|
|
203
|
+
if (buffer.trim()) {
|
|
204
|
+
const lines2 = buffer.split("\n");
|
|
205
|
+
for (const line of lines2) {
|
|
206
|
+
if (line.trim()) {
|
|
207
|
+
controller.enqueue(encoder.encode(line + "\n"));
|
|
208
|
+
}
|
|
209
|
+
}
|
|
210
|
+
}
|
|
211
|
+
break;
|
|
212
|
+
}
|
|
213
|
+
const chunk = decoder.decode(value, { stream: true });
|
|
214
|
+
buffer += chunk;
|
|
215
|
+
const lines = buffer.split("\n");
|
|
216
|
+
buffer = lines.pop() || "";
|
|
217
|
+
for (const line of lines) {
|
|
218
|
+
if (!line.trim()) continue;
|
|
219
|
+
try {
|
|
220
|
+
processLine(line);
|
|
221
|
+
} catch (error) {
|
|
222
|
+
this.logger?.error("Error processing reasoning stream line:", error);
|
|
223
|
+
controller.enqueue(encoder.encode(line + "\n"));
|
|
224
|
+
}
|
|
225
|
+
}
|
|
226
|
+
}
|
|
227
|
+
} catch (error) {
|
|
228
|
+
this.logger?.error("Reasoning stream error:", error);
|
|
229
|
+
controller.error(error);
|
|
230
|
+
} finally {
|
|
231
|
+
try {
|
|
232
|
+
reader.releaseLock();
|
|
233
|
+
} catch (e) {
|
|
234
|
+
this.logger?.error("Error releasing reader lock:", e);
|
|
235
|
+
}
|
|
236
|
+
controller.close();
|
|
237
|
+
}
|
|
238
|
+
}
|
|
239
|
+
});
|
|
240
|
+
return new Response(stream, {
|
|
241
|
+
status: response.status,
|
|
242
|
+
statusText: response.statusText,
|
|
243
|
+
headers: new Headers({
|
|
244
|
+
"Content-Type": "text/event-stream",
|
|
245
|
+
"Cache-Control": "no-cache",
|
|
246
|
+
Connection: "keep-alive"
|
|
247
|
+
})
|
|
248
|
+
});
|
|
249
|
+
}
|
|
250
|
+
};
|
|
251
|
+
export {
|
|
252
|
+
ReasoningTransformer
|
|
253
|
+
};
|