utilitas 1999.1.97 → 1999.1.99

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
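If needed, a comparable diff can be reproduced locally with npm's built-in diff command (this sketch assumes npm 7 or later and access to the public registry):

    npm diff --diff=utilitas@1999.1.97 --diff=utilitas@1999.1.99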
package/lib/alan.mjs CHANGED
@@ -45,31 +45,33 @@ You may be provided with some tools(functions) to help you gather information an
  const _NEED = ['js-tiktoken', 'OpenAI'];

  const [
- OPENAI, GEMINI, OLLAMA, GEMINI_25_FLASH, NOVA, DEEPSEEK_R1, MD_CODE,
- CLOUD_SONNET_45, AUDIO, WAV, ATTACHMENTS, OPENAI_VOICE,
- GPT_REASONING_EFFORT, THINK, THINK_STR, THINK_END, TOOLS_STR, TOOLS_END,
- TOOLS, TEXT, OK, FUNC, GPT_51, GPT_51_CODEX, GEMMA_3_27B, ANTHROPIC, v8k, ais,
+ OPENAI, GEMINI, OLLAMA, NOVA, DEEPSEEK_R1, MD_CODE, CLOUD_SONNET_45, AUDIO,
+ WAV, ATTACHMENTS, OPENAI_VOICE, GPT_REASONING_EFFORT, THINK, THINK_STR,
+ THINK_END, TOOLS_STR, TOOLS_END, TOOLS, TEXT, OK, FUNC, GPT_51,
+ GPT_51_CODEX, GPT_5_IMAGE, GEMMA_3_27B, ANTHROPIC, v8k, ais,
  MAX_TOOL_RECURSION, LOG, name, user, system, assistant, MODEL, JSON_OBJECT,
  tokenSafeRatio, CONTENT_IS_REQUIRED, OPENAI_HI_RES_SIZE, k, kT, m, minute,
  hour, gb, trimTailing, GEMINI_25_FLASH_IMAGE, IMAGE, JINA, JINA_DEEPSEARCH,
- GEMINI_30_PRO, SILICONFLOW, SF_DEEPSEEK_R1, MAX_TIRE, OPENROUTER_API,
- OPENROUTER, AUTO, TOOL,
+ SILICONFLOW, SF_DEEPSEEK_R1, MAX_TIRE, OPENROUTER_API, OPENROUTER, AUTO,
+ TOOL, S_OPENAI, S_GOOGLE, S_ANTHROPIC, ONLINE,
  ] = [
- 'OpenAI', 'Gemini', 'Ollama', 'gemini-2.5-flash-preview-09-2025',
- 'nova', 'deepseek-r1', '```', 'anthropic/claude-sonnet-4.5', 'audio',
- 'wav', '[ATTACHMENTS]', 'OPENAI_VOICE', 'medium', 'think', '<think>',
- '</think>', '<tools>', '</tools>', 'tools', 'text', 'OK', 'function',
- 'gpt-5.1', 'gpt-5.1-codex', 'gemma3:27b', 'Anthropic', 7680 * 4320, [],
- 30, { log: true }, 'Alan', 'user', { role: 'system' }, 'assistant',
- 'model', 'json_object', 1.1, 'Content is required.', 2048 * 2048,
- x => 1024 * x, x => 1000 * x, x => 1024 * 1024 * x, x => 60 * x,
- x => 60 * 60 * x, x => 1024 * 1024 * 1024 * x,
- x => x.replace(/[\.\s]*$/, ''), 'gemini-2.5-flash-image', 'image',
- 'Jina', 'jina-deepsearch-v1', 'gemini-3-pro-preview', 'SiliconFlow',
- 'Pro/deepseek-ai/DeepSeek-R1', 768 * 768,
+ 'OpenAI', 'Gemini', 'Ollama', 'nova', 'deepseek-r1', '```',
+ 'claude-sonnet-4.5', 'audio', 'wav', '[ATTACHMENTS]', 'OPENAI_VOICE',
+ 'medium', 'think', '<think>', '</think>', '<tools>', '</tools>',
+ 'tools', 'text', 'OK', 'function', 'gpt-5.1', 'gpt-5.1-codex',
+ 'gpt-5-image', 'gemma3:27b', 'Anthropic', 7680 * 4320, [], 30,
+ { log: true }, 'Alan', 'user', { role: 'system' }, 'assistant', 'model',
+ 'json_object', 1.1, 'Content is required.', 2048 * 2048, x => 1024 * x,
+ x => 1000 * x, x => 1024 * 1024 * x, x => 60 * x, x => 60 * 60 * x,
+ x => 1024 * 1024 * 1024 * x, x => x.replace(/[\.\s]*$/, ''),
+ 'gemini-2.5-flash-image', 'image', 'Jina', 'jina-deepsearch-v1',
+ 'SiliconFlow', 'Pro/deepseek-ai/DeepSeek-R1', 768 * 768,
  'https://openrouter.ai/api/v1', 'OpenRouter', 'openrouter/auto', 'tool',
+ 'openai', 'google', 'anthropic', ':online',
  ];

+ const [GEMINI_25_FLASH, GEMINI_30_PRO]
+ = [`gemini-2.5-flash${ONLINE}`, `gemini-3-pro-preview${ONLINE}`];
  const [tool, messages, text]
  = [type => ({ type }), messages => ({ messages }), text => ({ text })];
  const [CODE_INTERPRETER, RETRIEVAL, FUNCTION]
@@ -88,7 +90,7 @@ const getProviderIcon = provider => PROVIDER_ICONS[provider] || '🔮';
  const libOpenAi = async opts => await need('openai', { ...opts, raw: true });
  const OpenAI = async opts => new (await libOpenAi(opts)).OpenAI(opts);
  const OPENAI_RULES = {
- source: 'openai',
+ source: S_OPENAI, icon: '⚛️',
  contextWindow: kT(400), maxOutputTokens: k(128),
  imageCostTokens: ~~(OPENAI_HI_RES_SIZE / MAX_TIRE * 140 + 70),
  maxFileSize: m(50), maxImageSize: OPENAI_HI_RES_SIZE,
@@ -101,7 +103,7 @@ const OPENAI_RULES = {
  };

  const GEMINI_RULES = {
- source: 'google',
+ source: S_GOOGLE, icon: '♊️',
  json: true, audioCostTokens: 1000 * 1000 * 1, // 8.4 hours => 1 million tokens
  imageCostTokens: ~~(v8k / MAX_TIRE * 258), maxAudioLength: hour(8.4),
  maxAudioPerPrompt: 1, maxFileSize: m(20), maxImagePerPrompt: 3000,
@@ -118,7 +120,7 @@ const GEMINI_RULES = {
  };

  const DEEPSEEK_R1_RULES = {
- contextWindow: kT(128), maxOutputTokens: k(8),
+ icon: '🐬', contextWindow: kT(128), maxOutputTokens: k(8),
  reasoning: true,
  };

@@ -126,29 +128,30 @@ const DEEPSEEK_R1_RULES = {
  // https://cloud.google.com/vertex-ai/docs/generative-ai/learn/models
  // https://openrouter.ai/docs/features/multimodal/audio (only support input audio)
  const MODELS = {
- [GPT_51]: { ...OPENAI_RULES, fast: true },
- [GPT_51_CODEX]: { ...OPENAI_RULES },
- [GEMINI_25_FLASH_IMAGE]: {
- ...GEMINI_RULES, contextWindow: k(64), maxOutputTokens: k(32),
- fast: true, image: true,
- },
+ // fast and balanced models
  [GEMINI_25_FLASH]: {
  ...GEMINI_RULES, contextWindow: m(1), maxOutputTokens: k(64),
  fast: true, reasoning: true, tools: true,
+ json: false, // issue with json output via OpenRouter
+ // https://gemini.google.com/app/c680748b3307790b
  },
+ // strong and fast
+ [GPT_51]: { ...OPENAI_RULES, fast: true },
+ // stronger but slow
  [GEMINI_30_PRO]: {
  ...GEMINI_RULES, contextWindow: m(1), maxOutputTokens: k(64),
  reasoning: true, tools: true,
  },
- [GEMMA_3_27B]: {
- contextWindow: kT(128), maxOutputTokens: k(8),
- imageCostTokens: 256, maxImageSize: 896 * 896,
- supportedMimeTypes: [MIME_PNG, MIME_JPEG, MIME_GIF],
- fast: true, json: true, vision: true,
- defaultProvider: OLLAMA,
+ // models with unique capabilities
+ [GEMINI_25_FLASH_IMAGE]: {
+ ...GEMINI_RULES, icon: '🍌', label: 'Nano Banana',
+ contextWindow: k(64), maxOutputTokens: k(32),
+ fast: true, image: true,
  },
+ [GPT_51_CODEX]: { ...OPENAI_RULES },
+ [GPT_5_IMAGE]: { ...OPENAI_RULES, image: true },
  [JINA_DEEPSEARCH]: {
- contextWindow: Infinity, maxInputTokens: Infinity,
+ label: '✴️', contextWindow: Infinity, maxInputTokens: Infinity,
  maxOutputTokens: Infinity, imageCostTokens: 0, maxImageSize: Infinity,
  supportedMimeTypes: [MIME_PNG, MIME_JPEG, MIME_TEXT, MIME_WEBP, MIME_PDF],
  reasoning: true, json: true, vision: true,
@@ -157,6 +160,7 @@ const MODELS = {
  [DEEPSEEK_R1]: DEEPSEEK_R1_RULES,
  [SF_DEEPSEEK_R1]: { ...DEEPSEEK_R1_RULES, defaultProvider: SILICONFLOW },
  [CLOUD_SONNET_45]: {
+ source: S_ANTHROPIC, icon: '✳️',
  contextWindow: kT(200), maxOutputTokens: kT(64),
  documentCostTokens: 3000 * 10, maxDocumentFile: m(32),
  maxDocumentPages: 100, imageCostTokens: ~~(v8k / 750),
@@ -165,6 +169,14 @@ const MODELS = {
  json: true, reasoning: true, tools: true, vision: true,
  defaultProvider: OPENROUTER,
  },
+ // best local model
+ [GEMMA_3_27B]: {
+ label: '❇️', contextWindow: kT(128), maxOutputTokens: k(8),
+ imageCostTokens: 256, maxImageSize: 896 * 896,
+ supportedMimeTypes: [MIME_PNG, MIME_JPEG, MIME_GIF],
+ fast: true, json: true, vision: true,
+ defaultProvider: OLLAMA,
+ },
  // https://docs.anthropic.com/en/docs/build-with-claude/vision
  // https://cloud.google.com/vertex-ai/generative-ai/docs/partner-models/claude/sonnet-4-5
  };
@@ -184,46 +196,47 @@ for (const n in MODELS) {
  ATTACHMENT_TOKEN_COST, MODELS[n].imageCostTokens || 0
  ) : MODELS[n].imageCostTokens;
  }
- MODELS[AUTO] = { name: AUTO, defaultProvider: OPENROUTER, };
- for (const n of [GPT_51, GPT_51_CODEX, GEMINI_30_PRO, GEMINI_25_FLASH]) {
- // get the most restrictive limits
- for (const key of [
- 'contextWindow', 'maxInputTokens', 'maxDocumentFile', 'maxAudioLength',
- 'maxImagePerPrompt', 'maxFileSize', 'maxImageSize', 'maxOutputTokens',
- 'maxAudioPerPrompt', 'maxDocumentPages', 'maxUrlSize', 'maxVideoLength',
- 'maxVideoPerPrompt',
- ]) {
- MODELS[AUTO][key] = Math.min(
- MODELS[AUTO][key] || Infinity, MODELS[n][key] || Infinity,
- );
- }
- // get the most permissive costs
- for (const key of [
- 'documentCostTokens', 'imageCostTokens', 'audioCostTokens',
- ]) {
- MODELS[AUTO][key] = Math.max(
- MODELS[AUTO][key] || 0, MODELS[n][key] || 0,
- );
- }
- // combine supported types
- for (const key of [
- 'supportedAudioTypes', 'supportedDocTypes', 'supportedMimeTypes',
- ]) {
- MODELS[AUTO][key] = [...new Set(
- [...MODELS[AUTO][key] || [], ...MODELS[n][key] || []]
- )];
- }
- // for other features, if any model supports it, then AUTO supports it
- for (const key of [
- 'json', 'reasoning', 'tools', 'vision', 'fast', 'deepsearch', 'image',
- ]) {
- MODELS[AUTO][key] = MODELS[AUTO][key] || MODELS[n][key];
- }
- // catch first possible support
- for (const key of ['audio']) {
- MODELS[AUTO][key] = MODELS[AUTO][key] || MODELS[n][key];
- }
- };
+ // The Auto model has some issues with tools and reasoning, so it is disabled here
+ // MODELS[AUTO] = { name: AUTO, defaultProvider: OPENROUTER, };
+ // for (const n of [GPT_51, GPT_51_CODEX, GEMINI_30_PRO, GEMINI_25_FLASH]) {
+ // // get the most restrictive limits
+ // for (const key of [
+ // 'contextWindow', 'maxInputTokens', 'maxDocumentFile', 'maxAudioLength',
+ // 'maxImagePerPrompt', 'maxFileSize', 'maxImageSize', 'maxOutputTokens',
+ // 'maxAudioPerPrompt', 'maxDocumentPages', 'maxUrlSize', 'maxVideoLength',
+ // 'maxVideoPerPrompt',
+ // ]) {
+ // MODELS[AUTO][key] = Math.min(
+ // MODELS[AUTO][key] || Infinity, MODELS[n][key] || Infinity,
+ // );
+ // }
+ // // get the most permissive costs
+ // for (const key of [
+ // 'documentCostTokens', 'imageCostTokens', 'audioCostTokens',
+ // ]) {
+ // MODELS[AUTO][key] = Math.max(
+ // MODELS[AUTO][key] || 0, MODELS[n][key] || 0,
+ // );
+ // }
+ // // combine supported types
+ // for (const key of [
+ // 'supportedAudioTypes', 'supportedDocTypes', 'supportedMimeTypes',
+ // ]) {
+ // MODELS[AUTO][key] = [...new Set(
+ // [...MODELS[AUTO][key] || [], ...MODELS[n][key] || []]
+ // )];
+ // }
+ // // for other features, if any model supports it, then AUTO supports it
+ // for (const key of [
+ // 'json', 'reasoning', 'tools', 'vision', 'fast', 'deepsearch', 'image',
+ // ]) {
+ // MODELS[AUTO][key] = MODELS[AUTO][key] || MODELS[n][key];
+ // }
+ // // catch first possible support
+ // for (const key of ['audio']) {
+ // MODELS[AUTO][key] = MODELS[AUTO][key] || MODELS[n][key];
+ // }
+ // };

  // Default models for each provider
  const DEFAULT_MODELS = {
@@ -255,7 +268,7 @@ const tokenRatioByCharacters = Math.max(
  );


- let tokeniser;
+ let tokeniser, _tools;

  const unifyProvider = provider => {
  assert(provider = (provider || '').trim(), 'AI provider is required.');
@@ -300,7 +313,7 @@ const tools = [
  }
  },
  func: async args => (await distill(args?.url))?.summary,
- showReq: true,
+ showReq: true, replaced: ONLINE,
  },
  {
  def: {
@@ -321,12 +334,11 @@
  }
  },
  func: async args => await search(args?.keyword),
- showReq: true,
- depend: checkSearch,
+ showReq: true, replaced: ONLINE, depend: checkSearch,
  },
  ];

- const toolsOpenAI = async () => {
+ const packTools = async () => {
  const _tools = [];
  for (const t of tools) {
  (t.depend ? await t.depend() : true) ? _tools.push(t) : log(
@@ -342,8 +354,8 @@ const buildAiId = (provider, model) => [
  ].map(x => ensureString(x, { case: 'SNAKE' })).join('_');

  const buildAiName = (provider, model) => [
- getProviderIcon(provider), provider,
- `(${isOpenrouter(provider, model) ? `${model.source}/` : ''}${model.name})`
+ model?.icon || getProviderIcon(provider), provider,
+ `(${isOpenrouter(provider, model) ? `${model.source}/` : ''}${model.label || model.name})`
  ].join(' ');

  const buildAiFeatures = model => Object.entries(FEATURE_ICONS).map(
@@ -383,6 +395,7 @@ const init = async (options = {}) => {
  }
  assert(models.length,
  `Model name or description is required for provider: ${provider}.`);
+ _tools || (_tools = await packTools());
  switch (provider) {
  case JINA:
  assertApiKey(provider, options);
@@ -444,6 +457,8 @@ const packAi = (ais, options = {}) => {
  };

  const getAi = async (id, options = {}) => {
+ options?.select || (options.select = {});
+ options?.jsonMode && (options.select.json = true);
  if (id) {
  const ai = ais.find(x => x.id === id);
  assert(ai, `AI not found: ${id}.`);
@@ -571,9 +586,11 @@ const getInfoEnd = text => Math.max(...[THINK_END, TOOLS_END].map(x => {

  // @todo: escape ``` in think and tools
  const packResp = async (resp, options) => {
+ // print(resp);
+ // return;
  if (options?.raw) { return resp; }
  let [
- txt, audio, images, references, simpleText, referencesMarkdown, end,
+ txt, audio, images, annotations, simpleText, annotationsMarkdown, end,
  json, audioMimeType,
  ] = [
  resp.text || '', // ChatGPT / Claude / Gemini / Ollama
@@ -609,39 +626,25 @@ const packResp = async (resp, options) => {
  else if (options?.simple && options?.imageMode) { return images; }
  else if (options?.simple) { return simpleText; }
  else if (options?.jsonMode) { txt = simpleText; }
- // references debug codes:
- // references = {
- // "segments": [
- // {
- // "startIndex": 387,
- // "endIndex": 477,
- // "text": "It also provides live weather reports from Shanghai weather stations and weather warnings.",
- // "indices": [
- // 0
- // ],
- // "confidence": [
- // 0.94840443
- // ]
- // },
- // ],
- // "links": [
- // {
- // "uri": "https://vertexaisearch.cloud.google.com/grounding-api-redirect/AYygrcRVExzEYZU-23c6gKNSOJjLvSpI4CHtVmYJZaTLKd5N9GF-38GNyC2c9arn689-dmmpMh0Vd85x0kQp0IVY7BQMl1ugEYzy_IlDF-L3wFqf9xWHelAZF4cJa2LnWeUQsjyyTnYFRUs7nhlVoDVu1qYF0uLtVIjdyl5NH0PM92A=",
- // "title": "weather-forecast.com"
- // },
- // ]
- // };
- if (references?.segments?.length && references?.links?.length) {
- for (let i = references.segments.length - 1; i >= 0; i--) {
- let idx = txt.indexOf(references.segments[i].text);
- if (idx < 0) { continue; }
- idx += references.segments[i].text.length;
- txt = txt.slice(0, idx)
- + references.segments[i].indices.map(y => ` (${y + 1})`).join('')
- + txt.slice(idx);
- }
- referencesMarkdown = 'References:\n\n' + references.links.map(
- (x, i) => `${i + 1}. [${x.title}](${x.uri})`
+ // annotations debug codes:
+ // annotations = [
+ // {
+ // "type": "url_citation",
+ // "url_citation": {
+ // "end_index": 0,
+ // "start_index": 0,
+ // "title": "在線時鐘- 目前時間- 線上時鐘- 時鐘線上 - 鬧鐘",
+ // "url": "https://naozhong.tw/shijian/",
+ // "content": "- [鬧鐘](https://naozhong.tw/)\n- [計時器](https://naozhong.tw/jishiqi/)\n- [碼錶](https://naozhong.tw/miaobiao/)\n- [時間](https://naozhong.tw/shijian/)\n\n# 現在時間\n\n加入\n\n- [編輯](javascript:;)\n- [移至頂端](javascript:;)\n- [上移](javascript:;)\n- [下移](javascript:;)\n- [刪除](javascript:;)\n\n# 最常用\n\n| | |\n| --- | --- |\n| [台北](https://naozhong.tw/shijian/%E5%8F%B0%E5%8C%97/) | 10:09:14 |\n| [北京,中國](https://naozhong.tw/shijian/%E5%8C%97%E4%BA%AC-%E4%B8%AD%E5%9C%8B/) | 10:09:14 |\n| [上海,中國](https://naozhong.tw/shijian/%E4%B8%8A%E6%B5%B7-%E4%B8%AD%E5%9C%8B/) | 10:09:14 |\n| [烏魯木齊,中國](https://naozhong.tw/shijian/%E7%83%8F%E9%AD%AF%"
+ // }
+ // },
+ // ];
+ if (annotations?.length) {
+ annotations = annotations.filter(x => x?.type === 'url_citation').map(
+ x => ({ type: x.type, ...x.url_citation })
+ );
+ annotationsMarkdown = 'References:\n\n' + annotations.map(
+ (x, i) => `${i + 1}. [${x.title}](${x.url})`
  ).join('\n');
  }
  txt = txt.split('\n');
@@ -672,11 +675,14 @@ const packResp = async (resp, options) => {
  !options?.delta && !options?.processing && (txt = txt.trim());
  return {
  ...text(txt), ...options?.jsonMode ? { json } : {},
- ...references ? { references } : {},
- ...referencesMarkdown ? { referencesMarkdown } : {},
+ ...annotations ? { annotations } : {},
+ ...annotationsMarkdown ? { annotationsMarkdown } : {},
  ...audio ? { audio } : {}, ...images?.length ? { images } : {},
  processing: !!options?.processing,
- model: options?.model,
+ model: [
+ options.provider, options?.router?.provider,
+ options?.router?.model || options?.model,
+ ].filter(x => x).join('/'),
  };
  };

@@ -790,11 +796,13 @@ const promptOpenAI = async (aiId, content, options = {}) => {
  let { provider, client, model } = await getAi(aiId);
  let [
  result, resultAudio, resultImages, resultReasoning, event, resultTools,
- responded, modalities, source, reasoningEnd
+ responded, modalities, source, reasoningEnd, reasoning_details,
+ annotations,
  ] = [
  options.result ?? '', Buffer.alloc(0), [], '', null, [], false,
- options.modalities, model?.source, false
+ options.modalities, model?.source, false, [], [],
  ];
+ options.provider = provider;
  options.model = options.model || model.name;
  const { history }
  = await buildPrompts(MODELS[options.model], content, options);
@@ -806,8 +814,13 @@ const promptOpenAI = async (aiId, content, options = {}) => {
  } else if (!modalities && model.image) {
  modalities = [TEXT, IMAGE];
  }
- const googleImageMode = source === 'google' && modalities?.has?.(IMAGE);
- const targetModel = `${isOpenrouter(provider, model) ? `${source}/` : ''}${options.model}`;
+ const googleImageMode = source === S_GOOGLE && modalities?.has?.(IMAGE);
+ // pricy: https://openrouter.ai/docs/features/web-search
+ const ext = ''; // options.jsonMode ? '' : ONLINE;
+ const targetModel = `${isOpenrouter(provider, model) ? `${source}/` : ''}${options.model}${ext}`;
+ const packedTools = (targetModel.endsWith(ONLINE)
+ ? _tools.filter(x => x?.replaced !== ONLINE)
+ : _tools).map(x => x.def);
  const resp = await client.chat.completions.create({
  model: targetModel, ...history,
  ...options.jsonMode ? { response_format: { type: JSON_OBJECT } } : {},
@@ -816,14 +829,15 @@ const promptOpenAI = async (aiId, content, options = {}) => {
  modalities?.find?.(x => x === AUDIO)
  && { voice: DEFAULT_MODELS[OPENAI_VOICE], format: 'pcm16' }
  ), ...model?.tools && !googleImageMode ? {
- tools: options.tools ?? (await toolsOpenAI()).map(x => x.def),
- tool_choice: 'auto',
- } : {},
- store: true, stream: true,
+ tools: options.tools ?? packedTools, tool_choice: 'auto',
+ } : {}, store: true, stream: true,
  reasoning_effort: options.reasoning_effort,
  });
  for await (event of resp) {
  // print(JSON.stringify(event, null, 2));
+ event?.provider && event?.model && (options.router = {
+ provider: event.provider, model: event.model,
+ });
  event = event?.choices?.[0] || {};
  const delta = event.delta || {};
  let [delteReasoning, deltaText] = [
@@ -836,6 +850,22 @@ const promptOpenAI = async (aiId, content, options = {}) => {
  const deltaAudio = delta.audio?.data ? await convert(
  delta.audio.data, { input: BASE64, expected: BUFFER }
  ) : Buffer.alloc(0);
+ delta?.annotations?.length && annotations.push(...delta.annotations);
+ // for Anthropic, reasoning details need to be merged during streaming
+ if (delta?.reasoning_details?.length) {
+ reasoning_details.length || reasoning_details.push({});
+ for (const item of delta.reasoning_details) {
+ for (const key in item) {
+ if (key === 'text') {
+ reasoning_details[0][key] = (
+ reasoning_details[0][key] || ''
+ ) + item[key];
+ continue;
+ }
+ reasoning_details[0][key] = item[key];
+ }
+ }
+ }
  for (const x of delta.tool_calls || []) {
  let curFunc = resultTools.find(y => y.index === x.index);
  curFunc || (resultTools.push(curFunc = {}));
@@ -851,9 +881,11 @@ const promptOpenAI = async (aiId, content, options = {}) => {
  options.result && deltaText
  && (responded = responded || (deltaText = `\n\n${deltaText}`));
  resultReasoning += delteReasoning;
+ // the \n\n is needed for Interleaved Thinking:
+ // tools => reasoning => tools => reasoning ...
  delteReasoning && delteReasoning === resultReasoning
- && (delteReasoning = `${THINK_STR}\n${delteReasoning}`);
- resultReasoning && deltaText && !reasoningEnd && (
+ && (delteReasoning = `${result ? '\n\n' : ''}${THINK_STR}\n${delteReasoning}`);
+ resultReasoning && (deltaText || delta.tool_calls?.length) && !reasoningEnd && (
  reasoningEnd = delteReasoning = `${delteReasoning}${THINK_END}\n\n`
  );
  deltaText = delteReasoning + deltaText;
@@ -873,7 +905,19 @@ const promptOpenAI = async (aiId, content, options = {}) => {
  role: assistant, text: result, tool_calls: resultTools,
  ...resultImages.length ? { images: resultImages } : {},
  ...resultAudio.length ? { audio: { data: resultAudio } } : {},
+ ...annotations.length ? { annotations } : {},
  };
+ switch (source) {
+ case S_ANTHROPIC:
+ event.content = reasoning_details.map(x => ({
+ type: 'thinking', thinking: x.text,
+ ...x.signature ? { signature: x.signature } : {},
+ }));
+ break;
+ case S_GOOGLE:
+ reasoning_details?.length
+ && (event.reasoning_details = reasoning_details);
+ }
  const { toolsResult, toolsResponse }
  = await handleToolsCall(event, { ...options, result });
  if (toolsResult.length
@@ -886,122 +930,6 @@ const promptOpenAI = async (aiId, content, options = {}) => {
  return await packResp(event, options);
  };

- // const packGeminiReferences = (chunks, supports) => {
- // let references = null;
- // if (chunks?.length && supports?.length) {
- // references = { segments: [], links: [] };
- // supports.map(s => references.segments.push({
- // ...s.segment, indices: s.groundingChunkIndices,
- // confidence: s.confidenceScores,
- // }));
- // chunks.map(c => references.links.push(c.web));
- // }
- // return references;
- // };
-
- // const promptGemini = async (aiId, content, options = {}) => {
- // let { provider, client, model } = await getAi(aiId);
- // let [
- // event, result, text, thinking, references, functionCalls, responded,
- // images, thinkEnd,
- // ] = [null, options.result ?? '', '', '', null, [], false, [], false];
- // options.model = options.model || model.name;
- // model?.image === true && (options.imageMode = true);
- // assert(!(options.imageMode && !model.image), 'Image mode is not supported.');
- // if (options.imageMode && String.isString(model.image)) {
- // options.model = model.image;
- // options.imageMode = true;
- // model = MODELS[options.model];
- // }
- // options.flavor = GEMINI;
- // const { systemPrompt: systemInstruction, history, prompt }
- // = await buildPrompts(model, content, options);
- // const responseModalities = options.modalities
- // || (options.imageMode ? [TEXT, IMAGE] : undefined)
- // || (options.audioMode ? [TEXT, AUDIO] : undefined);
- // const chat = client.chats.create({
- // model: options.model, history, config: {
- // responseMimeType: options.jsonMode ? MIME_JSON : MIME_TEXT,
- // ...model.reasoning ? {
- // thinkingConfig: { includeThoughts: true },
- // } : {}, systemInstruction, responseModalities,
- // ...options?.config || {}, ...model?.tools && !options.jsonMode
- // && ![GEMINI_25_FLASH_IMAGE].includes(options.model)
- // ? (options.tools ?? {
- // tools: [
- // // @todo: Gemini will failed when using these tools together.
- // // https://ai.google.dev/gemini-api/docs/function-calling
- // // { codeExecution: {} },
- // // { googleSearch: {} },
- // // { urlContext: {} },
- // // @todo: test these tools in next version 👆
- // {
- // functionDeclarations: (
- // await toolsGemini({ provider })
- // ).map(x => x.def)
- // },
- // ], toolConfig: { functionCallingConfig: { mode: 'AUTO' } },
- // }) : {},
- // },
- // });
- // const resp = await chat.sendMessageStream({ message: prompt });
- // for await (const chunk of resp) {
- // assert(
- // !chunk?.promptFeedback?.blockReason,
- // chunk?.promptFeedback?.blockReason
- // );
- // event = chunk?.candidates?.[0];
- // let [deltaText, deltaThink, deltaImages] = ['', '', []];
- // event?.content?.parts?.map(x => {
- // if (x.text && x.thought) { deltaThink = x.text; }
- // else if (x.text) { deltaText = x.text; }
- // else if (x.functionCall) { functionCalls.push(x); }
- // else if (x.inlineData?.mimeType === MIME_PNG) {
- // deltaImages.push(x.inlineData);
- // images.push(x.inlineData);
- // }
- // });
- // text += deltaText;
- // thinking += deltaThink;
- // deltaThink && deltaThink === thinking
- // && (deltaThink = `${THINK_STR}\n${deltaThink}`);
- // thinking && deltaText && !thinkEnd
- // && (thinkEnd = deltaThink = `${deltaThink}${THINK_END}\n\n`);
- // deltaText = deltaThink + deltaText;
- // const rfc = packGeminiReferences(
- // event?.groundingMetadata?.groundingChunks,
- // event?.groundingMetadata?.groundingSupports
- // );
- // rfc && (references = rfc);
- // options.result && deltaText
- // && (responded = responded || (deltaText = `\n\n${deltaText}`));
- // result += deltaText;
- // (deltaText || deltaImages.length) && await streamResp({
- // text: options.delta ? deltaText : result,
- // images: options.delta ? deltaImages : images,
- // }, options);
- // }
- // event = {
- // role: MODEL, parts: [
- // ...thinking ? [{ thought: true, text: thinking }] : [],
- // ...text ? [{ text }] : [],
- // ...functionCalls,
- // ],
- // };
- // const { toolsResult, toolsResponse } = await handleToolsCall(
- // event, { ...options, result, flavor: GEMINI }
- // );
- // if (toolsResult.length
- // && countToolCalls(toolsResponse) < MAX_TOOL_RECURSION) {
- // return promptGemini(aiId, content, {
- // ...options || {}, result: toolsResponse,
- // toolsResult: [...options?.toolsResult || [], ...toolsResult],
- // });
- // }
- // return await packResp({
- // text: mergeMsgs(toolsResponse, toolsResult), images, references,
- // }, options);
- // };

  const initChat = async (options = {}) => {
  if (options.sessions) {
package/lib/gen.mjs CHANGED
@@ -10,11 +10,11 @@ const _NEED = ['OpenAI', '@google/genai'];
  const log = (cnt, opt) => _log(cnt, import.meta.url, { time: 1, ...opt || {} });
  const [
  clients, OPENAI, GEMINI, BASE64, FILE, BUFFER, ERROR_GENERATING,
- IMAGEN_MODEL, OPENAI_MODEL, VEO_MODEL,
+ IMAGEN_MODEL, OPENAI_MODEL, VEO_MODEL, IMAGEN_UPSCALE_MODEL,
  ] = [
  {}, 'OPENAI', 'GEMINI', 'BASE64', 'FILE', 'BUFFER',
  'Error generating media.', 'imagen-4.0-ultra-generate-001',
- 'gpt-image-1', 'veo-3.1-generate-preview',
+ 'gpt-image-1', 'veo-3.1-generate-preview', 'imagen-4.0-upscale-preview',
  ];

  const init = async (options) => {
package/lib/manifest.mjs CHANGED
@@ -1,7 +1,7 @@
  const manifest = {
  "name": "utilitas",
  "description": "Just another common utility for JavaScript.",
- "version": "1999.1.97",
+ "version": "1999.1.99",
  "private": false,
  "homepage": "https://github.com/Leask/utilitas",
  "main": "index.mjs",
package/package.json CHANGED
@@ -1,7 +1,7 @@
  {
  "name": "utilitas",
  "description": "Just another common utility for JavaScript.",
- "version": "1999.1.97",
+ "version": "1999.1.99",
  "private": false,
  "homepage": "https://github.com/Leask/utilitas",
  "main": "index.mjs",