npm - @botpress/cognitive - Versions diffs - 0.1.42 → 0.1.44 - Mend

@botpress/cognitive 0.1.42 → 0.1.44

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7) hide show

package/dist/index.d.ts CHANGED Viewed

@@ -18979,7 +18979,7 @@ declare class Cognitive {
     private _generateContent;
 }
-type Models = 'auto' | 'best' | 'fast' | 'reasoning' | 'cheapest' | 'balance' | 'recommended' | 'reasoning' | 'general-purpose' | 'low-cost' | 'vision' | 'coding' | 'function-calling' | 'agents' | 'storytelling' | 'preview' | 'roleplay' | 'anthropic:claude-3-5-haiku-20241022' | 'anthropic:claude-3-5-sonnet-20240620' | 'anthropic:claude-3-5-sonnet-20241022' | 'anthropic:claude-3-7-sonnet-20250219' | 'anthropic:claude-3-haiku-20240307' | 'anthropic:claude-sonnet-4-20250514' | 'cerebras:gpt-oss-120b' | 'cerebras:llama-4-scout-17b-16e-instruct' | 'cerebras:llama3.1-8b' | 'cerebras:llama3.3-70b' | 'cerebras:qwen-3-32b' | 'fireworks:deepseek-r1' | 'fireworks:deepseek-r1-0528' | 'fireworks:deepseek-r1-basic' | 'fireworks:deepseek-v3-0324' | 'fireworks:gpt-oss-120b' | 'fireworks:gpt-oss-20b' | 'fireworks:llama-v3p1-8b-instruct' | 'fireworks:llama-v3p3-70b-instruct' | 'fireworks:llama4-maverick-instruct-basic' | 'fireworks:llama4-scout-instruct-basic' | 'fireworks:mixtral-8x22b-instruct' | 'fireworks:mixtral-8x7b-instruct' | 'fireworks:mythomax-l2-13b' | 'google-ai:gemini-2.5-flash' | 'google-ai:gemini-2.5-pro' | 'google-ai:models/gemini-2.0-flash' | 'groq:deepseek-r1-distill-llama-70b' | 'groq:gemma2-9b-it' | 'groq:llama-3.1-8b-instant' | 'groq:llama-3.3-70b-versatile' | 'groq:openai/gpt-oss-120b' | 'groq:openai/gpt-oss-20b' | 'openai:gpt-4.1-2025-04-14' | 'openai:gpt-4.1-mini-2025-04-14' | 'openai:gpt-4.1-nano-2025-04-14' | 'openai:gpt-4o-2024-11-20' | 'openai:gpt-4o-mini-2024-07-18' | 'openai:gpt-5-2025-08-07' | 'openai:gpt-5-mini-2025-08-07' | 'openai:gpt-5-nano-2025-08-07' | 'openai:o1-2024-12-17' | 'openai:o1-mini-2024-09-12' | 'openai:o3-2025-04-16' | 'openai:o3-mini-2025-01-31' | 'openai:o4-mini-2025-04-16' | 'openrouter:gpt-oss-120b' | ({} & string);
+type Models = 'auto' | 'best' | 'fast' | 'reasoning' | 'cheapest' | 'balance' | 'recommended' | 'reasoning' | 'general-purpose' | 'low-cost' | 'vision' | 'coding' | 'function-calling' | 'agents' | 'storytelling' | 'preview' | 'roleplay' | 'anthropic:claude-3-5-haiku-20241022' | 'anthropic:claude-3-5-sonnet-20240620' | 'anthropic:claude-3-5-sonnet-20241022' | 'anthropic:claude-3-7-sonnet-20250219' | 'anthropic:claude-3-haiku-20240307' | 'anthropic:claude-sonnet-4-20250514' | 'cerebras:gpt-oss-120b' | 'cerebras:llama-4-scout-17b-16e-instruct' | 'cerebras:llama3.1-8b' | 'cerebras:llama3.3-70b' | 'cerebras:qwen-3-32b' | 'fireworks-ai:deepseek-r1' | 'fireworks-ai:deepseek-r1-0528' | 'fireworks-ai:deepseek-r1-basic' | 'fireworks-ai:deepseek-v3-0324' | 'fireworks-ai:gpt-oss-120b' | 'fireworks-ai:gpt-oss-20b' | 'fireworks-ai:llama-v3p1-8b-instruct' | 'fireworks-ai:llama-v3p3-70b-instruct' | 'fireworks-ai:llama4-maverick-instruct-basic' | 'fireworks-ai:llama4-scout-instruct-basic' | 'fireworks-ai:mixtral-8x22b-instruct' | 'fireworks-ai:mixtral-8x7b-instruct' | 'fireworks-ai:mythomax-l2-13b' | 'google-ai:gemini-2.5-flash' | 'google-ai:gemini-2.5-pro' | 'google-ai:models/gemini-2.0-flash' | 'groq:deepseek-r1-distill-llama-70b' | 'groq:gemma2-9b-it' | 'groq:llama-3.1-8b-instant' | 'groq:llama-3.3-70b-versatile' | 'groq:openai/gpt-oss-120b' | 'groq:openai/gpt-oss-20b' | 'openai:gpt-4.1-2025-04-14' | 'openai:gpt-4.1-mini-2025-04-14' | 'openai:gpt-4.1-nano-2025-04-14' | 'openai:gpt-4o-2024-11-20' | 'openai:gpt-4o-mini-2024-07-18' | 'openai:gpt-5-2025-08-07' | 'openai:gpt-5-mini-2025-08-07' | 'openai:gpt-5-nano-2025-08-07' | 'openai:o1-2024-12-17' | 'openai:o1-mini-2024-09-12' | 'openai:o3-2025-04-16' | 'openai:o3-mini-2025-01-31' | 'openai:o4-mini-2025-04-16' | 'openrouter:gpt-oss-120b' | 'xai:grok-3' | 'xai:grok-3-mini' | 'xai:grok-4-0709' | 'xai:grok-4-fast-non-reasoning' | 'xai:grok-4-fast-reasoning' | 'xai:grok-code-fast-1' | ({} & string);
 type CognitiveRequest = {
     /**
      * @minItems 1
@@ -19055,13 +19055,17 @@ type CognitiveResponse = {
         model?: string;
         usage: {
             inputTokens: number;
+            inputCost: number;
             outputTokens: number;
-            reasoningTokens?: number;
+            outputCost: number;
         };
         cost?: number;
         cached?: boolean;
+        /**
+         * Time it took for the provider to respond to the LLM query
+         */
         latency?: number;
-        stopReason?: string;
+        stopReason?: 'stop' | 'length' | 'content_filter' | 'error';
         reasoningEffort?: string;
         warnings?: {
             type: 'parameter_ignored' | 'provider_limitation' | 'deprecated_model' | 'fallback_used';

package/dist/index.mjs CHANGED Viewed

@@ -1311,6 +1311,96 @@ var models = {
     tags: ["low-cost", "general-purpose"],
     lifecycle: "live"
   },
+  "xai:grok-code-fast-1": {
+    id: "xai:grok-code-fast-1",
+    name: "Grok Code Fast 1",
+    description: "Fast coding-optimized Grok model with large context window.",
+    input: {
+      maxTokens: 256e3,
+      costPer1MTokens: 0.2
+    },
+    output: {
+      maxTokens: 32768,
+      costPer1MTokens: 1.5
+    },
+    tags: ["coding", "general-purpose", "low-cost"],
+    lifecycle: "live"
+  },
+  "xai:grok-4-fast-reasoning": {
+    id: "xai:grok-4-fast-reasoning",
+    name: "Grok 4 Fast (Reasoning)",
+    description: "Advanced fast Grok model with reasoning and very large context.",
+    input: {
+      maxTokens: 2e6,
+      costPer1MTokens: 0.2
+    },
+    output: {
+      maxTokens: 128e3,
+      costPer1MTokens: 0.5
+    },
+    tags: ["reasoning", "recommended", "general-purpose"],
+    lifecycle: "live"
+  },
+  "xai:grok-4-fast-non-reasoning": {
+    id: "xai:grok-4-fast-non-reasoning",
+    name: "Grok 4 Fast (Non-Reasoning)",
+    description: "Fast, cost-effective Grok model for non-reasoning tasks.",
+    input: {
+      maxTokens: 2e6,
+      costPer1MTokens: 0.2
+    },
+    output: {
+      maxTokens: 128e3,
+      costPer1MTokens: 0.5
+    },
+    tags: ["low-cost", "recommended", "general-purpose"],
+    lifecycle: "live"
+  },
+  "xai:grok-4-0709": {
+    id: "xai:grok-4-0709",
+    name: "Grok 4 (0709)",
+    description: "Comprehensive Grok 4 model for general-purpose tasks.",
+    input: {
+      maxTokens: 256e3,
+      costPer1MTokens: 3
+    },
+    output: {
+      maxTokens: 32768,
+      costPer1MTokens: 15
+    },
+    tags: ["reasoning", "general-purpose"],
+    lifecycle: "live"
+  },
+  "xai:grok-3-mini": {
+    id: "xai:grok-3-mini",
+    name: "Grok 3 Mini",
+    description: "Lightweight Grok model for cost-sensitive workloads.",
+    input: {
+      maxTokens: 131072,
+      costPer1MTokens: 0.3
+    },
+    output: {
+      maxTokens: 16384,
+      costPer1MTokens: 0.5
+    },
+    tags: ["low-cost", "general-purpose"],
+    lifecycle: "live"
+  },
+  "xai:grok-3": {
+    id: "xai:grok-3",
+    name: "Grok 3",
+    description: "Enterprise-grade Grok model for general-purpose tasks.",
+    input: {
+      maxTokens: 131072,
+      costPer1MTokens: 3
+    },
+    output: {
+      maxTokens: 16384,
+      costPer1MTokens: 15
+    },
+    tags: ["general-purpose"],
+    lifecycle: "live"
+  },
   "openrouter:gpt-oss-120b": {
     id: "openrouter:gpt-oss-120b",
     name: "GPT-OSS 120B (Preview)",
@@ -1326,8 +1416,8 @@ var models = {
     tags: ["preview", "general-purpose", "reasoning"],
     lifecycle: "live"
   },
-  "fireworks:gpt-oss-20b": {
-    id: "fireworks:gpt-oss-20b",
+  "fireworks-ai:gpt-oss-20b": {
+    id: "fireworks-ai:gpt-oss-20b",
     name: "GPT-OSS 20B",
     description: "gpt-oss-20b is a compact, open-weight language model optimized for low-latency. It shares the same training foundation and capabilities as the GPT-OSS 120B model, with faster responses and lower cost.",
     input: {
@@ -1342,8 +1432,8 @@ var models = {
     lifecycle: "live",
     aliases: ["accounts/fireworks/models/gpt-oss-20b"]
   },
-  "fireworks:gpt-oss-120b": {
-    id: "fireworks:gpt-oss-120b",
+  "fireworks-ai:gpt-oss-120b": {
+    id: "fireworks-ai:gpt-oss-120b",
     name: "GPT-OSS 120B",
     description: "gpt-oss-120b is a high-performance, open-weight language model designed for production-grade, general-purpose use cases. It excels at complex reasoning and supports configurable reasoning effort, full chain-of-thought transparency for easier debugging and trust, and native agentic capabilities for function calling, tool use, and structured outputs.",
     input: {
@@ -1358,8 +1448,8 @@ var models = {
     lifecycle: "live",
     aliases: ["accounts/fireworks/models/gpt-oss-120b"]
   },
-  "fireworks:deepseek-r1-0528": {
-    id: "fireworks:deepseek-r1-0528",
+  "fireworks-ai:deepseek-r1-0528": {
+    id: "fireworks-ai:deepseek-r1-0528",
     name: "DeepSeek R1 0528",
     description: "The updated DeepSeek R1 0528 model delivers major improvements in reasoning, inference, and accuracy through enhanced post-training optimization and greater computational resources. It now performs at a level approaching top-tier models like OpenAI o3 and Gemini 2.5 Pro, with notable gains in complex tasks such as math and programming. The update also reduces hallucinations, improves function calling, and enhances the coding experience.",
     input: {
@@ -1374,8 +1464,8 @@ var models = {
     lifecycle: "live",
     aliases: ["accounts/fireworks/models/deepseek-r1-0528"]
   },
-  "fireworks:deepseek-v3-0324": {
-    id: "fireworks:deepseek-v3-0324",
+  "fireworks-ai:deepseek-v3-0324": {
+    id: "fireworks-ai:deepseek-v3-0324",
     name: "DeepSeek V3 0324",
     description: "DeepSeek V3, a 685B-parameter, mixture-of-experts model, is the latest iteration of the flagship chat model family from the DeepSeek team. It succeeds the DeepSeek V3 model and performs really well on a variety of tasks.",
     input: {
@@ -1390,8 +1480,8 @@ var models = {
     lifecycle: "live",
     aliases: ["accounts/fireworks/models/deepseek-v3-0324"]
   },
-  "fireworks:llama4-maverick-instruct-basic": {
-    id: "fireworks:llama4-maverick-instruct-basic",
+  "fireworks-ai:llama4-maverick-instruct-basic": {
+    id: "fireworks-ai:llama4-maverick-instruct-basic",
     name: "Llama 4 Maverick Instruct (Basic)",
     description: "Llama 4 Maverick 17B Instruct (128E) is a high-capacity multimodal language model from Meta, built on a mixture-of-experts (MoE) architecture with 128 experts and 17 billion active parameters per forward pass (400B total). It supports multilingual text and image input, and produces multilingual text and code output across 12 supported languages. Optimized for vision-language tasks, Maverick is instruction-tuned for assistant-like behavior, image reasoning, and general-purpose multimodal interaction, and suited for research and commercial applications requiring advanced multimodal understanding and high model throughput.",
     input: {
@@ -1406,8 +1496,8 @@ var models = {
     lifecycle: "live",
     aliases: ["accounts/fireworks/models/llama4-maverick-instruct-basic"]
   },
-  "fireworks:llama4-scout-instruct-basic": {
-    id: "fireworks:llama4-scout-instruct-basic",
+  "fireworks-ai:llama4-scout-instruct-basic": {
+    id: "fireworks-ai:llama4-scout-instruct-basic",
     name: "Llama 4 Scout Instruct (Basic)",
     description: "Llama 4 Scout 17B Instruct (16E) is a mixture-of-experts (MoE) language model developed by Meta, uses 16 experts per forward pass, activating 17 billion parameters out of a total of 109B. It supports native multimodal input (text and image) and multilingual output (text and code) across 12 supported languages. Designed for assistant-style interaction and visual reasoning, it is instruction-tuned for use in multilingual chat, captioning, and image understanding tasks.",
     input: {
@@ -1422,8 +1512,8 @@ var models = {
     lifecycle: "live",
     aliases: ["accounts/fireworks/models/llama4-scout-instruct-basic"]
   },
-  "fireworks:llama-v3p3-70b-instruct": {
-    id: "fireworks:llama-v3p3-70b-instruct",
+  "fireworks-ai:llama-v3p3-70b-instruct": {
+    id: "fireworks-ai:llama-v3p3-70b-instruct",
     name: "Llama 3.3 70B Instruct",
     description: "Llama 3.3 70B Instruct is the December update of Llama 3.1 70B. The model improves upon Llama 3.1 70B (released July 2024) with advances in tool calling, multilingual text support, math and coding. The model achieves industry leading results in reasoning, math and instruction following and provides similar performance as 3.1 405B but with significant speed and cost improvements.",
     input: {
@@ -1438,8 +1528,8 @@ var models = {
     lifecycle: "live",
     aliases: ["accounts/fireworks/models/llama-v3p3-70b-instruct"]
   },
-  "fireworks:deepseek-r1": {
-    id: "fireworks:deepseek-r1",
+  "fireworks-ai:deepseek-r1": {
+    id: "fireworks-ai:deepseek-r1",
     name: "DeepSeek R1 (Fast)",
     description: "This version of the R1 model has a perfect balance between speed and cost-efficiency for real-time interactive experiences, with speeds up to 90 tokens per second.\n\nDeepSeek-R1 is a state-of-the-art large language model optimized with reinforcement learning and cold-start data for exceptional reasoning, math, and code performance. **Note**: This model will always use a temperature of 0.6 as recommended by DeepSeek.",
     input: {
@@ -1454,8 +1544,8 @@ var models = {
     lifecycle: "live",
     aliases: ["accounts/fireworks/models/deepseek-r1"]
   },
-  "fireworks:deepseek-r1-basic": {
-    id: "fireworks:deepseek-r1-basic",
+  "fireworks-ai:deepseek-r1-basic": {
+    id: "fireworks-ai:deepseek-r1-basic",
     name: "DeepSeek R1 (Basic)",
     description: 'This version of the R1 model is optimized for throughput and cost-effectiveness and has a lower cost but slightly higher latency than the "Fast" version of the model.\n\nDeepSeek-R1 is a state-of-the-art large language model optimized with reinforcement learning and cold-start data for exceptional reasoning, math, and code performance. **Note**: This model will always use a temperature of 0.6 as recommended by DeepSeek.',
     input: {
@@ -1470,8 +1560,8 @@ var models = {
     lifecycle: "live",
     aliases: ["accounts/fireworks/models/deepseek-r1-basic"]
   },
-  "fireworks:deepseek-v3": {
-    id: "fireworks:deepseek-v3",
+  "fireworks-ai:deepseek-v3": {
+    id: "fireworks-ai:deepseek-v3",
     name: "DeepSeek V3",
     description: "A a strong Mixture-of-Experts (MoE) language model with 671B total parameters with 37B activated for each token from Deepseek.",
     input: {
@@ -1486,8 +1576,8 @@ var models = {
     lifecycle: "deprecated",
     aliases: ["accounts/fireworks/models/deepseek-v3"]
   },
-  "fireworks:llama-v3p1-405b-instruct": {
-    id: "fireworks:llama-v3p1-405b-instruct",
+  "fireworks-ai:llama-v3p1-405b-instruct": {
+    id: "fireworks-ai:llama-v3p1-405b-instruct",
     name: "Llama 3.1 405B Instruct",
     description: "The Meta Llama 3.1 collection of multilingual large language models (LLMs) is a collection of pretrained and instruction tuned generative models in 8B, 70B and 405B sizes. The Llama 3.1 instruction tuned text only models (8B, 70B, 405B) are optimized for multilingual dialogue use cases and outperform many of the available open source and closed chat models on common industry benchmarks.",
     input: {
@@ -1502,8 +1592,8 @@ var models = {
     lifecycle: "deprecated",
     aliases: ["accounts/fireworks/models/llama-v3p1-405b-instruct"]
   },
-  "fireworks:llama-v3p1-70b-instruct": {
-    id: "fireworks:llama-v3p1-70b-instruct",
+  "fireworks-ai:llama-v3p1-70b-instruct": {
+    id: "fireworks-ai:llama-v3p1-70b-instruct",
     name: "Llama 3.1 70B Instruct",
     description: "The Meta Llama 3.1 collection of multilingual large language models (LLMs) is a collection of pretrained and instruction tuned generative models in 8B, 70B and 405B sizes. The Llama 3.1 instruction tuned text only models (8B, 70B, 405B) are optimized for multilingual dialogue use cases and outperform many of the available open source and closed chat models on common industry benchmarks.",
     input: {
@@ -1518,8 +1608,8 @@ var models = {
     lifecycle: "deprecated",
     aliases: ["accounts/fireworks/models/llama-v3p1-70b-instruct"]
   },
-  "fireworks:llama-v3p1-8b-instruct": {
-    id: "fireworks:llama-v3p1-8b-instruct",
+  "fireworks-ai:llama-v3p1-8b-instruct": {
+    id: "fireworks-ai:llama-v3p1-8b-instruct",
     name: "Llama 3.1 8B Instruct",
     description: "The Meta Llama 3.1 collection of multilingual large language models (LLMs) is a collection of pretrained and instruction tuned generative models in 8B, 70B and 405B sizes. The Llama 3.1 instruction tuned text only models (8B, 70B, 405B) are optimized for multilingual dialogue use cases and outperform many of the available open source and closed chat models on common industry benchmarks.",
     input: {
@@ -1534,8 +1624,8 @@ var models = {
     lifecycle: "live",
     aliases: ["accounts/fireworks/models/llama-v3p1-8b-instruct"]
   },
-  "fireworks:mixtral-8x22b-instruct": {
-    id: "fireworks:mixtral-8x22b-instruct",
+  "fireworks-ai:mixtral-8x22b-instruct": {
+    id: "fireworks-ai:mixtral-8x22b-instruct",
     name: "Mixtral MoE 8x22B Instruct",
     description: "Mistral MoE 8x22B Instruct v0.1 model with Sparse Mixture of Experts. Fine tuned for instruction following.",
     input: {
@@ -1550,8 +1640,8 @@ var models = {
     lifecycle: "live",
     aliases: ["accounts/fireworks/models/mixtral-8x22b-instruct"]
   },
-  "fireworks:mixtral-8x7b-instruct": {
-    id: "fireworks:mixtral-8x7b-instruct",
+  "fireworks-ai:mixtral-8x7b-instruct": {
+    id: "fireworks-ai:mixtral-8x7b-instruct",
     name: "Mixtral MoE 8x7B Instruct",
     description: "Mistral MoE 8x7B Instruct v0.1 model with Sparse Mixture of Experts. Fine tuned for instruction following",
     input: {
@@ -1566,8 +1656,8 @@ var models = {
     lifecycle: "live",
     aliases: ["accounts/fireworks/models/mixtral-8x7b-instruct"]
   },
-  "fireworks:mythomax-l2-13b": {
-    id: "fireworks:mythomax-l2-13b",
+  "fireworks-ai:mythomax-l2-13b": {
+    id: "fireworks-ai:mythomax-l2-13b",
     name: "MythoMax L2 13b",
     description: "MythoMax L2 is designed to excel at both roleplaying and storytelling, and is an improved variant of the previous MythoMix model, combining the MythoLogic-L2 and Huginn models.",
     input: {
@@ -1582,8 +1672,8 @@ var models = {
     lifecycle: "live",
     aliases: ["accounts/fireworks/models/mythomax-l2-13b"]
   },
-  "fireworks:gemma2-9b-it": {
-    id: "fireworks:gemma2-9b-it",
+  "fireworks-ai:gemma2-9b-it": {
+    id: "fireworks-ai:gemma2-9b-it",
     name: "Gemma 2 9B Instruct",
     description: "Redesigned for outsized performance and unmatched efficiency, Gemma 2 optimizes for blazing-fast inference on diverse hardware. Gemma is a family of lightweight, state-of-the-art open models from Google, built from the same research and technology used to create the Gemini models. They are text-to-text, decoder-only large language models, available in English, with open weights, pre-trained variants, and instruction-tuned variants. Gemma models are well-suited for a variety of text generation tasks, including question answering, summarization, and reasoning.",
     input: {
@@ -1717,7 +1807,7 @@ var CognitiveBeta = class {
     }
     const res = await this._withServerRetry(
       () => this._axiosClient.post(
-        "/v1/generate-text-stream",
+        "/v2/cognitive/generate-text-stream",
         { ...request, stream: true },
         {
           responseType: "stream",