@letta-ai/letta-client 1.7.12 → 1.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (47)
  1. package/CHANGELOG.md +30 -0
  2. package/package.json +12 -1
  3. package/resources/agents/agents.d.mts +309 -7
  4. package/resources/agents/agents.d.mts.map +1 -1
  5. package/resources/agents/agents.d.ts +309 -7
  6. package/resources/agents/agents.d.ts.map +1 -1
  7. package/resources/agents/agents.js.map +1 -1
  8. package/resources/agents/agents.mjs.map +1 -1
  9. package/resources/agents/messages.d.mts +163 -2
  10. package/resources/agents/messages.d.mts.map +1 -1
  11. package/resources/agents/messages.d.ts +163 -2
  12. package/resources/agents/messages.d.ts.map +1 -1
  13. package/resources/conversations/conversations.d.mts +306 -6
  14. package/resources/conversations/conversations.d.mts.map +1 -1
  15. package/resources/conversations/conversations.d.ts +306 -6
  16. package/resources/conversations/conversations.d.ts.map +1 -1
  17. package/resources/conversations/conversations.js.map +1 -1
  18. package/resources/conversations/conversations.mjs.map +1 -1
  19. package/resources/conversations/messages.d.mts +112 -2
  20. package/resources/conversations/messages.d.mts.map +1 -1
  21. package/resources/conversations/messages.d.ts +112 -2
  22. package/resources/conversations/messages.d.ts.map +1 -1
  23. package/resources/models/models.d.mts +13 -3
  24. package/resources/models/models.d.mts.map +1 -1
  25. package/resources/models/models.d.ts +13 -3
  26. package/resources/models/models.d.ts.map +1 -1
  27. package/resources/models/models.js.map +1 -1
  28. package/resources/models/models.mjs.map +1 -1
  29. package/resources/tools.d.mts +5 -0
  30. package/resources/tools.d.mts.map +1 -1
  31. package/resources/tools.d.ts +5 -0
  32. package/resources/tools.d.ts.map +1 -1
  33. package/src/resources/agents/agents.ts +387 -1
  34. package/src/resources/agents/messages.ts +187 -1
  35. package/src/resources/conversations/conversations.ts +384 -0
  36. package/src/resources/conversations/messages.ts +140 -0
  37. package/src/resources/models/models.ts +16 -1
  38. package/src/resources/tools.ts +5 -0
  39. package/src/version.ts +1 -1
  40. package/version.d.mts +1 -1
  41. package/version.d.mts.map +1 -1
  42. package/version.d.ts +1 -1
  43. package/version.d.ts.map +1 -1
  44. package/version.js +1 -1
  45. package/version.js.map +1 -1
  46. package/version.mjs +1 -1
  47. package/version.mjs.map +1 -1
package/CHANGELOG.md CHANGED
@@ -1,5 +1,35 @@
1
1
  # Changelog
2
2
 
3
+ ## 1.8.0 (2026-03-20)
4
+
5
+ Full Changelog: [v1.7.12...v1.8.0](https://github.com/letta-ai/letta-node/compare/v1.7.12...v1.8.0)
6
+
7
+ ### Features
8
+
9
+ * add zai coding provider ([88e56a9](https://github.com/letta-ai/letta-node/commit/88e56a9498385d6a37f2c96806c882a856cd6f68))
10
+ * always create otid for request ([488b66b](https://github.com/letta-ai/letta-node/commit/488b66b6443a290d49e84a2d25d11b4c0b007822))
11
+
12
+
13
+ ### Bug Fixes
14
+
15
+ * surface error when system prompt is large during compaction ([be4ef7f](https://github.com/letta-ai/letta-node/commit/be4ef7f6d547247430cda5f72e7bce1939896c27))
16
+
17
+
18
+ ### Chores
19
+
20
+ * **internal:** tweak CI branches ([176a3a7](https://github.com/letta-ai/letta-node/commit/176a3a71f8c12afb5cf27a4e9913509a2f4a360c))
21
+ * **internal:** update dependencies to address dependabot vulnerabilities ([2074604](https://github.com/letta-ai/letta-node/commit/20746042d8107a5fd2a5a59152c583593bade6a8))
22
+
23
+
24
+ ### Documentation
25
+
26
+ * add OTID field description for idempotency context ([7c59ce1](https://github.com/letta-ai/letta-node/commit/7c59ce1f8c38d8172e44b91fafee619dd0403c0d))
27
+
28
+
29
+ ### Refactors
30
+
31
+ * **sglang:** use input_ids instead of text in native adapter ([08679c1](https://github.com/letta-ai/letta-node/commit/08679c16d8ce0818fe8f72e77ae5dd366affc819))
32
+
3
33
  ## 1.7.12 (2026-03-09)
4
34
 
5
35
  Full Changelog: [v1.7.11...v1.7.12](https://github.com/letta-ai/letta-node/compare/v1.7.11...v1.7.12)
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@letta-ai/letta-client",
3
- "version": "1.7.12",
3
+ "version": "1.8.0",
4
4
  "description": "The official TypeScript library for the Letta API",
5
5
  "author": "Letta <>",
6
6
  "types": "./index.d.ts",
@@ -25,6 +25,17 @@
25
25
  "fix": "./scripts/format"
26
26
  },
27
27
  "dependencies": {},
28
+ "overrides": {
29
+ "minimatch": "^9.0.5"
30
+ },
31
+ "pnpm": {
32
+ "overrides": {
33
+ "minimatch": "^9.0.5"
34
+ }
35
+ },
36
+ "resolutions": {
37
+ "minimatch": "^9.0.5"
38
+ },
28
39
  "exports": {
29
40
  ".": {
30
41
  "require": {
package/resources/agents/agents.d.mts CHANGED
@@ -269,7 +269,7 @@ export interface AgentState {
269
269
  /**
270
270
  * The model settings used by the agent.
271
271
  */
272
- model_settings?: OpenAIModelSettings | AnthropicModelSettings | GoogleAIModelSettings | GoogleVertexModelSettings | AzureModelSettings | XaiModelSettings | AgentState.ZaiModelSettings | GroqModelSettings | DeepseekModelSettings | TogetherModelSettings | BedrockModelSettings | AgentState.OpenRouterModelSettings | AgentState.ChatGptoAuthModelSettings | null;
272
+ model_settings?: OpenAIModelSettings | AgentState.SgLangModelSettings | AnthropicModelSettings | GoogleAIModelSettings | GoogleVertexModelSettings | AzureModelSettings | XaiModelSettings | AgentState.ZaiModelSettings | GroqModelSettings | DeepseekModelSettings | TogetherModelSettings | BedrockModelSettings | AgentState.OpenRouterModelSettings | AgentState.ChatGptoAuthModelSettings | null;
273
273
  /**
274
274
  * @deprecated Deprecated: Use `managed_group` field instead. The multi-agent group
275
275
  * that this agent manages.
@@ -525,7 +525,7 @@ export declare namespace AgentState {
525
525
  /**
526
526
  * Optional model settings used to override defaults for the summarizer model.
527
527
  */
528
- model_settings?: AgentsAPI.OpenAIModelSettings | AgentsAPI.AnthropicModelSettings | AgentsAPI.GoogleAIModelSettings | AgentsAPI.GoogleVertexModelSettings | AgentsAPI.AzureModelSettings | AgentsAPI.XaiModelSettings | CompactionSettings.ZaiModelSettings | AgentsAPI.GroqModelSettings | AgentsAPI.DeepseekModelSettings | AgentsAPI.TogetherModelSettings | AgentsAPI.BedrockModelSettings | CompactionSettings.OpenRouterModelSettings | CompactionSettings.ChatGptoAuthModelSettings | null;
528
+ model_settings?: AgentsAPI.OpenAIModelSettings | CompactionSettings.SgLangModelSettings | AgentsAPI.AnthropicModelSettings | AgentsAPI.GoogleAIModelSettings | AgentsAPI.GoogleVertexModelSettings | AgentsAPI.AzureModelSettings | AgentsAPI.XaiModelSettings | CompactionSettings.ZaiModelSettings | AgentsAPI.GroqModelSettings | AgentsAPI.DeepseekModelSettings | AgentsAPI.TogetherModelSettings | AgentsAPI.BedrockModelSettings | CompactionSettings.OpenRouterModelSettings | CompactionSettings.ChatGptoAuthModelSettings | null;
529
529
  /**
530
530
  * The prompt to use for summarization. If None, uses mode-specific default.
531
531
  */
@@ -542,6 +542,56 @@ export declare namespace AgentState {
542
542
  sliding_window_percentage?: number;
543
543
  }
544
544
  namespace CompactionSettings {
545
+ /**
546
+ * SGLang model configuration (OpenAI-compatible runtime with SGLang-specific
547
+ * parsing).
548
+ */
549
+ interface SgLangModelSettings {
550
+ /**
551
+ * The maximum number of tokens the model can generate.
552
+ */
553
+ max_output_tokens?: number;
554
+ /**
555
+ * Whether to enable parallel tool calling.
556
+ */
557
+ parallel_tool_calls?: boolean;
558
+ /**
559
+ * The type of the provider.
560
+ */
561
+ provider_type?: 'sglang';
562
+ /**
563
+ * The reasoning configuration for the model.
564
+ */
565
+ reasoning?: SgLangModelSettings.Reasoning;
566
+ /**
567
+ * The response format for the model.
568
+ */
569
+ response_format?: AgentsAPI.TextResponseFormat | AgentsAPI.JsonSchemaResponseFormat | AgentsAPI.JsonObjectResponseFormat | null;
570
+ /**
571
+ * Enable strict mode for tool calling. When true, tool outputs are guaranteed to
572
+ * match JSON schemas.
573
+ */
574
+ strict?: boolean;
575
+ /**
576
+ * The temperature of the model.
577
+ */
578
+ temperature?: number;
579
+ /**
580
+ * SGLang tool call parser name (for example 'glm47', 'qwen25', or 'hermes').
581
+ */
582
+ tool_call_parser?: string | null;
583
+ }
584
+ namespace SgLangModelSettings {
585
+ /**
586
+ * The reasoning configuration for the model.
587
+ */
588
+ interface Reasoning {
589
+ /**
590
+ * The reasoning effort to use when generating text reasoning models
591
+ */
592
+ reasoning_effort?: 'none' | 'minimal' | 'low' | 'medium' | 'high' | 'xhigh';
593
+ }
594
+ }
545
595
  /**
546
596
  * Z.ai (ZhipuAI) model configuration (OpenAI-compatible).
547
597
  */
@@ -756,6 +806,56 @@ export declare namespace AgentState {
756
806
  termination_token?: string | null;
757
807
  turns_counter?: number | null;
758
808
  }
809
+ /**
810
+ * SGLang model configuration (OpenAI-compatible runtime with SGLang-specific
811
+ * parsing).
812
+ */
813
+ interface SgLangModelSettings {
814
+ /**
815
+ * The maximum number of tokens the model can generate.
816
+ */
817
+ max_output_tokens?: number;
818
+ /**
819
+ * Whether to enable parallel tool calling.
820
+ */
821
+ parallel_tool_calls?: boolean;
822
+ /**
823
+ * The type of the provider.
824
+ */
825
+ provider_type?: 'sglang';
826
+ /**
827
+ * The reasoning configuration for the model.
828
+ */
829
+ reasoning?: SgLangModelSettings.Reasoning;
830
+ /**
831
+ * The response format for the model.
832
+ */
833
+ response_format?: AgentsAPI.TextResponseFormat | AgentsAPI.JsonSchemaResponseFormat | AgentsAPI.JsonObjectResponseFormat | null;
834
+ /**
835
+ * Enable strict mode for tool calling. When true, tool outputs are guaranteed to
836
+ * match JSON schemas.
837
+ */
838
+ strict?: boolean;
839
+ /**
840
+ * The temperature of the model.
841
+ */
842
+ temperature?: number;
843
+ /**
844
+ * SGLang tool call parser name (for example 'glm47', 'qwen25', or 'hermes').
845
+ */
846
+ tool_call_parser?: string | null;
847
+ }
848
+ namespace SgLangModelSettings {
849
+ /**
850
+ * The reasoning configuration for the model.
851
+ */
852
+ interface Reasoning {
853
+ /**
854
+ * The reasoning effort to use when generating text reasoning models
855
+ */
856
+ reasoning_effort?: 'none' | 'minimal' | 'low' | 'medium' | 'high' | 'xhigh';
857
+ }
858
+ }
759
859
  /**
760
860
  * Z.ai (ZhipuAI) model configuration (OpenAI-compatible).
761
861
  */
@@ -1344,7 +1444,9 @@ export interface MessageCreate {
1344
1444
  */
1345
1445
  name?: string | null;
1346
1446
  /**
1347
- * The offline threading id associated with this message
1447
+ * The offline threading id (OTID). Set by the client to deduplicate requests. Used
1448
+ * for idempotency in background streaming mode — each message in a request must
1449
+ * have a unique OTID. Retries of the same request should reuse the same OTIDs.
1348
1450
  */
1349
1451
  otid?: string | null;
1350
1452
  /**
@@ -1679,7 +1781,7 @@ export interface AgentCreateParams {
1679
1781
  /**
1680
1782
  * The model settings for the agent.
1681
1783
  */
1682
- model_settings?: OpenAIModelSettings | AnthropicModelSettings | GoogleAIModelSettings | GoogleVertexModelSettings | AzureModelSettings | XaiModelSettings | AgentCreateParams.ZaiModelSettings | GroqModelSettings | DeepseekModelSettings | TogetherModelSettings | BedrockModelSettings | AgentCreateParams.OpenRouterModelSettings | AgentCreateParams.ChatGptoAuthModelSettings | null;
1784
+ model_settings?: OpenAIModelSettings | AgentCreateParams.SgLangModelSettings | AnthropicModelSettings | GoogleAIModelSettings | GoogleVertexModelSettings | AzureModelSettings | XaiModelSettings | AgentCreateParams.ZaiModelSettings | GroqModelSettings | DeepseekModelSettings | TogetherModelSettings | BedrockModelSettings | AgentCreateParams.OpenRouterModelSettings | AgentCreateParams.ChatGptoAuthModelSettings | null;
1683
1785
  /**
1684
1786
  * The name of the agent.
1685
1787
  */
@@ -1792,7 +1894,7 @@ export declare namespace AgentCreateParams {
1792
1894
  /**
1793
1895
  * Optional model settings used to override defaults for the summarizer model.
1794
1896
  */
1795
- model_settings?: AgentsAPI.OpenAIModelSettings | AgentsAPI.AnthropicModelSettings | AgentsAPI.GoogleAIModelSettings | AgentsAPI.GoogleVertexModelSettings | AgentsAPI.AzureModelSettings | AgentsAPI.XaiModelSettings | CompactionSettings.ZaiModelSettings | AgentsAPI.GroqModelSettings | AgentsAPI.DeepseekModelSettings | AgentsAPI.TogetherModelSettings | AgentsAPI.BedrockModelSettings | CompactionSettings.OpenRouterModelSettings | CompactionSettings.ChatGptoAuthModelSettings | null;
1897
+ model_settings?: AgentsAPI.OpenAIModelSettings | CompactionSettings.SgLangModelSettings | AgentsAPI.AnthropicModelSettings | AgentsAPI.GoogleAIModelSettings | AgentsAPI.GoogleVertexModelSettings | AgentsAPI.AzureModelSettings | AgentsAPI.XaiModelSettings | CompactionSettings.ZaiModelSettings | AgentsAPI.GroqModelSettings | AgentsAPI.DeepseekModelSettings | AgentsAPI.TogetherModelSettings | AgentsAPI.BedrockModelSettings | CompactionSettings.OpenRouterModelSettings | CompactionSettings.ChatGptoAuthModelSettings | null;
1796
1898
  /**
1797
1899
  * The prompt to use for summarization. If None, uses mode-specific default.
1798
1900
  */
@@ -1809,6 +1911,56 @@ export declare namespace AgentCreateParams {
1809
1911
  sliding_window_percentage?: number;
1810
1912
  }
1811
1913
  namespace CompactionSettings {
1914
+ /**
1915
+ * SGLang model configuration (OpenAI-compatible runtime with SGLang-specific
1916
+ * parsing).
1917
+ */
1918
+ interface SgLangModelSettings {
1919
+ /**
1920
+ * The maximum number of tokens the model can generate.
1921
+ */
1922
+ max_output_tokens?: number;
1923
+ /**
1924
+ * Whether to enable parallel tool calling.
1925
+ */
1926
+ parallel_tool_calls?: boolean;
1927
+ /**
1928
+ * The type of the provider.
1929
+ */
1930
+ provider_type?: 'sglang';
1931
+ /**
1932
+ * The reasoning configuration for the model.
1933
+ */
1934
+ reasoning?: SgLangModelSettings.Reasoning;
1935
+ /**
1936
+ * The response format for the model.
1937
+ */
1938
+ response_format?: AgentsAPI.TextResponseFormat | AgentsAPI.JsonSchemaResponseFormat | AgentsAPI.JsonObjectResponseFormat | null;
1939
+ /**
1940
+ * Enable strict mode for tool calling. When true, tool outputs are guaranteed to
1941
+ * match JSON schemas.
1942
+ */
1943
+ strict?: boolean;
1944
+ /**
1945
+ * The temperature of the model.
1946
+ */
1947
+ temperature?: number;
1948
+ /**
1949
+ * SGLang tool call parser name (for example 'glm47', 'qwen25', or 'hermes').
1950
+ */
1951
+ tool_call_parser?: string | null;
1952
+ }
1953
+ namespace SgLangModelSettings {
1954
+ /**
1955
+ * The reasoning configuration for the model.
1956
+ */
1957
+ interface Reasoning {
1958
+ /**
1959
+ * The reasoning effort to use when generating text reasoning models
1960
+ */
1961
+ reasoning_effort?: 'none' | 'minimal' | 'low' | 'medium' | 'high' | 'xhigh';
1962
+ }
1963
+ }
1812
1964
  /**
1813
1965
  * Z.ai (ZhipuAI) model configuration (OpenAI-compatible).
1814
1966
  */
@@ -1915,6 +2067,56 @@ export declare namespace AgentCreateParams {
1915
2067
  }
1916
2068
  }
1917
2069
  }
2070
+ /**
2071
+ * SGLang model configuration (OpenAI-compatible runtime with SGLang-specific
2072
+ * parsing).
2073
+ */
2074
+ interface SgLangModelSettings {
2075
+ /**
2076
+ * The maximum number of tokens the model can generate.
2077
+ */
2078
+ max_output_tokens?: number;
2079
+ /**
2080
+ * Whether to enable parallel tool calling.
2081
+ */
2082
+ parallel_tool_calls?: boolean;
2083
+ /**
2084
+ * The type of the provider.
2085
+ */
2086
+ provider_type?: 'sglang';
2087
+ /**
2088
+ * The reasoning configuration for the model.
2089
+ */
2090
+ reasoning?: SgLangModelSettings.Reasoning;
2091
+ /**
2092
+ * The response format for the model.
2093
+ */
2094
+ response_format?: AgentsAPI.TextResponseFormat | AgentsAPI.JsonSchemaResponseFormat | AgentsAPI.JsonObjectResponseFormat | null;
2095
+ /**
2096
+ * Enable strict mode for tool calling. When true, tool outputs are guaranteed to
2097
+ * match JSON schemas.
2098
+ */
2099
+ strict?: boolean;
2100
+ /**
2101
+ * The temperature of the model.
2102
+ */
2103
+ temperature?: number;
2104
+ /**
2105
+ * SGLang tool call parser name (for example 'glm47', 'qwen25', or 'hermes').
2106
+ */
2107
+ tool_call_parser?: string | null;
2108
+ }
2109
+ namespace SgLangModelSettings {
2110
+ /**
2111
+ * The reasoning configuration for the model.
2112
+ */
2113
+ interface Reasoning {
2114
+ /**
2115
+ * The reasoning effort to use when generating text reasoning models
2116
+ */
2117
+ reasoning_effort?: 'none' | 'minimal' | 'low' | 'medium' | 'high' | 'xhigh';
2118
+ }
2119
+ }
1918
2120
  /**
1919
2121
  * Z.ai (ZhipuAI) model configuration (OpenAI-compatible).
1920
2122
  */
@@ -2137,7 +2339,7 @@ export interface AgentUpdateParams {
2137
2339
  /**
2138
2340
  * The model settings for the agent.
2139
2341
  */
2140
- model_settings?: OpenAIModelSettings | AnthropicModelSettings | GoogleAIModelSettings | GoogleVertexModelSettings | AzureModelSettings | XaiModelSettings | AgentUpdateParams.ZaiModelSettings | GroqModelSettings | DeepseekModelSettings | TogetherModelSettings | BedrockModelSettings | AgentUpdateParams.OpenRouterModelSettings | AgentUpdateParams.ChatGptoAuthModelSettings | null;
2342
+ model_settings?: OpenAIModelSettings | AgentUpdateParams.SgLangModelSettings | AnthropicModelSettings | GoogleAIModelSettings | GoogleVertexModelSettings | AzureModelSettings | XaiModelSettings | AgentUpdateParams.ZaiModelSettings | GroqModelSettings | DeepseekModelSettings | TogetherModelSettings | BedrockModelSettings | AgentUpdateParams.OpenRouterModelSettings | AgentUpdateParams.ChatGptoAuthModelSettings | null;
2141
2343
  /**
2142
2344
  * The name of the agent.
2143
2345
  */
@@ -2233,7 +2435,7 @@ export declare namespace AgentUpdateParams {
2233
2435
  /**
2234
2436
  * Optional model settings used to override defaults for the summarizer model.
2235
2437
  */
2236
- model_settings?: AgentsAPI.OpenAIModelSettings | AgentsAPI.AnthropicModelSettings | AgentsAPI.GoogleAIModelSettings | AgentsAPI.GoogleVertexModelSettings | AgentsAPI.AzureModelSettings | AgentsAPI.XaiModelSettings | CompactionSettings.ZaiModelSettings | AgentsAPI.GroqModelSettings | AgentsAPI.DeepseekModelSettings | AgentsAPI.TogetherModelSettings | AgentsAPI.BedrockModelSettings | CompactionSettings.OpenRouterModelSettings | CompactionSettings.ChatGptoAuthModelSettings | null;
2438
+ model_settings?: AgentsAPI.OpenAIModelSettings | CompactionSettings.SgLangModelSettings | AgentsAPI.AnthropicModelSettings | AgentsAPI.GoogleAIModelSettings | AgentsAPI.GoogleVertexModelSettings | AgentsAPI.AzureModelSettings | AgentsAPI.XaiModelSettings | CompactionSettings.ZaiModelSettings | AgentsAPI.GroqModelSettings | AgentsAPI.DeepseekModelSettings | AgentsAPI.TogetherModelSettings | AgentsAPI.BedrockModelSettings | CompactionSettings.OpenRouterModelSettings | CompactionSettings.ChatGptoAuthModelSettings | null;
2237
2439
  /**
2238
2440
  * The prompt to use for summarization. If None, uses mode-specific default.
2239
2441
  */
@@ -2250,6 +2452,56 @@ export declare namespace AgentUpdateParams {
2250
2452
  sliding_window_percentage?: number;
2251
2453
  }
2252
2454
  namespace CompactionSettings {
2455
+ /**
2456
+ * SGLang model configuration (OpenAI-compatible runtime with SGLang-specific
2457
+ * parsing).
2458
+ */
2459
+ interface SgLangModelSettings {
2460
+ /**
2461
+ * The maximum number of tokens the model can generate.
2462
+ */
2463
+ max_output_tokens?: number;
2464
+ /**
2465
+ * Whether to enable parallel tool calling.
2466
+ */
2467
+ parallel_tool_calls?: boolean;
2468
+ /**
2469
+ * The type of the provider.
2470
+ */
2471
+ provider_type?: 'sglang';
2472
+ /**
2473
+ * The reasoning configuration for the model.
2474
+ */
2475
+ reasoning?: SgLangModelSettings.Reasoning;
2476
+ /**
2477
+ * The response format for the model.
2478
+ */
2479
+ response_format?: AgentsAPI.TextResponseFormat | AgentsAPI.JsonSchemaResponseFormat | AgentsAPI.JsonObjectResponseFormat | null;
2480
+ /**
2481
+ * Enable strict mode for tool calling. When true, tool outputs are guaranteed to
2482
+ * match JSON schemas.
2483
+ */
2484
+ strict?: boolean;
2485
+ /**
2486
+ * The temperature of the model.
2487
+ */
2488
+ temperature?: number;
2489
+ /**
2490
+ * SGLang tool call parser name (for example 'glm47', 'qwen25', or 'hermes').
2491
+ */
2492
+ tool_call_parser?: string | null;
2493
+ }
2494
+ namespace SgLangModelSettings {
2495
+ /**
2496
+ * The reasoning configuration for the model.
2497
+ */
2498
+ interface Reasoning {
2499
+ /**
2500
+ * The reasoning effort to use when generating text reasoning models
2501
+ */
2502
+ reasoning_effort?: 'none' | 'minimal' | 'low' | 'medium' | 'high' | 'xhigh';
2503
+ }
2504
+ }
2253
2505
  /**
2254
2506
  * Z.ai (ZhipuAI) model configuration (OpenAI-compatible).
2255
2507
  */
@@ -2356,6 +2608,56 @@ export declare namespace AgentUpdateParams {
2356
2608
  }
2357
2609
  }
2358
2610
  }
2611
+ /**
2612
+ * SGLang model configuration (OpenAI-compatible runtime with SGLang-specific
2613
+ * parsing).
2614
+ */
2615
+ interface SgLangModelSettings {
2616
+ /**
2617
+ * The maximum number of tokens the model can generate.
2618
+ */
2619
+ max_output_tokens?: number;
2620
+ /**
2621
+ * Whether to enable parallel tool calling.
2622
+ */
2623
+ parallel_tool_calls?: boolean;
2624
+ /**
2625
+ * The type of the provider.
2626
+ */
2627
+ provider_type?: 'sglang';
2628
+ /**
2629
+ * The reasoning configuration for the model.
2630
+ */
2631
+ reasoning?: SgLangModelSettings.Reasoning;
2632
+ /**
2633
+ * The response format for the model.
2634
+ */
2635
+ response_format?: AgentsAPI.TextResponseFormat | AgentsAPI.JsonSchemaResponseFormat | AgentsAPI.JsonObjectResponseFormat | null;
2636
+ /**
2637
+ * Enable strict mode for tool calling. When true, tool outputs are guaranteed to
2638
+ * match JSON schemas.
2639
+ */
2640
+ strict?: boolean;
2641
+ /**
2642
+ * The temperature of the model.
2643
+ */
2644
+ temperature?: number;
2645
+ /**
2646
+ * SGLang tool call parser name (for example 'glm47', 'qwen25', or 'hermes').
2647
+ */
2648
+ tool_call_parser?: string | null;
2649
+ }
2650
+ namespace SgLangModelSettings {
2651
+ /**
2652
+ * The reasoning configuration for the model.
2653
+ */
2654
+ interface Reasoning {
2655
+ /**
2656
+ * The reasoning effort to use when generating text reasoning models
2657
+ */
2658
+ reasoning_effort?: 'none' | 'minimal' | 'low' | 'medium' | 'high' | 'xhigh';
2659
+ }
2660
+ }
2359
2661
  /**
2360
2662
  * Z.ai (ZhipuAI) model configuration (OpenAI-compatible).
2361
2663
  */