weave-typescript 0.40.0 → 0.42.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -3,204 +3,204 @@
3
3
  // versions:
4
4
  // protoc-gen-ts_proto v2.11.8
5
5
  // protoc unknown
6
- // source: weaveapi/inference/v1/inference.proto
6
+ // source: weaveapi/gateway/v1/gateway.proto
7
7
  Object.defineProperty(exports, "__esModule", { value: true });
8
- exports.OpenAIImageData = exports.OpenAICompatibilityServiceGenerateImageRequest = exports.OpenAICompatibilityServiceCreateEmbeddingResponse = exports.OpenAIEmbeddingData = exports.OpenAICompatibilityServiceCreateEmbeddingRequest = exports.OpenAICompatibilityServiceStreamChatCompletionResponse = exports.OpenAICompatibilityServiceStreamChatCompletionRequest = exports.OpenAIChatDeltaChoice = exports.OpenAICompatibilityServiceCreateChatCompletionResponse = exports.OpenAIChatChoice = exports.OpenAICompatibilityServiceCreateChatCompletionRequest = exports.OpenAIChatToolCall = exports.OpenAIFunctionCall = exports.OpenAIResponseFormat = exports.OpenAIToolDefinition = exports.OpenAIFunctionDefinition = exports.OpenAIChatMessage = exports.CallMCPResponse = exports.CallMCPRequest = exports.GenerateImagesResponse = exports.GenerateImagesRequest = exports.CreateEmbeddingsResponse = exports.CreateEmbeddingsRequest = exports.CallToolsResponse = exports.CallToolsRequest = exports.StreamChatCompletionResponse = exports.StreamChatCompletionRequest = exports.CreateChatCompletionResponse = exports.CreateChatCompletionRequest = exports.GeneratedImage = exports.EmbeddingVector = exports.EmbeddingInput = exports.ChatMessage = exports.InferenceContentPart = exports.ToolResult = exports.ToolCall = exports.ToolDefinition = exports.StructuredOutputSchema = exports.InferenceGenerationConfig = exports.InferenceUsage = exports.InferenceTokenUsageBreakdown = exports.ResolvedInferenceContext = exports.InferenceRequestContext = exports.InferenceTokenKind = exports.ImageDeliveryMode = exports.ToolChoiceMode = exports.InferenceFinishReason = exports.InferenceMessageRole = exports.InferenceOperationType = exports.protobufPackage = void 0;
9
- exports.AnthropicCompatibilityServiceStreamMessagesResponse = exports.AnthropicCompatibilityServiceStreamMessagesRequest = exports.AnthropicCompatibilityServiceCreateMessageResponse = exports.AnthropicUsage = exports.AnthropicContentBlock = exports.AnthropicCompatibilityServiceCreateMessageRequest = exports.AnthropicToolDefinition = exports.AnthropicMessage = exports.OpenAICompatibilityServiceGenerateImageResponse = void 0;
10
- exports.inferenceOperationTypeFromJSON = inferenceOperationTypeFromJSON;
11
- exports.inferenceOperationTypeToJSON = inferenceOperationTypeToJSON;
12
- exports.inferenceMessageRoleFromJSON = inferenceMessageRoleFromJSON;
13
- exports.inferenceMessageRoleToJSON = inferenceMessageRoleToJSON;
14
- exports.inferenceFinishReasonFromJSON = inferenceFinishReasonFromJSON;
15
- exports.inferenceFinishReasonToJSON = inferenceFinishReasonToJSON;
8
+ exports.OpenAICompatibilityServiceGenerateImageRequest = exports.OpenAICompatibilityServiceCreateEmbeddingResponse = exports.OpenAIEmbeddingData = exports.OpenAICompatibilityServiceCreateEmbeddingRequest = exports.OpenAICompatibilityServiceStreamChatCompletionResponse = exports.OpenAICompatibilityServiceStreamChatCompletionRequest = exports.OpenAIChatDeltaChoice = exports.OpenAICompatibilityServiceCreateChatCompletionResponse = exports.OpenAIChatChoice = exports.OpenAICompatibilityServiceCreateChatCompletionRequest = exports.OpenAIChatToolCall = exports.OpenAIFunctionCall = exports.OpenAIResponseFormat = exports.OpenAIToolDefinition = exports.OpenAIFunctionDefinition = exports.OpenAIChatMessage = exports.CallMCPResponse = exports.CallMCPRequest = exports.GenerateImagesResponse = exports.GenerateImagesRequest = exports.CreateEmbeddingsResponse = exports.CreateEmbeddingsRequest = exports.CallToolsResponse = exports.CallToolsRequest = exports.StreamChatCompletionResponse = exports.StreamChatCompletionRequest = exports.CreateChatCompletionResponse = exports.CreateChatCompletionRequest = exports.GeneratedImage = exports.EmbeddingVector = exports.EmbeddingInput = exports.ChatMessage = exports.ContentPart = exports.ToolResult = exports.ToolCallDelta = exports.ToolCall = exports.ToolDefinition = exports.StructuredOutputSchema = exports.GenerationConfig = exports.Usage = exports.TokenUsageBreakdown = exports.ResolvedModelRoute = exports.RequestContext = exports.TokenKind = exports.ImageDeliveryMode = exports.ToolChoiceMode = exports.FinishReason = exports.MessageRole = exports.ModelOperation = exports.protobufPackage = void 0;
9
+ exports.AnthropicCompatibilityServiceStreamMessagesResponse = exports.AnthropicCompatibilityServiceStreamMessagesRequest = exports.AnthropicCompatibilityServiceCreateMessageResponse = exports.AnthropicUsage = exports.AnthropicContentBlock = exports.AnthropicCompatibilityServiceCreateMessageRequest = exports.AnthropicToolDefinition = exports.AnthropicMessage = exports.OpenAICompatibilityServiceGenerateImageResponse = exports.OpenAIImageData = void 0;
10
+ exports.modelOperationFromJSON = modelOperationFromJSON;
11
+ exports.modelOperationToJSON = modelOperationToJSON;
12
+ exports.messageRoleFromJSON = messageRoleFromJSON;
13
+ exports.messageRoleToJSON = messageRoleToJSON;
14
+ exports.finishReasonFromJSON = finishReasonFromJSON;
15
+ exports.finishReasonToJSON = finishReasonToJSON;
16
16
  exports.toolChoiceModeFromJSON = toolChoiceModeFromJSON;
17
17
  exports.toolChoiceModeToJSON = toolChoiceModeToJSON;
18
18
  exports.imageDeliveryModeFromJSON = imageDeliveryModeFromJSON;
19
19
  exports.imageDeliveryModeToJSON = imageDeliveryModeToJSON;
20
- exports.inferenceTokenKindFromJSON = inferenceTokenKindFromJSON;
21
- exports.inferenceTokenKindToJSON = inferenceTokenKindToJSON;
20
+ exports.tokenKindFromJSON = tokenKindFromJSON;
21
+ exports.tokenKindToJSON = tokenKindToJSON;
22
22
  /* eslint-disable */
23
23
  const wire_1 = require("@bufbuild/protobuf/wire");
24
24
  const struct_pb_1 = require("../../../google/protobuf/struct.pb");
25
25
  const timestamp_pb_1 = require("../../../google/protobuf/timestamp.pb");
26
26
  const provider_pb_1 = require("../../provider/v1/provider.pb");
27
- exports.protobufPackage = "weaveapi.inference.v1";
28
- /** InferenceOperationType identifies one canonical execution capability. */
29
- var InferenceOperationType;
30
- (function (InferenceOperationType) {
31
- InferenceOperationType[InferenceOperationType["INFERENCE_OPERATION_TYPE_UNSPECIFIED"] = 0] = "INFERENCE_OPERATION_TYPE_UNSPECIFIED";
32
- InferenceOperationType[InferenceOperationType["INFERENCE_OPERATION_TYPE_CHAT_COMPLETION"] = 1] = "INFERENCE_OPERATION_TYPE_CHAT_COMPLETION";
33
- InferenceOperationType[InferenceOperationType["INFERENCE_OPERATION_TYPE_STREAM_CHAT_COMPLETION"] = 2] = "INFERENCE_OPERATION_TYPE_STREAM_CHAT_COMPLETION";
34
- InferenceOperationType[InferenceOperationType["INFERENCE_OPERATION_TYPE_STRUCTURED_OUTPUT"] = 3] = "INFERENCE_OPERATION_TYPE_STRUCTURED_OUTPUT";
35
- InferenceOperationType[InferenceOperationType["INFERENCE_OPERATION_TYPE_TOOL_CALLING"] = 4] = "INFERENCE_OPERATION_TYPE_TOOL_CALLING";
36
- InferenceOperationType[InferenceOperationType["INFERENCE_OPERATION_TYPE_EMBEDDINGS"] = 5] = "INFERENCE_OPERATION_TYPE_EMBEDDINGS";
37
- InferenceOperationType[InferenceOperationType["INFERENCE_OPERATION_TYPE_IMAGE_GENERATION"] = 6] = "INFERENCE_OPERATION_TYPE_IMAGE_GENERATION";
38
- InferenceOperationType[InferenceOperationType["INFERENCE_OPERATION_TYPE_MCP_CALL"] = 7] = "INFERENCE_OPERATION_TYPE_MCP_CALL";
39
- InferenceOperationType[InferenceOperationType["UNRECOGNIZED"] = -1] = "UNRECOGNIZED";
40
- })(InferenceOperationType || (exports.InferenceOperationType = InferenceOperationType = {}));
41
- function inferenceOperationTypeFromJSON(object) {
27
+ exports.protobufPackage = "weaveapi.gateway.v1";
28
+ /** ModelOperation identifies one model gateway capability. */
29
+ var ModelOperation;
30
+ (function (ModelOperation) {
31
+ ModelOperation[ModelOperation["MODEL_OPERATION_UNSPECIFIED"] = 0] = "MODEL_OPERATION_UNSPECIFIED";
32
+ ModelOperation[ModelOperation["MODEL_OPERATION_CHAT_COMPLETION"] = 1] = "MODEL_OPERATION_CHAT_COMPLETION";
33
+ ModelOperation[ModelOperation["MODEL_OPERATION_STREAM_CHAT_COMPLETION"] = 2] = "MODEL_OPERATION_STREAM_CHAT_COMPLETION";
34
+ ModelOperation[ModelOperation["MODEL_OPERATION_STRUCTURED_OUTPUT"] = 3] = "MODEL_OPERATION_STRUCTURED_OUTPUT";
35
+ ModelOperation[ModelOperation["MODEL_OPERATION_TOOL_CALLING"] = 4] = "MODEL_OPERATION_TOOL_CALLING";
36
+ ModelOperation[ModelOperation["MODEL_OPERATION_EMBEDDINGS"] = 5] = "MODEL_OPERATION_EMBEDDINGS";
37
+ ModelOperation[ModelOperation["MODEL_OPERATION_IMAGE_GENERATION"] = 6] = "MODEL_OPERATION_IMAGE_GENERATION";
38
+ ModelOperation[ModelOperation["MODEL_OPERATION_MCP_CALL"] = 7] = "MODEL_OPERATION_MCP_CALL";
39
+ ModelOperation[ModelOperation["UNRECOGNIZED"] = -1] = "UNRECOGNIZED";
40
+ })(ModelOperation || (exports.ModelOperation = ModelOperation = {}));
41
+ function modelOperationFromJSON(object) {
42
42
  switch (object) {
43
43
  case 0:
44
- case "INFERENCE_OPERATION_TYPE_UNSPECIFIED":
45
- return InferenceOperationType.INFERENCE_OPERATION_TYPE_UNSPECIFIED;
44
+ case "MODEL_OPERATION_UNSPECIFIED":
45
+ return ModelOperation.MODEL_OPERATION_UNSPECIFIED;
46
46
  case 1:
47
- case "INFERENCE_OPERATION_TYPE_CHAT_COMPLETION":
48
- return InferenceOperationType.INFERENCE_OPERATION_TYPE_CHAT_COMPLETION;
47
+ case "MODEL_OPERATION_CHAT_COMPLETION":
48
+ return ModelOperation.MODEL_OPERATION_CHAT_COMPLETION;
49
49
  case 2:
50
- case "INFERENCE_OPERATION_TYPE_STREAM_CHAT_COMPLETION":
51
- return InferenceOperationType.INFERENCE_OPERATION_TYPE_STREAM_CHAT_COMPLETION;
50
+ case "MODEL_OPERATION_STREAM_CHAT_COMPLETION":
51
+ return ModelOperation.MODEL_OPERATION_STREAM_CHAT_COMPLETION;
52
52
  case 3:
53
- case "INFERENCE_OPERATION_TYPE_STRUCTURED_OUTPUT":
54
- return InferenceOperationType.INFERENCE_OPERATION_TYPE_STRUCTURED_OUTPUT;
53
+ case "MODEL_OPERATION_STRUCTURED_OUTPUT":
54
+ return ModelOperation.MODEL_OPERATION_STRUCTURED_OUTPUT;
55
55
  case 4:
56
- case "INFERENCE_OPERATION_TYPE_TOOL_CALLING":
57
- return InferenceOperationType.INFERENCE_OPERATION_TYPE_TOOL_CALLING;
56
+ case "MODEL_OPERATION_TOOL_CALLING":
57
+ return ModelOperation.MODEL_OPERATION_TOOL_CALLING;
58
58
  case 5:
59
- case "INFERENCE_OPERATION_TYPE_EMBEDDINGS":
60
- return InferenceOperationType.INFERENCE_OPERATION_TYPE_EMBEDDINGS;
59
+ case "MODEL_OPERATION_EMBEDDINGS":
60
+ return ModelOperation.MODEL_OPERATION_EMBEDDINGS;
61
61
  case 6:
62
- case "INFERENCE_OPERATION_TYPE_IMAGE_GENERATION":
63
- return InferenceOperationType.INFERENCE_OPERATION_TYPE_IMAGE_GENERATION;
62
+ case "MODEL_OPERATION_IMAGE_GENERATION":
63
+ return ModelOperation.MODEL_OPERATION_IMAGE_GENERATION;
64
64
  case 7:
65
- case "INFERENCE_OPERATION_TYPE_MCP_CALL":
66
- return InferenceOperationType.INFERENCE_OPERATION_TYPE_MCP_CALL;
65
+ case "MODEL_OPERATION_MCP_CALL":
66
+ return ModelOperation.MODEL_OPERATION_MCP_CALL;
67
67
  case -1:
68
68
  case "UNRECOGNIZED":
69
69
  default:
70
- return InferenceOperationType.UNRECOGNIZED;
70
+ return ModelOperation.UNRECOGNIZED;
71
71
  }
72
72
  }
73
- function inferenceOperationTypeToJSON(object) {
73
+ function modelOperationToJSON(object) {
74
74
  switch (object) {
75
- case InferenceOperationType.INFERENCE_OPERATION_TYPE_UNSPECIFIED:
76
- return "INFERENCE_OPERATION_TYPE_UNSPECIFIED";
77
- case InferenceOperationType.INFERENCE_OPERATION_TYPE_CHAT_COMPLETION:
78
- return "INFERENCE_OPERATION_TYPE_CHAT_COMPLETION";
79
- case InferenceOperationType.INFERENCE_OPERATION_TYPE_STREAM_CHAT_COMPLETION:
80
- return "INFERENCE_OPERATION_TYPE_STREAM_CHAT_COMPLETION";
81
- case InferenceOperationType.INFERENCE_OPERATION_TYPE_STRUCTURED_OUTPUT:
82
- return "INFERENCE_OPERATION_TYPE_STRUCTURED_OUTPUT";
83
- case InferenceOperationType.INFERENCE_OPERATION_TYPE_TOOL_CALLING:
84
- return "INFERENCE_OPERATION_TYPE_TOOL_CALLING";
85
- case InferenceOperationType.INFERENCE_OPERATION_TYPE_EMBEDDINGS:
86
- return "INFERENCE_OPERATION_TYPE_EMBEDDINGS";
87
- case InferenceOperationType.INFERENCE_OPERATION_TYPE_IMAGE_GENERATION:
88
- return "INFERENCE_OPERATION_TYPE_IMAGE_GENERATION";
89
- case InferenceOperationType.INFERENCE_OPERATION_TYPE_MCP_CALL:
90
- return "INFERENCE_OPERATION_TYPE_MCP_CALL";
91
- case InferenceOperationType.UNRECOGNIZED:
75
+ case ModelOperation.MODEL_OPERATION_UNSPECIFIED:
76
+ return "MODEL_OPERATION_UNSPECIFIED";
77
+ case ModelOperation.MODEL_OPERATION_CHAT_COMPLETION:
78
+ return "MODEL_OPERATION_CHAT_COMPLETION";
79
+ case ModelOperation.MODEL_OPERATION_STREAM_CHAT_COMPLETION:
80
+ return "MODEL_OPERATION_STREAM_CHAT_COMPLETION";
81
+ case ModelOperation.MODEL_OPERATION_STRUCTURED_OUTPUT:
82
+ return "MODEL_OPERATION_STRUCTURED_OUTPUT";
83
+ case ModelOperation.MODEL_OPERATION_TOOL_CALLING:
84
+ return "MODEL_OPERATION_TOOL_CALLING";
85
+ case ModelOperation.MODEL_OPERATION_EMBEDDINGS:
86
+ return "MODEL_OPERATION_EMBEDDINGS";
87
+ case ModelOperation.MODEL_OPERATION_IMAGE_GENERATION:
88
+ return "MODEL_OPERATION_IMAGE_GENERATION";
89
+ case ModelOperation.MODEL_OPERATION_MCP_CALL:
90
+ return "MODEL_OPERATION_MCP_CALL";
91
+ case ModelOperation.UNRECOGNIZED:
92
92
  default:
93
93
  return "UNRECOGNIZED";
94
94
  }
95
95
  }
96
- /** InferenceMessageRole identifies one participant role in a canonical message. */
97
- var InferenceMessageRole;
98
- (function (InferenceMessageRole) {
99
- InferenceMessageRole[InferenceMessageRole["INFERENCE_MESSAGE_ROLE_UNSPECIFIED"] = 0] = "INFERENCE_MESSAGE_ROLE_UNSPECIFIED";
100
- InferenceMessageRole[InferenceMessageRole["INFERENCE_MESSAGE_ROLE_SYSTEM"] = 1] = "INFERENCE_MESSAGE_ROLE_SYSTEM";
101
- InferenceMessageRole[InferenceMessageRole["INFERENCE_MESSAGE_ROLE_USER"] = 2] = "INFERENCE_MESSAGE_ROLE_USER";
102
- InferenceMessageRole[InferenceMessageRole["INFERENCE_MESSAGE_ROLE_ASSISTANT"] = 3] = "INFERENCE_MESSAGE_ROLE_ASSISTANT";
103
- InferenceMessageRole[InferenceMessageRole["INFERENCE_MESSAGE_ROLE_TOOL"] = 4] = "INFERENCE_MESSAGE_ROLE_TOOL";
104
- InferenceMessageRole[InferenceMessageRole["INFERENCE_MESSAGE_ROLE_DEVELOPER"] = 5] = "INFERENCE_MESSAGE_ROLE_DEVELOPER";
105
- InferenceMessageRole[InferenceMessageRole["UNRECOGNIZED"] = -1] = "UNRECOGNIZED";
106
- })(InferenceMessageRole || (exports.InferenceMessageRole = InferenceMessageRole = {}));
107
- function inferenceMessageRoleFromJSON(object) {
96
+ /** MessageRole identifies one participant role in a model gateway message. */
97
+ var MessageRole;
98
+ (function (MessageRole) {
99
+ MessageRole[MessageRole["MESSAGE_ROLE_UNSPECIFIED"] = 0] = "MESSAGE_ROLE_UNSPECIFIED";
100
+ MessageRole[MessageRole["MESSAGE_ROLE_SYSTEM"] = 1] = "MESSAGE_ROLE_SYSTEM";
101
+ MessageRole[MessageRole["MESSAGE_ROLE_USER"] = 2] = "MESSAGE_ROLE_USER";
102
+ MessageRole[MessageRole["MESSAGE_ROLE_ASSISTANT"] = 3] = "MESSAGE_ROLE_ASSISTANT";
103
+ MessageRole[MessageRole["MESSAGE_ROLE_TOOL"] = 4] = "MESSAGE_ROLE_TOOL";
104
+ MessageRole[MessageRole["MESSAGE_ROLE_DEVELOPER"] = 5] = "MESSAGE_ROLE_DEVELOPER";
105
+ MessageRole[MessageRole["UNRECOGNIZED"] = -1] = "UNRECOGNIZED";
106
+ })(MessageRole || (exports.MessageRole = MessageRole = {}));
107
+ function messageRoleFromJSON(object) {
108
108
  switch (object) {
109
109
  case 0:
110
- case "INFERENCE_MESSAGE_ROLE_UNSPECIFIED":
111
- return InferenceMessageRole.INFERENCE_MESSAGE_ROLE_UNSPECIFIED;
110
+ case "MESSAGE_ROLE_UNSPECIFIED":
111
+ return MessageRole.MESSAGE_ROLE_UNSPECIFIED;
112
112
  case 1:
113
- case "INFERENCE_MESSAGE_ROLE_SYSTEM":
114
- return InferenceMessageRole.INFERENCE_MESSAGE_ROLE_SYSTEM;
113
+ case "MESSAGE_ROLE_SYSTEM":
114
+ return MessageRole.MESSAGE_ROLE_SYSTEM;
115
115
  case 2:
116
- case "INFERENCE_MESSAGE_ROLE_USER":
117
- return InferenceMessageRole.INFERENCE_MESSAGE_ROLE_USER;
116
+ case "MESSAGE_ROLE_USER":
117
+ return MessageRole.MESSAGE_ROLE_USER;
118
118
  case 3:
119
- case "INFERENCE_MESSAGE_ROLE_ASSISTANT":
120
- return InferenceMessageRole.INFERENCE_MESSAGE_ROLE_ASSISTANT;
119
+ case "MESSAGE_ROLE_ASSISTANT":
120
+ return MessageRole.MESSAGE_ROLE_ASSISTANT;
121
121
  case 4:
122
- case "INFERENCE_MESSAGE_ROLE_TOOL":
123
- return InferenceMessageRole.INFERENCE_MESSAGE_ROLE_TOOL;
122
+ case "MESSAGE_ROLE_TOOL":
123
+ return MessageRole.MESSAGE_ROLE_TOOL;
124
124
  case 5:
125
- case "INFERENCE_MESSAGE_ROLE_DEVELOPER":
126
- return InferenceMessageRole.INFERENCE_MESSAGE_ROLE_DEVELOPER;
125
+ case "MESSAGE_ROLE_DEVELOPER":
126
+ return MessageRole.MESSAGE_ROLE_DEVELOPER;
127
127
  case -1:
128
128
  case "UNRECOGNIZED":
129
129
  default:
130
- return InferenceMessageRole.UNRECOGNIZED;
130
+ return MessageRole.UNRECOGNIZED;
131
131
  }
132
132
  }
133
- function inferenceMessageRoleToJSON(object) {
133
+ function messageRoleToJSON(object) {
134
134
  switch (object) {
135
- case InferenceMessageRole.INFERENCE_MESSAGE_ROLE_UNSPECIFIED:
136
- return "INFERENCE_MESSAGE_ROLE_UNSPECIFIED";
137
- case InferenceMessageRole.INFERENCE_MESSAGE_ROLE_SYSTEM:
138
- return "INFERENCE_MESSAGE_ROLE_SYSTEM";
139
- case InferenceMessageRole.INFERENCE_MESSAGE_ROLE_USER:
140
- return "INFERENCE_MESSAGE_ROLE_USER";
141
- case InferenceMessageRole.INFERENCE_MESSAGE_ROLE_ASSISTANT:
142
- return "INFERENCE_MESSAGE_ROLE_ASSISTANT";
143
- case InferenceMessageRole.INFERENCE_MESSAGE_ROLE_TOOL:
144
- return "INFERENCE_MESSAGE_ROLE_TOOL";
145
- case InferenceMessageRole.INFERENCE_MESSAGE_ROLE_DEVELOPER:
146
- return "INFERENCE_MESSAGE_ROLE_DEVELOPER";
147
- case InferenceMessageRole.UNRECOGNIZED:
135
+ case MessageRole.MESSAGE_ROLE_UNSPECIFIED:
136
+ return "MESSAGE_ROLE_UNSPECIFIED";
137
+ case MessageRole.MESSAGE_ROLE_SYSTEM:
138
+ return "MESSAGE_ROLE_SYSTEM";
139
+ case MessageRole.MESSAGE_ROLE_USER:
140
+ return "MESSAGE_ROLE_USER";
141
+ case MessageRole.MESSAGE_ROLE_ASSISTANT:
142
+ return "MESSAGE_ROLE_ASSISTANT";
143
+ case MessageRole.MESSAGE_ROLE_TOOL:
144
+ return "MESSAGE_ROLE_TOOL";
145
+ case MessageRole.MESSAGE_ROLE_DEVELOPER:
146
+ return "MESSAGE_ROLE_DEVELOPER";
147
+ case MessageRole.UNRECOGNIZED:
148
148
  default:
149
149
  return "UNRECOGNIZED";
150
150
  }
151
151
  }
152
- /** InferenceFinishReason describes why one inference operation ended. */
153
- var InferenceFinishReason;
154
- (function (InferenceFinishReason) {
155
- InferenceFinishReason[InferenceFinishReason["INFERENCE_FINISH_REASON_UNSPECIFIED"] = 0] = "INFERENCE_FINISH_REASON_UNSPECIFIED";
156
- InferenceFinishReason[InferenceFinishReason["INFERENCE_FINISH_REASON_STOP"] = 1] = "INFERENCE_FINISH_REASON_STOP";
157
- InferenceFinishReason[InferenceFinishReason["INFERENCE_FINISH_REASON_LENGTH"] = 2] = "INFERENCE_FINISH_REASON_LENGTH";
158
- InferenceFinishReason[InferenceFinishReason["INFERENCE_FINISH_REASON_TOOL_CALLS"] = 3] = "INFERENCE_FINISH_REASON_TOOL_CALLS";
159
- InferenceFinishReason[InferenceFinishReason["INFERENCE_FINISH_REASON_CONTENT_FILTER"] = 4] = "INFERENCE_FINISH_REASON_CONTENT_FILTER";
160
- InferenceFinishReason[InferenceFinishReason["INFERENCE_FINISH_REASON_ERROR"] = 5] = "INFERENCE_FINISH_REASON_ERROR";
161
- InferenceFinishReason[InferenceFinishReason["UNRECOGNIZED"] = -1] = "UNRECOGNIZED";
162
- })(InferenceFinishReason || (exports.InferenceFinishReason = InferenceFinishReason = {}));
163
- function inferenceFinishReasonFromJSON(object) {
152
+ /** FinishReason describes why one model call ended. */
153
+ var FinishReason;
154
+ (function (FinishReason) {
155
+ FinishReason[FinishReason["FINISH_REASON_UNSPECIFIED"] = 0] = "FINISH_REASON_UNSPECIFIED";
156
+ FinishReason[FinishReason["FINISH_REASON_STOP"] = 1] = "FINISH_REASON_STOP";
157
+ FinishReason[FinishReason["FINISH_REASON_LENGTH"] = 2] = "FINISH_REASON_LENGTH";
158
+ FinishReason[FinishReason["FINISH_REASON_TOOL_CALLS"] = 3] = "FINISH_REASON_TOOL_CALLS";
159
+ FinishReason[FinishReason["FINISH_REASON_CONTENT_FILTER"] = 4] = "FINISH_REASON_CONTENT_FILTER";
160
+ FinishReason[FinishReason["FINISH_REASON_ERROR"] = 5] = "FINISH_REASON_ERROR";
161
+ FinishReason[FinishReason["UNRECOGNIZED"] = -1] = "UNRECOGNIZED";
162
+ })(FinishReason || (exports.FinishReason = FinishReason = {}));
163
+ function finishReasonFromJSON(object) {
164
164
  switch (object) {
165
165
  case 0:
166
- case "INFERENCE_FINISH_REASON_UNSPECIFIED":
167
- return InferenceFinishReason.INFERENCE_FINISH_REASON_UNSPECIFIED;
166
+ case "FINISH_REASON_UNSPECIFIED":
167
+ return FinishReason.FINISH_REASON_UNSPECIFIED;
168
168
  case 1:
169
- case "INFERENCE_FINISH_REASON_STOP":
170
- return InferenceFinishReason.INFERENCE_FINISH_REASON_STOP;
169
+ case "FINISH_REASON_STOP":
170
+ return FinishReason.FINISH_REASON_STOP;
171
171
  case 2:
172
- case "INFERENCE_FINISH_REASON_LENGTH":
173
- return InferenceFinishReason.INFERENCE_FINISH_REASON_LENGTH;
172
+ case "FINISH_REASON_LENGTH":
173
+ return FinishReason.FINISH_REASON_LENGTH;
174
174
  case 3:
175
- case "INFERENCE_FINISH_REASON_TOOL_CALLS":
176
- return InferenceFinishReason.INFERENCE_FINISH_REASON_TOOL_CALLS;
175
+ case "FINISH_REASON_TOOL_CALLS":
176
+ return FinishReason.FINISH_REASON_TOOL_CALLS;
177
177
  case 4:
178
- case "INFERENCE_FINISH_REASON_CONTENT_FILTER":
179
- return InferenceFinishReason.INFERENCE_FINISH_REASON_CONTENT_FILTER;
178
+ case "FINISH_REASON_CONTENT_FILTER":
179
+ return FinishReason.FINISH_REASON_CONTENT_FILTER;
180
180
  case 5:
181
- case "INFERENCE_FINISH_REASON_ERROR":
182
- return InferenceFinishReason.INFERENCE_FINISH_REASON_ERROR;
181
+ case "FINISH_REASON_ERROR":
182
+ return FinishReason.FINISH_REASON_ERROR;
183
183
  case -1:
184
184
  case "UNRECOGNIZED":
185
185
  default:
186
- return InferenceFinishReason.UNRECOGNIZED;
186
+ return FinishReason.UNRECOGNIZED;
187
187
  }
188
188
  }
189
- function inferenceFinishReasonToJSON(object) {
189
+ function finishReasonToJSON(object) {
190
190
  switch (object) {
191
- case InferenceFinishReason.INFERENCE_FINISH_REASON_UNSPECIFIED:
192
- return "INFERENCE_FINISH_REASON_UNSPECIFIED";
193
- case InferenceFinishReason.INFERENCE_FINISH_REASON_STOP:
194
- return "INFERENCE_FINISH_REASON_STOP";
195
- case InferenceFinishReason.INFERENCE_FINISH_REASON_LENGTH:
196
- return "INFERENCE_FINISH_REASON_LENGTH";
197
- case InferenceFinishReason.INFERENCE_FINISH_REASON_TOOL_CALLS:
198
- return "INFERENCE_FINISH_REASON_TOOL_CALLS";
199
- case InferenceFinishReason.INFERENCE_FINISH_REASON_CONTENT_FILTER:
200
- return "INFERENCE_FINISH_REASON_CONTENT_FILTER";
201
- case InferenceFinishReason.INFERENCE_FINISH_REASON_ERROR:
202
- return "INFERENCE_FINISH_REASON_ERROR";
203
- case InferenceFinishReason.UNRECOGNIZED:
191
+ case FinishReason.FINISH_REASON_UNSPECIFIED:
192
+ return "FINISH_REASON_UNSPECIFIED";
193
+ case FinishReason.FINISH_REASON_STOP:
194
+ return "FINISH_REASON_STOP";
195
+ case FinishReason.FINISH_REASON_LENGTH:
196
+ return "FINISH_REASON_LENGTH";
197
+ case FinishReason.FINISH_REASON_TOOL_CALLS:
198
+ return "FINISH_REASON_TOOL_CALLS";
199
+ case FinishReason.FINISH_REASON_CONTENT_FILTER:
200
+ return "FINISH_REASON_CONTENT_FILTER";
201
+ case FinishReason.FINISH_REASON_ERROR:
202
+ return "FINISH_REASON_ERROR";
203
+ case FinishReason.UNRECOGNIZED:
204
204
  default:
205
205
  return "UNRECOGNIZED";
206
206
  }
@@ -293,84 +293,84 @@ function imageDeliveryModeToJSON(object) {
293
293
  return "UNRECOGNIZED";
294
294
  }
295
295
  }
296
- /** InferenceTokenKind classifies one token bucket for usage accounting. */
297
- var InferenceTokenKind;
298
- (function (InferenceTokenKind) {
299
- InferenceTokenKind[InferenceTokenKind["INFERENCE_TOKEN_KIND_UNSPECIFIED"] = 0] = "INFERENCE_TOKEN_KIND_UNSPECIFIED";
300
- InferenceTokenKind[InferenceTokenKind["INFERENCE_TOKEN_KIND_INPUT"] = 1] = "INFERENCE_TOKEN_KIND_INPUT";
301
- InferenceTokenKind[InferenceTokenKind["INFERENCE_TOKEN_KIND_INPUT_CACHE_WRITE"] = 2] = "INFERENCE_TOKEN_KIND_INPUT_CACHE_WRITE";
302
- InferenceTokenKind[InferenceTokenKind["INFERENCE_TOKEN_KIND_INPUT_CACHE_READ"] = 3] = "INFERENCE_TOKEN_KIND_INPUT_CACHE_READ";
303
- InferenceTokenKind[InferenceTokenKind["INFERENCE_TOKEN_KIND_INPUT_AUDIO"] = 4] = "INFERENCE_TOKEN_KIND_INPUT_AUDIO";
304
- InferenceTokenKind[InferenceTokenKind["INFERENCE_TOKEN_KIND_INPUT_IMAGE"] = 5] = "INFERENCE_TOKEN_KIND_INPUT_IMAGE";
305
- InferenceTokenKind[InferenceTokenKind["INFERENCE_TOKEN_KIND_OUTPUT"] = 6] = "INFERENCE_TOKEN_KIND_OUTPUT";
306
- InferenceTokenKind[InferenceTokenKind["INFERENCE_TOKEN_KIND_OUTPUT_REASONING"] = 7] = "INFERENCE_TOKEN_KIND_OUTPUT_REASONING";
307
- InferenceTokenKind[InferenceTokenKind["INFERENCE_TOKEN_KIND_OUTPUT_AUDIO"] = 8] = "INFERENCE_TOKEN_KIND_OUTPUT_AUDIO";
308
- InferenceTokenKind[InferenceTokenKind["UNRECOGNIZED"] = -1] = "UNRECOGNIZED";
309
- })(InferenceTokenKind || (exports.InferenceTokenKind = InferenceTokenKind = {}));
310
- function inferenceTokenKindFromJSON(object) {
296
+ /** TokenKind classifies one token bucket for usage accounting. */
297
+ var TokenKind;
298
+ (function (TokenKind) {
299
+ TokenKind[TokenKind["TOKEN_KIND_UNSPECIFIED"] = 0] = "TOKEN_KIND_UNSPECIFIED";
300
+ TokenKind[TokenKind["TOKEN_KIND_INPUT"] = 1] = "TOKEN_KIND_INPUT";
301
+ TokenKind[TokenKind["TOKEN_KIND_INPUT_CACHE_WRITE"] = 2] = "TOKEN_KIND_INPUT_CACHE_WRITE";
302
+ TokenKind[TokenKind["TOKEN_KIND_INPUT_CACHE_READ"] = 3] = "TOKEN_KIND_INPUT_CACHE_READ";
303
+ TokenKind[TokenKind["TOKEN_KIND_INPUT_AUDIO"] = 4] = "TOKEN_KIND_INPUT_AUDIO";
304
+ TokenKind[TokenKind["TOKEN_KIND_INPUT_IMAGE"] = 5] = "TOKEN_KIND_INPUT_IMAGE";
305
+ TokenKind[TokenKind["TOKEN_KIND_OUTPUT"] = 6] = "TOKEN_KIND_OUTPUT";
306
+ TokenKind[TokenKind["TOKEN_KIND_OUTPUT_REASONING"] = 7] = "TOKEN_KIND_OUTPUT_REASONING";
307
+ TokenKind[TokenKind["TOKEN_KIND_OUTPUT_AUDIO"] = 8] = "TOKEN_KIND_OUTPUT_AUDIO";
308
+ TokenKind[TokenKind["UNRECOGNIZED"] = -1] = "UNRECOGNIZED";
309
+ })(TokenKind || (exports.TokenKind = TokenKind = {}));
310
+ function tokenKindFromJSON(object) {
311
311
  switch (object) {
312
312
  case 0:
313
- case "INFERENCE_TOKEN_KIND_UNSPECIFIED":
314
- return InferenceTokenKind.INFERENCE_TOKEN_KIND_UNSPECIFIED;
313
+ case "TOKEN_KIND_UNSPECIFIED":
314
+ return TokenKind.TOKEN_KIND_UNSPECIFIED;
315
315
  case 1:
316
- case "INFERENCE_TOKEN_KIND_INPUT":
317
- return InferenceTokenKind.INFERENCE_TOKEN_KIND_INPUT;
316
+ case "TOKEN_KIND_INPUT":
317
+ return TokenKind.TOKEN_KIND_INPUT;
318
318
  case 2:
319
- case "INFERENCE_TOKEN_KIND_INPUT_CACHE_WRITE":
320
- return InferenceTokenKind.INFERENCE_TOKEN_KIND_INPUT_CACHE_WRITE;
319
+ case "TOKEN_KIND_INPUT_CACHE_WRITE":
320
+ return TokenKind.TOKEN_KIND_INPUT_CACHE_WRITE;
321
321
  case 3:
322
- case "INFERENCE_TOKEN_KIND_INPUT_CACHE_READ":
323
- return InferenceTokenKind.INFERENCE_TOKEN_KIND_INPUT_CACHE_READ;
322
+ case "TOKEN_KIND_INPUT_CACHE_READ":
323
+ return TokenKind.TOKEN_KIND_INPUT_CACHE_READ;
324
324
  case 4:
325
- case "INFERENCE_TOKEN_KIND_INPUT_AUDIO":
326
- return InferenceTokenKind.INFERENCE_TOKEN_KIND_INPUT_AUDIO;
325
+ case "TOKEN_KIND_INPUT_AUDIO":
326
+ return TokenKind.TOKEN_KIND_INPUT_AUDIO;
327
327
  case 5:
328
- case "INFERENCE_TOKEN_KIND_INPUT_IMAGE":
329
- return InferenceTokenKind.INFERENCE_TOKEN_KIND_INPUT_IMAGE;
328
+ case "TOKEN_KIND_INPUT_IMAGE":
329
+ return TokenKind.TOKEN_KIND_INPUT_IMAGE;
330
330
  case 6:
331
- case "INFERENCE_TOKEN_KIND_OUTPUT":
332
- return InferenceTokenKind.INFERENCE_TOKEN_KIND_OUTPUT;
331
+ case "TOKEN_KIND_OUTPUT":
332
+ return TokenKind.TOKEN_KIND_OUTPUT;
333
333
  case 7:
334
- case "INFERENCE_TOKEN_KIND_OUTPUT_REASONING":
335
- return InferenceTokenKind.INFERENCE_TOKEN_KIND_OUTPUT_REASONING;
334
+ case "TOKEN_KIND_OUTPUT_REASONING":
335
+ return TokenKind.TOKEN_KIND_OUTPUT_REASONING;
336
336
  case 8:
337
- case "INFERENCE_TOKEN_KIND_OUTPUT_AUDIO":
338
- return InferenceTokenKind.INFERENCE_TOKEN_KIND_OUTPUT_AUDIO;
337
+ case "TOKEN_KIND_OUTPUT_AUDIO":
338
+ return TokenKind.TOKEN_KIND_OUTPUT_AUDIO;
339
339
  case -1:
340
340
  case "UNRECOGNIZED":
341
341
  default:
342
- return InferenceTokenKind.UNRECOGNIZED;
342
+ return TokenKind.UNRECOGNIZED;
343
343
  }
344
344
  }
345
- function inferenceTokenKindToJSON(object) {
345
+ function tokenKindToJSON(object) {
346
346
  switch (object) {
347
- case InferenceTokenKind.INFERENCE_TOKEN_KIND_UNSPECIFIED:
348
- return "INFERENCE_TOKEN_KIND_UNSPECIFIED";
349
- case InferenceTokenKind.INFERENCE_TOKEN_KIND_INPUT:
350
- return "INFERENCE_TOKEN_KIND_INPUT";
351
- case InferenceTokenKind.INFERENCE_TOKEN_KIND_INPUT_CACHE_WRITE:
352
- return "INFERENCE_TOKEN_KIND_INPUT_CACHE_WRITE";
353
- case InferenceTokenKind.INFERENCE_TOKEN_KIND_INPUT_CACHE_READ:
354
- return "INFERENCE_TOKEN_KIND_INPUT_CACHE_READ";
355
- case InferenceTokenKind.INFERENCE_TOKEN_KIND_INPUT_AUDIO:
356
- return "INFERENCE_TOKEN_KIND_INPUT_AUDIO";
357
- case InferenceTokenKind.INFERENCE_TOKEN_KIND_INPUT_IMAGE:
358
- return "INFERENCE_TOKEN_KIND_INPUT_IMAGE";
359
- case InferenceTokenKind.INFERENCE_TOKEN_KIND_OUTPUT:
360
- return "INFERENCE_TOKEN_KIND_OUTPUT";
361
- case InferenceTokenKind.INFERENCE_TOKEN_KIND_OUTPUT_REASONING:
362
- return "INFERENCE_TOKEN_KIND_OUTPUT_REASONING";
363
- case InferenceTokenKind.INFERENCE_TOKEN_KIND_OUTPUT_AUDIO:
364
- return "INFERENCE_TOKEN_KIND_OUTPUT_AUDIO";
365
- case InferenceTokenKind.UNRECOGNIZED:
347
+ case TokenKind.TOKEN_KIND_UNSPECIFIED:
348
+ return "TOKEN_KIND_UNSPECIFIED";
349
+ case TokenKind.TOKEN_KIND_INPUT:
350
+ return "TOKEN_KIND_INPUT";
351
+ case TokenKind.TOKEN_KIND_INPUT_CACHE_WRITE:
352
+ return "TOKEN_KIND_INPUT_CACHE_WRITE";
353
+ case TokenKind.TOKEN_KIND_INPUT_CACHE_READ:
354
+ return "TOKEN_KIND_INPUT_CACHE_READ";
355
+ case TokenKind.TOKEN_KIND_INPUT_AUDIO:
356
+ return "TOKEN_KIND_INPUT_AUDIO";
357
+ case TokenKind.TOKEN_KIND_INPUT_IMAGE:
358
+ return "TOKEN_KIND_INPUT_IMAGE";
359
+ case TokenKind.TOKEN_KIND_OUTPUT:
360
+ return "TOKEN_KIND_OUTPUT";
361
+ case TokenKind.TOKEN_KIND_OUTPUT_REASONING:
362
+ return "TOKEN_KIND_OUTPUT_REASONING";
363
+ case TokenKind.TOKEN_KIND_OUTPUT_AUDIO:
364
+ return "TOKEN_KIND_OUTPUT_AUDIO";
365
+ case TokenKind.UNRECOGNIZED:
366
366
  default:
367
367
  return "UNRECOGNIZED";
368
368
  }
369
369
  }
370
- function createBaseInferenceRequestContext() {
370
+ function createBaseRequestContext() {
371
371
  return { organizationId: "", approvedModelId: "", idempotencyKey: "", metadata: undefined };
372
372
  }
373
- exports.InferenceRequestContext = {
373
+ exports.RequestContext = {
374
374
  encode(message, writer = new wire_1.BinaryWriter()) {
375
375
  if (message.organizationId !== "") {
376
376
  writer.uint32(10).string(message.organizationId);
@@ -389,7 +389,7 @@ exports.InferenceRequestContext = {
389
389
  decode(input, length) {
390
390
  const reader = input instanceof wire_1.BinaryReader ? input : new wire_1.BinaryReader(input);
391
391
  const end = length === undefined ? reader.len : reader.pos + length;
392
- const message = createBaseInferenceRequestContext();
392
+ const message = createBaseRequestContext();
393
393
  while (reader.pos < end) {
394
394
  const tag = reader.uint32();
395
395
  switch (tag >>> 3) {
@@ -466,11 +466,11 @@ exports.InferenceRequestContext = {
466
466
  return obj;
467
467
  },
468
468
  create(base) {
469
- return exports.InferenceRequestContext.fromPartial(base !== null && base !== void 0 ? base : {});
469
+ return exports.RequestContext.fromPartial(base !== null && base !== void 0 ? base : {});
470
470
  },
471
471
  fromPartial(object) {
472
472
  var _a, _b, _c, _d;
473
- const message = createBaseInferenceRequestContext();
473
+ const message = createBaseRequestContext();
474
474
  message.organizationId = (_a = object.organizationId) !== null && _a !== void 0 ? _a : "";
475
475
  message.approvedModelId = (_b = object.approvedModelId) !== null && _b !== void 0 ? _b : "";
476
476
  message.idempotencyKey = (_c = object.idempotencyKey) !== null && _c !== void 0 ? _c : "";
@@ -478,20 +478,20 @@ exports.InferenceRequestContext = {
478
478
  return message;
479
479
  },
480
480
  };
481
- function createBaseResolvedInferenceContext() {
481
+ function createBaseResolvedModelRoute() {
482
482
  return {
483
483
  organizationId: "",
484
484
  approvedModelId: "",
485
485
  providerConfigurationId: "",
486
486
  providerKind: 0,
487
487
  resolvedModel: "",
488
- operationType: 0,
488
+ operation: 0,
489
489
  requestId: "",
490
490
  upstreamRequestId: "",
491
491
  requestedAt: undefined,
492
492
  };
493
493
  }
494
- exports.ResolvedInferenceContext = {
494
+ exports.ResolvedModelRoute = {
495
495
  encode(message, writer = new wire_1.BinaryWriter()) {
496
496
  if (message.organizationId !== "") {
497
497
  writer.uint32(10).string(message.organizationId);
@@ -508,8 +508,8 @@ exports.ResolvedInferenceContext = {
508
508
  if (message.resolvedModel !== "") {
509
509
  writer.uint32(42).string(message.resolvedModel);
510
510
  }
511
- if (message.operationType !== 0) {
512
- writer.uint32(48).int32(message.operationType);
511
+ if (message.operation !== 0) {
512
+ writer.uint32(48).int32(message.operation);
513
513
  }
514
514
  if (message.requestId !== "") {
515
515
  writer.uint32(58).string(message.requestId);
@@ -525,7 +525,7 @@ exports.ResolvedInferenceContext = {
525
525
  decode(input, length) {
526
526
  const reader = input instanceof wire_1.BinaryReader ? input : new wire_1.BinaryReader(input);
527
527
  const end = length === undefined ? reader.len : reader.pos + length;
528
- const message = createBaseResolvedInferenceContext();
528
+ const message = createBaseResolvedModelRoute();
529
529
  while (reader.pos < end) {
530
530
  const tag = reader.uint32();
531
531
  switch (tag >>> 3) {
@@ -568,7 +568,7 @@ exports.ResolvedInferenceContext = {
568
568
  if (tag !== 48) {
569
569
  break;
570
570
  }
571
- message.operationType = reader.int32();
571
+ message.operation = reader.int32();
572
572
  continue;
573
573
  }
574
574
  case 7: {
@@ -627,11 +627,7 @@ exports.ResolvedInferenceContext = {
627
627
  : isSet(object.resolved_model)
628
628
  ? globalThis.String(object.resolved_model)
629
629
  : "",
630
- operationType: isSet(object.operationType)
631
- ? inferenceOperationTypeFromJSON(object.operationType)
632
- : isSet(object.operation_type)
633
- ? inferenceOperationTypeFromJSON(object.operation_type)
634
- : 0,
630
+ operation: isSet(object.operation) ? modelOperationFromJSON(object.operation) : 0,
635
631
  requestId: isSet(object.requestId)
636
632
  ? globalThis.String(object.requestId)
637
633
  : isSet(object.request_id)
@@ -666,8 +662,8 @@ exports.ResolvedInferenceContext = {
666
662
  if (message.resolvedModel !== "") {
667
663
  obj.resolvedModel = message.resolvedModel;
668
664
  }
669
- if (message.operationType !== 0) {
670
- obj.operationType = inferenceOperationTypeToJSON(message.operationType);
665
+ if (message.operation !== 0) {
666
+ obj.operation = modelOperationToJSON(message.operation);
671
667
  }
672
668
  if (message.requestId !== "") {
673
669
  obj.requestId = message.requestId;
@@ -681,27 +677,27 @@ exports.ResolvedInferenceContext = {
681
677
  return obj;
682
678
  },
683
679
  create(base) {
684
- return exports.ResolvedInferenceContext.fromPartial(base !== null && base !== void 0 ? base : {});
680
+ return exports.ResolvedModelRoute.fromPartial(base !== null && base !== void 0 ? base : {});
685
681
  },
686
682
  fromPartial(object) {
687
683
  var _a, _b, _c, _d, _e, _f, _g, _h, _j;
688
- const message = createBaseResolvedInferenceContext();
684
+ const message = createBaseResolvedModelRoute();
689
685
  message.organizationId = (_a = object.organizationId) !== null && _a !== void 0 ? _a : "";
690
686
  message.approvedModelId = (_b = object.approvedModelId) !== null && _b !== void 0 ? _b : "";
691
687
  message.providerConfigurationId = (_c = object.providerConfigurationId) !== null && _c !== void 0 ? _c : "";
692
688
  message.providerKind = (_d = object.providerKind) !== null && _d !== void 0 ? _d : 0;
693
689
  message.resolvedModel = (_e = object.resolvedModel) !== null && _e !== void 0 ? _e : "";
694
- message.operationType = (_f = object.operationType) !== null && _f !== void 0 ? _f : 0;
690
+ message.operation = (_f = object.operation) !== null && _f !== void 0 ? _f : 0;
695
691
  message.requestId = (_g = object.requestId) !== null && _g !== void 0 ? _g : "";
696
692
  message.upstreamRequestId = (_h = object.upstreamRequestId) !== null && _h !== void 0 ? _h : "";
697
693
  message.requestedAt = (_j = object.requestedAt) !== null && _j !== void 0 ? _j : undefined;
698
694
  return message;
699
695
  },
700
696
  };
701
- function createBaseInferenceTokenUsageBreakdown() {
697
+ function createBaseTokenUsageBreakdown() {
702
698
  return { kind: 0, tokenCount: 0, providerMetricName: "" };
703
699
  }
704
- exports.InferenceTokenUsageBreakdown = {
700
+ exports.TokenUsageBreakdown = {
705
701
  encode(message, writer = new wire_1.BinaryWriter()) {
706
702
  if (message.kind !== 0) {
707
703
  writer.uint32(8).int32(message.kind);
@@ -717,7 +713,7 @@ exports.InferenceTokenUsageBreakdown = {
717
713
  decode(input, length) {
718
714
  const reader = input instanceof wire_1.BinaryReader ? input : new wire_1.BinaryReader(input);
719
715
  const end = length === undefined ? reader.len : reader.pos + length;
720
- const message = createBaseInferenceTokenUsageBreakdown();
716
+ const message = createBaseTokenUsageBreakdown();
721
717
  while (reader.pos < end) {
722
718
  const tag = reader.uint32();
723
719
  switch (tag >>> 3) {
@@ -752,7 +748,7 @@ exports.InferenceTokenUsageBreakdown = {
752
748
  },
753
749
  fromJSON(object) {
754
750
  return {
755
- kind: isSet(object.kind) ? inferenceTokenKindFromJSON(object.kind) : 0,
751
+ kind: isSet(object.kind) ? tokenKindFromJSON(object.kind) : 0,
756
752
  tokenCount: isSet(object.tokenCount)
757
753
  ? globalThis.Number(object.tokenCount)
758
754
  : isSet(object.token_count)
@@ -768,7 +764,7 @@ exports.InferenceTokenUsageBreakdown = {
768
764
  toJSON(message) {
769
765
  const obj = {};
770
766
  if (message.kind !== 0) {
771
- obj.kind = inferenceTokenKindToJSON(message.kind);
767
+ obj.kind = tokenKindToJSON(message.kind);
772
768
  }
773
769
  if (message.tokenCount !== 0) {
774
770
  obj.tokenCount = Math.round(message.tokenCount);
@@ -779,21 +775,21 @@ exports.InferenceTokenUsageBreakdown = {
779
775
  return obj;
780
776
  },
781
777
  create(base) {
782
- return exports.InferenceTokenUsageBreakdown.fromPartial(base !== null && base !== void 0 ? base : {});
778
+ return exports.TokenUsageBreakdown.fromPartial(base !== null && base !== void 0 ? base : {});
783
779
  },
784
780
  fromPartial(object) {
785
781
  var _a, _b, _c;
786
- const message = createBaseInferenceTokenUsageBreakdown();
782
+ const message = createBaseTokenUsageBreakdown();
787
783
  message.kind = (_a = object.kind) !== null && _a !== void 0 ? _a : 0;
788
784
  message.tokenCount = (_b = object.tokenCount) !== null && _b !== void 0 ? _b : 0;
789
785
  message.providerMetricName = (_c = object.providerMetricName) !== null && _c !== void 0 ? _c : "";
790
786
  return message;
791
787
  },
792
788
  };
793
- function createBaseInferenceUsage() {
789
+ function createBaseUsage() {
794
790
  return { inputTokens: 0, outputTokens: 0, totalTokens: 0, tokenBreakdown: [], providerUsageRaw: undefined };
795
791
  }
796
- exports.InferenceUsage = {
792
+ exports.Usage = {
797
793
  encode(message, writer = new wire_1.BinaryWriter()) {
798
794
  if (message.inputTokens !== 0) {
799
795
  writer.uint32(8).int64(message.inputTokens);
@@ -805,7 +801,7 @@ exports.InferenceUsage = {
805
801
  writer.uint32(24).int64(message.totalTokens);
806
802
  }
807
803
  for (const v of message.tokenBreakdown) {
808
- exports.InferenceTokenUsageBreakdown.encode(v, writer.uint32(34).fork()).join();
804
+ exports.TokenUsageBreakdown.encode(v, writer.uint32(34).fork()).join();
809
805
  }
810
806
  if (message.providerUsageRaw !== undefined) {
811
807
  struct_pb_1.Struct.encode(struct_pb_1.Struct.wrap(message.providerUsageRaw), writer.uint32(42).fork()).join();
@@ -815,7 +811,7 @@ exports.InferenceUsage = {
815
811
  decode(input, length) {
816
812
  const reader = input instanceof wire_1.BinaryReader ? input : new wire_1.BinaryReader(input);
817
813
  const end = length === undefined ? reader.len : reader.pos + length;
818
- const message = createBaseInferenceUsage();
814
+ const message = createBaseUsage();
819
815
  while (reader.pos < end) {
820
816
  const tag = reader.uint32();
821
817
  switch (tag >>> 3) {
@@ -844,7 +840,7 @@ exports.InferenceUsage = {
844
840
  if (tag !== 34) {
845
841
  break;
846
842
  }
847
- message.tokenBreakdown.push(exports.InferenceTokenUsageBreakdown.decode(reader, reader.uint32()));
843
+ message.tokenBreakdown.push(exports.TokenUsageBreakdown.decode(reader, reader.uint32()));
848
844
  continue;
849
845
  }
850
846
  case 5: {
@@ -880,9 +876,9 @@ exports.InferenceUsage = {
880
876
  ? globalThis.Number(object.total_tokens)
881
877
  : 0,
882
878
  tokenBreakdown: globalThis.Array.isArray(object === null || object === void 0 ? void 0 : object.tokenBreakdown)
883
- ? object.tokenBreakdown.map((e) => exports.InferenceTokenUsageBreakdown.fromJSON(e))
879
+ ? object.tokenBreakdown.map((e) => exports.TokenUsageBreakdown.fromJSON(e))
884
880
  : globalThis.Array.isArray(object === null || object === void 0 ? void 0 : object.token_breakdown)
885
- ? object.token_breakdown.map((e) => exports.InferenceTokenUsageBreakdown.fromJSON(e))
881
+ ? object.token_breakdown.map((e) => exports.TokenUsageBreakdown.fromJSON(e))
886
882
  : [],
887
883
  providerUsageRaw: isObject(object.providerUsageRaw)
888
884
  ? object.providerUsageRaw
@@ -904,7 +900,7 @@ exports.InferenceUsage = {
904
900
  obj.totalTokens = Math.round(message.totalTokens);
905
901
  }
906
902
  if ((_a = message.tokenBreakdown) === null || _a === void 0 ? void 0 : _a.length) {
907
- obj.tokenBreakdown = message.tokenBreakdown.map((e) => exports.InferenceTokenUsageBreakdown.toJSON(e));
903
+ obj.tokenBreakdown = message.tokenBreakdown.map((e) => exports.TokenUsageBreakdown.toJSON(e));
908
904
  }
909
905
  if (message.providerUsageRaw !== undefined) {
910
906
  obj.providerUsageRaw = message.providerUsageRaw;
@@ -912,21 +908,21 @@ exports.InferenceUsage = {
912
908
  return obj;
913
909
  },
914
910
  create(base) {
915
- return exports.InferenceUsage.fromPartial(base !== null && base !== void 0 ? base : {});
911
+ return exports.Usage.fromPartial(base !== null && base !== void 0 ? base : {});
916
912
  },
917
913
  fromPartial(object) {
918
914
  var _a;
919
915
  var _b, _c, _d, _e;
920
- const message = createBaseInferenceUsage();
916
+ const message = createBaseUsage();
921
917
  message.inputTokens = (_b = object.inputTokens) !== null && _b !== void 0 ? _b : 0;
922
918
  message.outputTokens = (_c = object.outputTokens) !== null && _c !== void 0 ? _c : 0;
923
919
  message.totalTokens = (_d = object.totalTokens) !== null && _d !== void 0 ? _d : 0;
924
- message.tokenBreakdown = ((_a = object.tokenBreakdown) === null || _a === void 0 ? void 0 : _a.map((e) => exports.InferenceTokenUsageBreakdown.fromPartial(e))) || [];
920
+ message.tokenBreakdown = ((_a = object.tokenBreakdown) === null || _a === void 0 ? void 0 : _a.map((e) => exports.TokenUsageBreakdown.fromPartial(e))) || [];
925
921
  message.providerUsageRaw = (_e = object.providerUsageRaw) !== null && _e !== void 0 ? _e : undefined;
926
922
  return message;
927
923
  },
928
924
  };
929
- function createBaseInferenceGenerationConfig() {
925
+ function createBaseGenerationConfig() {
930
926
  return {
931
927
  temperature: 0,
932
928
  maxOutputTokens: 0,
@@ -940,7 +936,7 @@ function createBaseInferenceGenerationConfig() {
940
936
  metadata: undefined,
941
937
  };
942
938
  }
943
- exports.InferenceGenerationConfig = {
939
+ exports.GenerationConfig = {
944
940
  encode(message, writer = new wire_1.BinaryWriter()) {
945
941
  if (message.temperature !== 0) {
946
942
  writer.uint32(9).double(message.temperature);
@@ -977,7 +973,7 @@ exports.InferenceGenerationConfig = {
977
973
  decode(input, length) {
978
974
  const reader = input instanceof wire_1.BinaryReader ? input : new wire_1.BinaryReader(input);
979
975
  const end = length === undefined ? reader.len : reader.pos + length;
980
- const message = createBaseInferenceGenerationConfig();
976
+ const message = createBaseGenerationConfig();
981
977
  while (reader.pos < end) {
982
978
  const tag = reader.uint32();
983
979
  switch (tag >>> 3) {
@@ -1137,12 +1133,12 @@ exports.InferenceGenerationConfig = {
1137
1133
  return obj;
1138
1134
  },
1139
1135
  create(base) {
1140
- return exports.InferenceGenerationConfig.fromPartial(base !== null && base !== void 0 ? base : {});
1136
+ return exports.GenerationConfig.fromPartial(base !== null && base !== void 0 ? base : {});
1141
1137
  },
1142
1138
  fromPartial(object) {
1143
1139
  var _a;
1144
1140
  var _b, _c, _d, _e, _f, _g, _h, _j, _k;
1145
- const message = createBaseInferenceGenerationConfig();
1141
+ const message = createBaseGenerationConfig();
1146
1142
  message.temperature = (_b = object.temperature) !== null && _b !== void 0 ? _b : 0;
1147
1143
  message.maxOutputTokens = (_c = object.maxOutputTokens) !== null && _c !== void 0 ? _c : 0;
1148
1144
  message.stopSequences = ((_a = object.stopSequences) === null || _a === void 0 ? void 0 : _a.map((e) => e)) || [];
@@ -1337,7 +1333,7 @@ exports.ToolDefinition = {
1337
1333
  },
1338
1334
  };
1339
1335
  function createBaseToolCall() {
1340
- return { id: "", name: "", arguments: undefined };
1336
+ return { id: "", name: "", argumentsJson: "" };
1341
1337
  }
1342
1338
  exports.ToolCall = {
1343
1339
  encode(message, writer = new wire_1.BinaryWriter()) {
@@ -1347,8 +1343,8 @@ exports.ToolCall = {
1347
1343
  if (message.name !== "") {
1348
1344
  writer.uint32(18).string(message.name);
1349
1345
  }
1350
- if (message.arguments !== undefined) {
1351
- struct_pb_1.Struct.encode(struct_pb_1.Struct.wrap(message.arguments), writer.uint32(26).fork()).join();
1346
+ if (message.argumentsJson !== "") {
1347
+ writer.uint32(26).string(message.argumentsJson);
1352
1348
  }
1353
1349
  return writer;
1354
1350
  },
@@ -1377,7 +1373,7 @@ exports.ToolCall = {
1377
1373
  if (tag !== 26) {
1378
1374
  break;
1379
1375
  }
1380
- message.arguments = struct_pb_1.Struct.unwrap(struct_pb_1.Struct.decode(reader, reader.uint32()));
1376
+ message.argumentsJson = reader.string();
1381
1377
  continue;
1382
1378
  }
1383
1379
  }
@@ -1392,7 +1388,11 @@ exports.ToolCall = {
1392
1388
  return {
1393
1389
  id: isSet(object.id) ? globalThis.String(object.id) : "",
1394
1390
  name: isSet(object.name) ? globalThis.String(object.name) : "",
1395
- arguments: isObject(object.arguments) ? object.arguments : undefined,
1391
+ argumentsJson: isSet(object.argumentsJson)
1392
+ ? globalThis.String(object.argumentsJson)
1393
+ : isSet(object.arguments_json)
1394
+ ? globalThis.String(object.arguments_json)
1395
+ : "",
1396
1396
  };
1397
1397
  },
1398
1398
  toJSON(message) {
@@ -1403,8 +1403,8 @@ exports.ToolCall = {
1403
1403
  if (message.name !== "") {
1404
1404
  obj.name = message.name;
1405
1405
  }
1406
- if (message.arguments !== undefined) {
1407
- obj.arguments = message.arguments;
1406
+ if (message.argumentsJson !== "") {
1407
+ obj.argumentsJson = message.argumentsJson;
1408
1408
  }
1409
1409
  return obj;
1410
1410
  },
@@ -1416,7 +1416,114 @@ exports.ToolCall = {
1416
1416
  const message = createBaseToolCall();
1417
1417
  message.id = (_a = object.id) !== null && _a !== void 0 ? _a : "";
1418
1418
  message.name = (_b = object.name) !== null && _b !== void 0 ? _b : "";
1419
- message.arguments = (_c = object.arguments) !== null && _c !== void 0 ? _c : undefined;
1419
+ message.argumentsJson = (_c = object.argumentsJson) !== null && _c !== void 0 ? _c : "";
1420
+ return message;
1421
+ },
1422
+ };
1423
+ function createBaseToolCallDelta() {
1424
+ return { id: "", name: "", argumentsDelta: "", argumentsJson: "" };
1425
+ }
1426
+ exports.ToolCallDelta = {
1427
+ encode(message, writer = new wire_1.BinaryWriter()) {
1428
+ if (message.id !== "") {
1429
+ writer.uint32(10).string(message.id);
1430
+ }
1431
+ if (message.name !== "") {
1432
+ writer.uint32(18).string(message.name);
1433
+ }
1434
+ if (message.argumentsDelta !== "") {
1435
+ writer.uint32(26).string(message.argumentsDelta);
1436
+ }
1437
+ if (message.argumentsJson !== "") {
1438
+ writer.uint32(34).string(message.argumentsJson);
1439
+ }
1440
+ return writer;
1441
+ },
1442
+ decode(input, length) {
1443
+ const reader = input instanceof wire_1.BinaryReader ? input : new wire_1.BinaryReader(input);
1444
+ const end = length === undefined ? reader.len : reader.pos + length;
1445
+ const message = createBaseToolCallDelta();
1446
+ while (reader.pos < end) {
1447
+ const tag = reader.uint32();
1448
+ switch (tag >>> 3) {
1449
+ case 1: {
1450
+ if (tag !== 10) {
1451
+ break;
1452
+ }
1453
+ message.id = reader.string();
1454
+ continue;
1455
+ }
1456
+ case 2: {
1457
+ if (tag !== 18) {
1458
+ break;
1459
+ }
1460
+ message.name = reader.string();
1461
+ continue;
1462
+ }
1463
+ case 3: {
1464
+ if (tag !== 26) {
1465
+ break;
1466
+ }
1467
+ message.argumentsDelta = reader.string();
1468
+ continue;
1469
+ }
1470
+ case 4: {
1471
+ if (tag !== 34) {
1472
+ break;
1473
+ }
1474
+ message.argumentsJson = reader.string();
1475
+ continue;
1476
+ }
1477
+ }
1478
+ if ((tag & 7) === 4 || tag === 0) {
1479
+ break;
1480
+ }
1481
+ reader.skip(tag & 7);
1482
+ }
1483
+ return message;
1484
+ },
1485
+ fromJSON(object) {
1486
+ return {
1487
+ id: isSet(object.id) ? globalThis.String(object.id) : "",
1488
+ name: isSet(object.name) ? globalThis.String(object.name) : "",
1489
+ argumentsDelta: isSet(object.argumentsDelta)
1490
+ ? globalThis.String(object.argumentsDelta)
1491
+ : isSet(object.arguments_delta)
1492
+ ? globalThis.String(object.arguments_delta)
1493
+ : "",
1494
+ argumentsJson: isSet(object.argumentsJson)
1495
+ ? globalThis.String(object.argumentsJson)
1496
+ : isSet(object.arguments_json)
1497
+ ? globalThis.String(object.arguments_json)
1498
+ : "",
1499
+ };
1500
+ },
1501
+ toJSON(message) {
1502
+ const obj = {};
1503
+ if (message.id !== "") {
1504
+ obj.id = message.id;
1505
+ }
1506
+ if (message.name !== "") {
1507
+ obj.name = message.name;
1508
+ }
1509
+ if (message.argumentsDelta !== "") {
1510
+ obj.argumentsDelta = message.argumentsDelta;
1511
+ }
1512
+ if (message.argumentsJson !== "") {
1513
+ obj.argumentsJson = message.argumentsJson;
1514
+ }
1515
+ return obj;
1516
+ },
1517
+ create(base) {
1518
+ return exports.ToolCallDelta.fromPartial(base !== null && base !== void 0 ? base : {});
1519
+ },
1520
+ fromPartial(object) {
1521
+ var _a, _b, _c, _d;
1522
+ const message = createBaseToolCallDelta();
1523
+ message.id = (_a = object.id) !== null && _a !== void 0 ? _a : "";
1524
+ message.name = (_b = object.name) !== null && _b !== void 0 ? _b : "";
1525
+ message.argumentsDelta = (_c = object.argumentsDelta) !== null && _c !== void 0 ? _c : "";
1526
+ message.argumentsJson = (_d = object.argumentsJson) !== null && _d !== void 0 ? _d : "";
1420
1527
  return message;
1421
1528
  },
1422
1529
  };
@@ -1527,7 +1634,7 @@ exports.ToolResult = {
1527
1634
  return message;
1528
1635
  },
1529
1636
  };
1530
- function createBaseInferenceContentPart() {
1637
+ function createBaseContentPart() {
1531
1638
  return {
1532
1639
  text: undefined,
1533
1640
  imageUrl: undefined,
@@ -1538,7 +1645,7 @@ function createBaseInferenceContentPart() {
1538
1645
  mimeType: "",
1539
1646
  };
1540
1647
  }
1541
- exports.InferenceContentPart = {
1648
+ exports.ContentPart = {
1542
1649
  encode(message, writer = new wire_1.BinaryWriter()) {
1543
1650
  if (message.text !== undefined) {
1544
1651
  writer.uint32(10).string(message.text);
@@ -1566,7 +1673,7 @@ exports.InferenceContentPart = {
1566
1673
  decode(input, length) {
1567
1674
  const reader = input instanceof wire_1.BinaryReader ? input : new wire_1.BinaryReader(input);
1568
1675
  const end = length === undefined ? reader.len : reader.pos + length;
1569
- const message = createBaseInferenceContentPart();
1676
+ const message = createBaseContentPart();
1570
1677
  while (reader.pos < end) {
1571
1678
  const tag = reader.uint32();
1572
1679
  switch (tag >>> 3) {
@@ -1688,11 +1795,11 @@ exports.InferenceContentPart = {
1688
1795
  return obj;
1689
1796
  },
1690
1797
  create(base) {
1691
- return exports.InferenceContentPart.fromPartial(base !== null && base !== void 0 ? base : {});
1798
+ return exports.ContentPart.fromPartial(base !== null && base !== void 0 ? base : {});
1692
1799
  },
1693
1800
  fromPartial(object) {
1694
1801
  var _a, _b, _c, _d, _e;
1695
- const message = createBaseInferenceContentPart();
1802
+ const message = createBaseContentPart();
1696
1803
  message.text = (_a = object.text) !== null && _a !== void 0 ? _a : undefined;
1697
1804
  message.imageUrl = (_b = object.imageUrl) !== null && _b !== void 0 ? _b : undefined;
1698
1805
  message.binaryData = (_c = object.binaryData) !== null && _c !== void 0 ? _c : undefined;
@@ -1716,7 +1823,7 @@ exports.ChatMessage = {
1716
1823
  writer.uint32(8).int32(message.role);
1717
1824
  }
1718
1825
  for (const v of message.content) {
1719
- exports.InferenceContentPart.encode(v, writer.uint32(18).fork()).join();
1826
+ exports.ContentPart.encode(v, writer.uint32(18).fork()).join();
1720
1827
  }
1721
1828
  if (message.participantName !== "") {
1722
1829
  writer.uint32(26).string(message.participantName);
@@ -1744,7 +1851,7 @@ exports.ChatMessage = {
1744
1851
  if (tag !== 18) {
1745
1852
  break;
1746
1853
  }
1747
- message.content.push(exports.InferenceContentPart.decode(reader, reader.uint32()));
1854
+ message.content.push(exports.ContentPart.decode(reader, reader.uint32()));
1748
1855
  continue;
1749
1856
  }
1750
1857
  case 3: {
@@ -1771,10 +1878,8 @@ exports.ChatMessage = {
1771
1878
  },
1772
1879
  fromJSON(object) {
1773
1880
  return {
1774
- role: isSet(object.role) ? inferenceMessageRoleFromJSON(object.role) : 0,
1775
- content: globalThis.Array.isArray(object === null || object === void 0 ? void 0 : object.content)
1776
- ? object.content.map((e) => exports.InferenceContentPart.fromJSON(e))
1777
- : [],
1881
+ role: isSet(object.role) ? messageRoleFromJSON(object.role) : 0,
1882
+ content: globalThis.Array.isArray(object === null || object === void 0 ? void 0 : object.content) ? object.content.map((e) => exports.ContentPart.fromJSON(e)) : [],
1778
1883
  participantName: isSet(object.participantName)
1779
1884
  ? globalThis.String(object.participantName)
1780
1885
  : isSet(object.participant_name)
@@ -1791,10 +1896,10 @@ exports.ChatMessage = {
1791
1896
  var _a;
1792
1897
  const obj = {};
1793
1898
  if (message.role !== 0) {
1794
- obj.role = inferenceMessageRoleToJSON(message.role);
1899
+ obj.role = messageRoleToJSON(message.role);
1795
1900
  }
1796
1901
  if ((_a = message.content) === null || _a === void 0 ? void 0 : _a.length) {
1797
- obj.content = message.content.map((e) => exports.InferenceContentPart.toJSON(e));
1902
+ obj.content = message.content.map((e) => exports.ContentPart.toJSON(e));
1798
1903
  }
1799
1904
  if (message.participantName !== "") {
1800
1905
  obj.participantName = message.participantName;
@@ -1812,7 +1917,7 @@ exports.ChatMessage = {
1812
1917
  var _b, _c, _d;
1813
1918
  const message = createBaseChatMessage();
1814
1919
  message.role = (_b = object.role) !== null && _b !== void 0 ? _b : 0;
1815
- message.content = ((_a = object.content) === null || _a === void 0 ? void 0 : _a.map((e) => exports.InferenceContentPart.fromPartial(e))) || [];
1920
+ message.content = ((_a = object.content) === null || _a === void 0 ? void 0 : _a.map((e) => exports.ContentPart.fromPartial(e))) || [];
1816
1921
  message.participantName = (_c = object.participantName) !== null && _c !== void 0 ? _c : "";
1817
1922
  message.toolCallId = (_d = object.toolCallId) !== null && _d !== void 0 ? _d : "";
1818
1923
  return message;
@@ -2154,7 +2259,7 @@ function createBaseCreateChatCompletionRequest() {
2154
2259
  exports.CreateChatCompletionRequest = {
2155
2260
  encode(message, writer = new wire_1.BinaryWriter()) {
2156
2261
  if (message.context !== undefined) {
2157
- exports.InferenceRequestContext.encode(message.context, writer.uint32(10).fork()).join();
2262
+ exports.RequestContext.encode(message.context, writer.uint32(10).fork()).join();
2158
2263
  }
2159
2264
  if (message.model !== "") {
2160
2265
  writer.uint32(18).string(message.model);
@@ -2172,7 +2277,7 @@ exports.CreateChatCompletionRequest = {
2172
2277
  writer.uint32(48).int32(message.toolChoiceMode);
2173
2278
  }
2174
2279
  if (message.generationConfig !== undefined) {
2175
- exports.InferenceGenerationConfig.encode(message.generationConfig, writer.uint32(58).fork()).join();
2280
+ exports.GenerationConfig.encode(message.generationConfig, writer.uint32(58).fork()).join();
2176
2281
  }
2177
2282
  if (message.responseSchema !== undefined) {
2178
2283
  exports.StructuredOutputSchema.encode(message.responseSchema, writer.uint32(66).fork()).join();
@@ -2190,7 +2295,7 @@ exports.CreateChatCompletionRequest = {
2190
2295
  if (tag !== 10) {
2191
2296
  break;
2192
2297
  }
2193
- message.context = exports.InferenceRequestContext.decode(reader, reader.uint32());
2298
+ message.context = exports.RequestContext.decode(reader, reader.uint32());
2194
2299
  continue;
2195
2300
  }
2196
2301
  case 2: {
@@ -2232,7 +2337,7 @@ exports.CreateChatCompletionRequest = {
2232
2337
  if (tag !== 58) {
2233
2338
  break;
2234
2339
  }
2235
- message.generationConfig = exports.InferenceGenerationConfig.decode(reader, reader.uint32());
2340
+ message.generationConfig = exports.GenerationConfig.decode(reader, reader.uint32());
2236
2341
  continue;
2237
2342
  }
2238
2343
  case 8: {
@@ -2252,7 +2357,7 @@ exports.CreateChatCompletionRequest = {
2252
2357
  },
2253
2358
  fromJSON(object) {
2254
2359
  return {
2255
- context: isSet(object.context) ? exports.InferenceRequestContext.fromJSON(object.context) : undefined,
2360
+ context: isSet(object.context) ? exports.RequestContext.fromJSON(object.context) : undefined,
2256
2361
  model: isSet(object.model) ? globalThis.String(object.model) : "",
2257
2362
  messages: globalThis.Array.isArray(object === null || object === void 0 ? void 0 : object.messages)
2258
2363
  ? object.messages.map((e) => exports.ChatMessage.fromJSON(e))
@@ -2269,9 +2374,9 @@ exports.CreateChatCompletionRequest = {
2269
2374
  ? toolChoiceModeFromJSON(object.tool_choice_mode)
2270
2375
  : 0,
2271
2376
  generationConfig: isSet(object.generationConfig)
2272
- ? exports.InferenceGenerationConfig.fromJSON(object.generationConfig)
2377
+ ? exports.GenerationConfig.fromJSON(object.generationConfig)
2273
2378
  : isSet(object.generation_config)
2274
- ? exports.InferenceGenerationConfig.fromJSON(object.generation_config)
2379
+ ? exports.GenerationConfig.fromJSON(object.generation_config)
2275
2380
  : undefined,
2276
2381
  responseSchema: isSet(object.responseSchema)
2277
2382
  ? exports.StructuredOutputSchema.fromJSON(object.responseSchema)
@@ -2284,7 +2389,7 @@ exports.CreateChatCompletionRequest = {
2284
2389
  var _a, _b;
2285
2390
  const obj = {};
2286
2391
  if (message.context !== undefined) {
2287
- obj.context = exports.InferenceRequestContext.toJSON(message.context);
2392
+ obj.context = exports.RequestContext.toJSON(message.context);
2288
2393
  }
2289
2394
  if (message.model !== "") {
2290
2395
  obj.model = message.model;
@@ -2302,7 +2407,7 @@ exports.CreateChatCompletionRequest = {
2302
2407
  obj.toolChoiceMode = toolChoiceModeToJSON(message.toolChoiceMode);
2303
2408
  }
2304
2409
  if (message.generationConfig !== undefined) {
2305
- obj.generationConfig = exports.InferenceGenerationConfig.toJSON(message.generationConfig);
2410
+ obj.generationConfig = exports.GenerationConfig.toJSON(message.generationConfig);
2306
2411
  }
2307
2412
  if (message.responseSchema !== undefined) {
2308
2413
  obj.responseSchema = exports.StructuredOutputSchema.toJSON(message.responseSchema);
@@ -2317,7 +2422,7 @@ exports.CreateChatCompletionRequest = {
2317
2422
  var _c, _d, _e;
2318
2423
  const message = createBaseCreateChatCompletionRequest();
2319
2424
  message.context = (object.context !== undefined && object.context !== null)
2320
- ? exports.InferenceRequestContext.fromPartial(object.context)
2425
+ ? exports.RequestContext.fromPartial(object.context)
2321
2426
  : undefined;
2322
2427
  message.model = (_c = object.model) !== null && _c !== void 0 ? _c : "";
2323
2428
  message.messages = ((_a = object.messages) === null || _a === void 0 ? void 0 : _a.map((e) => exports.ChatMessage.fromPartial(e))) || [];
@@ -2325,7 +2430,7 @@ exports.CreateChatCompletionRequest = {
2325
2430
  message.tools = ((_b = object.tools) === null || _b === void 0 ? void 0 : _b.map((e) => exports.ToolDefinition.fromPartial(e))) || [];
2326
2431
  message.toolChoiceMode = (_e = object.toolChoiceMode) !== null && _e !== void 0 ? _e : 0;
2327
2432
  message.generationConfig = (object.generationConfig !== undefined && object.generationConfig !== null)
2328
- ? exports.InferenceGenerationConfig.fromPartial(object.generationConfig)
2433
+ ? exports.GenerationConfig.fromPartial(object.generationConfig)
2329
2434
  : undefined;
2330
2435
  message.responseSchema = (object.responseSchema !== undefined && object.responseSchema !== null)
2331
2436
  ? exports.StructuredOutputSchema.fromPartial(object.responseSchema)
@@ -2346,7 +2451,7 @@ function createBaseCreateChatCompletionResponse() {
2346
2451
  exports.CreateChatCompletionResponse = {
2347
2452
  encode(message, writer = new wire_1.BinaryWriter()) {
2348
2453
  if (message.context !== undefined) {
2349
- exports.ResolvedInferenceContext.encode(message.context, writer.uint32(10).fork()).join();
2454
+ exports.ResolvedModelRoute.encode(message.context, writer.uint32(10).fork()).join();
2350
2455
  }
2351
2456
  if (message.message !== undefined) {
2352
2457
  exports.ChatMessage.encode(message.message, writer.uint32(18).fork()).join();
@@ -2358,7 +2463,7 @@ exports.CreateChatCompletionResponse = {
2358
2463
  writer.uint32(32).int32(message.finishReason);
2359
2464
  }
2360
2465
  if (message.usage !== undefined) {
2361
- exports.InferenceUsage.encode(message.usage, writer.uint32(42).fork()).join();
2466
+ exports.Usage.encode(message.usage, writer.uint32(42).fork()).join();
2362
2467
  }
2363
2468
  if (message.structuredOutput !== undefined) {
2364
2469
  struct_pb_1.Struct.encode(struct_pb_1.Struct.wrap(message.structuredOutput), writer.uint32(50).fork()).join();
@@ -2376,7 +2481,7 @@ exports.CreateChatCompletionResponse = {
2376
2481
  if (tag !== 10) {
2377
2482
  break;
2378
2483
  }
2379
- message.context = exports.ResolvedInferenceContext.decode(reader, reader.uint32());
2484
+ message.context = exports.ResolvedModelRoute.decode(reader, reader.uint32());
2380
2485
  continue;
2381
2486
  }
2382
2487
  case 2: {
@@ -2404,7 +2509,7 @@ exports.CreateChatCompletionResponse = {
2404
2509
  if (tag !== 42) {
2405
2510
  break;
2406
2511
  }
2407
- message.usage = exports.InferenceUsage.decode(reader, reader.uint32());
2512
+ message.usage = exports.Usage.decode(reader, reader.uint32());
2408
2513
  continue;
2409
2514
  }
2410
2515
  case 6: {
@@ -2424,7 +2529,7 @@ exports.CreateChatCompletionResponse = {
2424
2529
  },
2425
2530
  fromJSON(object) {
2426
2531
  return {
2427
- context: isSet(object.context) ? exports.ResolvedInferenceContext.fromJSON(object.context) : undefined,
2532
+ context: isSet(object.context) ? exports.ResolvedModelRoute.fromJSON(object.context) : undefined,
2428
2533
  message: isSet(object.message) ? exports.ChatMessage.fromJSON(object.message) : undefined,
2429
2534
  toolCalls: globalThis.Array.isArray(object === null || object === void 0 ? void 0 : object.toolCalls)
2430
2535
  ? object.toolCalls.map((e) => exports.ToolCall.fromJSON(e))
@@ -2432,11 +2537,11 @@ exports.CreateChatCompletionResponse = {
2432
2537
  ? object.tool_calls.map((e) => exports.ToolCall.fromJSON(e))
2433
2538
  : [],
2434
2539
  finishReason: isSet(object.finishReason)
2435
- ? inferenceFinishReasonFromJSON(object.finishReason)
2540
+ ? finishReasonFromJSON(object.finishReason)
2436
2541
  : isSet(object.finish_reason)
2437
- ? inferenceFinishReasonFromJSON(object.finish_reason)
2542
+ ? finishReasonFromJSON(object.finish_reason)
2438
2543
  : 0,
2439
- usage: isSet(object.usage) ? exports.InferenceUsage.fromJSON(object.usage) : undefined,
2544
+ usage: isSet(object.usage) ? exports.Usage.fromJSON(object.usage) : undefined,
2440
2545
  structuredOutput: isObject(object.structuredOutput)
2441
2546
  ? object.structuredOutput
2442
2547
  : isObject(object.structured_output)
@@ -2448,7 +2553,7 @@ exports.CreateChatCompletionResponse = {
2448
2553
  var _a;
2449
2554
  const obj = {};
2450
2555
  if (message.context !== undefined) {
2451
- obj.context = exports.ResolvedInferenceContext.toJSON(message.context);
2556
+ obj.context = exports.ResolvedModelRoute.toJSON(message.context);
2452
2557
  }
2453
2558
  if (message.message !== undefined) {
2454
2559
  obj.message = exports.ChatMessage.toJSON(message.message);
@@ -2457,10 +2562,10 @@ exports.CreateChatCompletionResponse = {
2457
2562
  obj.toolCalls = message.toolCalls.map((e) => exports.ToolCall.toJSON(e));
2458
2563
  }
2459
2564
  if (message.finishReason !== 0) {
2460
- obj.finishReason = inferenceFinishReasonToJSON(message.finishReason);
2565
+ obj.finishReason = finishReasonToJSON(message.finishReason);
2461
2566
  }
2462
2567
  if (message.usage !== undefined) {
2463
- obj.usage = exports.InferenceUsage.toJSON(message.usage);
2568
+ obj.usage = exports.Usage.toJSON(message.usage);
2464
2569
  }
2465
2570
  if (message.structuredOutput !== undefined) {
2466
2571
  obj.structuredOutput = message.structuredOutput;
@@ -2475,16 +2580,14 @@ exports.CreateChatCompletionResponse = {
2475
2580
  var _b, _c;
2476
2581
  const message = createBaseCreateChatCompletionResponse();
2477
2582
  message.context = (object.context !== undefined && object.context !== null)
2478
- ? exports.ResolvedInferenceContext.fromPartial(object.context)
2583
+ ? exports.ResolvedModelRoute.fromPartial(object.context)
2479
2584
  : undefined;
2480
2585
  message.message = (object.message !== undefined && object.message !== null)
2481
2586
  ? exports.ChatMessage.fromPartial(object.message)
2482
2587
  : undefined;
2483
2588
  message.toolCalls = ((_a = object.toolCalls) === null || _a === void 0 ? void 0 : _a.map((e) => exports.ToolCall.fromPartial(e))) || [];
2484
2589
  message.finishReason = (_b = object.finishReason) !== null && _b !== void 0 ? _b : 0;
2485
- message.usage = (object.usage !== undefined && object.usage !== null)
2486
- ? exports.InferenceUsage.fromPartial(object.usage)
2487
- : undefined;
2590
+ message.usage = (object.usage !== undefined && object.usage !== null) ? exports.Usage.fromPartial(object.usage) : undefined;
2488
2591
  message.structuredOutput = (_c = object.structuredOutput) !== null && _c !== void 0 ? _c : undefined;
2489
2592
  return message;
2490
2593
  },
@@ -2504,7 +2607,7 @@ function createBaseStreamChatCompletionRequest() {
2504
2607
  exports.StreamChatCompletionRequest = {
2505
2608
  encode(message, writer = new wire_1.BinaryWriter()) {
2506
2609
  if (message.context !== undefined) {
2507
- exports.InferenceRequestContext.encode(message.context, writer.uint32(10).fork()).join();
2610
+ exports.RequestContext.encode(message.context, writer.uint32(10).fork()).join();
2508
2611
  }
2509
2612
  if (message.model !== "") {
2510
2613
  writer.uint32(18).string(message.model);
@@ -2522,7 +2625,7 @@ exports.StreamChatCompletionRequest = {
2522
2625
  writer.uint32(48).int32(message.toolChoiceMode);
2523
2626
  }
2524
2627
  if (message.generationConfig !== undefined) {
2525
- exports.InferenceGenerationConfig.encode(message.generationConfig, writer.uint32(58).fork()).join();
2628
+ exports.GenerationConfig.encode(message.generationConfig, writer.uint32(58).fork()).join();
2526
2629
  }
2527
2630
  if (message.responseSchema !== undefined) {
2528
2631
  exports.StructuredOutputSchema.encode(message.responseSchema, writer.uint32(66).fork()).join();
@@ -2540,7 +2643,7 @@ exports.StreamChatCompletionRequest = {
2540
2643
  if (tag !== 10) {
2541
2644
  break;
2542
2645
  }
2543
- message.context = exports.InferenceRequestContext.decode(reader, reader.uint32());
2646
+ message.context = exports.RequestContext.decode(reader, reader.uint32());
2544
2647
  continue;
2545
2648
  }
2546
2649
  case 2: {
@@ -2582,7 +2685,7 @@ exports.StreamChatCompletionRequest = {
2582
2685
  if (tag !== 58) {
2583
2686
  break;
2584
2687
  }
2585
- message.generationConfig = exports.InferenceGenerationConfig.decode(reader, reader.uint32());
2688
+ message.generationConfig = exports.GenerationConfig.decode(reader, reader.uint32());
2586
2689
  continue;
2587
2690
  }
2588
2691
  case 8: {
@@ -2602,7 +2705,7 @@ exports.StreamChatCompletionRequest = {
2602
2705
  },
2603
2706
  fromJSON(object) {
2604
2707
  return {
2605
- context: isSet(object.context) ? exports.InferenceRequestContext.fromJSON(object.context) : undefined,
2708
+ context: isSet(object.context) ? exports.RequestContext.fromJSON(object.context) : undefined,
2606
2709
  model: isSet(object.model) ? globalThis.String(object.model) : "",
2607
2710
  messages: globalThis.Array.isArray(object === null || object === void 0 ? void 0 : object.messages)
2608
2711
  ? object.messages.map((e) => exports.ChatMessage.fromJSON(e))
@@ -2619,9 +2722,9 @@ exports.StreamChatCompletionRequest = {
2619
2722
  ? toolChoiceModeFromJSON(object.tool_choice_mode)
2620
2723
  : 0,
2621
2724
  generationConfig: isSet(object.generationConfig)
2622
- ? exports.InferenceGenerationConfig.fromJSON(object.generationConfig)
2725
+ ? exports.GenerationConfig.fromJSON(object.generationConfig)
2623
2726
  : isSet(object.generation_config)
2624
- ? exports.InferenceGenerationConfig.fromJSON(object.generation_config)
2727
+ ? exports.GenerationConfig.fromJSON(object.generation_config)
2625
2728
  : undefined,
2626
2729
  responseSchema: isSet(object.responseSchema)
2627
2730
  ? exports.StructuredOutputSchema.fromJSON(object.responseSchema)
@@ -2634,7 +2737,7 @@ exports.StreamChatCompletionRequest = {
2634
2737
  var _a, _b;
2635
2738
  const obj = {};
2636
2739
  if (message.context !== undefined) {
2637
- obj.context = exports.InferenceRequestContext.toJSON(message.context);
2740
+ obj.context = exports.RequestContext.toJSON(message.context);
2638
2741
  }
2639
2742
  if (message.model !== "") {
2640
2743
  obj.model = message.model;
@@ -2652,7 +2755,7 @@ exports.StreamChatCompletionRequest = {
2652
2755
  obj.toolChoiceMode = toolChoiceModeToJSON(message.toolChoiceMode);
2653
2756
  }
2654
2757
  if (message.generationConfig !== undefined) {
2655
- obj.generationConfig = exports.InferenceGenerationConfig.toJSON(message.generationConfig);
2758
+ obj.generationConfig = exports.GenerationConfig.toJSON(message.generationConfig);
2656
2759
  }
2657
2760
  if (message.responseSchema !== undefined) {
2658
2761
  obj.responseSchema = exports.StructuredOutputSchema.toJSON(message.responseSchema);
@@ -2667,7 +2770,7 @@ exports.StreamChatCompletionRequest = {
2667
2770
  var _c, _d, _e;
2668
2771
  const message = createBaseStreamChatCompletionRequest();
2669
2772
  message.context = (object.context !== undefined && object.context !== null)
2670
- ? exports.InferenceRequestContext.fromPartial(object.context)
2773
+ ? exports.RequestContext.fromPartial(object.context)
2671
2774
  : undefined;
2672
2775
  message.model = (_c = object.model) !== null && _c !== void 0 ? _c : "";
2673
2776
  message.messages = ((_a = object.messages) === null || _a === void 0 ? void 0 : _a.map((e) => exports.ChatMessage.fromPartial(e))) || [];
@@ -2675,7 +2778,7 @@ exports.StreamChatCompletionRequest = {
2675
2778
  message.tools = ((_b = object.tools) === null || _b === void 0 ? void 0 : _b.map((e) => exports.ToolDefinition.fromPartial(e))) || [];
2676
2779
  message.toolChoiceMode = (_e = object.toolChoiceMode) !== null && _e !== void 0 ? _e : 0;
2677
2780
  message.generationConfig = (object.generationConfig !== undefined && object.generationConfig !== null)
2678
- ? exports.InferenceGenerationConfig.fromPartial(object.generationConfig)
2781
+ ? exports.GenerationConfig.fromPartial(object.generationConfig)
2679
2782
  : undefined;
2680
2783
  message.responseSchema = (object.responseSchema !== undefined && object.responseSchema !== null)
2681
2784
  ? exports.StructuredOutputSchema.fromPartial(object.responseSchema)
@@ -2698,7 +2801,7 @@ function createBaseStreamChatCompletionResponse() {
2698
2801
  exports.StreamChatCompletionResponse = {
2699
2802
  encode(message, writer = new wire_1.BinaryWriter()) {
2700
2803
  if (message.context !== undefined) {
2701
- exports.ResolvedInferenceContext.encode(message.context, writer.uint32(10).fork()).join();
2804
+ exports.ResolvedModelRoute.encode(message.context, writer.uint32(10).fork()).join();
2702
2805
  }
2703
2806
  if (message.deltaText !== "") {
2704
2807
  writer.uint32(18).string(message.deltaText);
@@ -2707,13 +2810,13 @@ exports.StreamChatCompletionResponse = {
2707
2810
  exports.ChatMessage.encode(message.deltaMessage, writer.uint32(26).fork()).join();
2708
2811
  }
2709
2812
  if (message.toolCallDelta !== undefined) {
2710
- exports.ToolCall.encode(message.toolCallDelta, writer.uint32(34).fork()).join();
2813
+ exports.ToolCallDelta.encode(message.toolCallDelta, writer.uint32(34).fork()).join();
2711
2814
  }
2712
2815
  if (message.finishReason !== 0) {
2713
2816
  writer.uint32(40).int32(message.finishReason);
2714
2817
  }
2715
2818
  if (message.usage !== undefined) {
2716
- exports.InferenceUsage.encode(message.usage, writer.uint32(50).fork()).join();
2819
+ exports.Usage.encode(message.usage, writer.uint32(50).fork()).join();
2717
2820
  }
2718
2821
  if (message.done !== false) {
2719
2822
  writer.uint32(56).bool(message.done);
@@ -2734,7 +2837,7 @@ exports.StreamChatCompletionResponse = {
2734
2837
  if (tag !== 10) {
2735
2838
  break;
2736
2839
  }
2737
- message.context = exports.ResolvedInferenceContext.decode(reader, reader.uint32());
2840
+ message.context = exports.ResolvedModelRoute.decode(reader, reader.uint32());
2738
2841
  continue;
2739
2842
  }
2740
2843
  case 2: {
@@ -2755,7 +2858,7 @@ exports.StreamChatCompletionResponse = {
2755
2858
  if (tag !== 34) {
2756
2859
  break;
2757
2860
  }
2758
- message.toolCallDelta = exports.ToolCall.decode(reader, reader.uint32());
2861
+ message.toolCallDelta = exports.ToolCallDelta.decode(reader, reader.uint32());
2759
2862
  continue;
2760
2863
  }
2761
2864
  case 5: {
@@ -2769,7 +2872,7 @@ exports.StreamChatCompletionResponse = {
2769
2872
  if (tag !== 50) {
2770
2873
  break;
2771
2874
  }
2772
- message.usage = exports.InferenceUsage.decode(reader, reader.uint32());
2875
+ message.usage = exports.Usage.decode(reader, reader.uint32());
2773
2876
  continue;
2774
2877
  }
2775
2878
  case 7: {
@@ -2796,7 +2899,7 @@ exports.StreamChatCompletionResponse = {
2796
2899
  },
2797
2900
  fromJSON(object) {
2798
2901
  return {
2799
- context: isSet(object.context) ? exports.ResolvedInferenceContext.fromJSON(object.context) : undefined,
2902
+ context: isSet(object.context) ? exports.ResolvedModelRoute.fromJSON(object.context) : undefined,
2800
2903
  deltaText: isSet(object.deltaText)
2801
2904
  ? globalThis.String(object.deltaText)
2802
2905
  : isSet(object.delta_text)
@@ -2808,16 +2911,16 @@ exports.StreamChatCompletionResponse = {
2808
2911
  ? exports.ChatMessage.fromJSON(object.delta_message)
2809
2912
  : undefined,
2810
2913
  toolCallDelta: isSet(object.toolCallDelta)
2811
- ? exports.ToolCall.fromJSON(object.toolCallDelta)
2914
+ ? exports.ToolCallDelta.fromJSON(object.toolCallDelta)
2812
2915
  : isSet(object.tool_call_delta)
2813
- ? exports.ToolCall.fromJSON(object.tool_call_delta)
2916
+ ? exports.ToolCallDelta.fromJSON(object.tool_call_delta)
2814
2917
  : undefined,
2815
2918
  finishReason: isSet(object.finishReason)
2816
- ? inferenceFinishReasonFromJSON(object.finishReason)
2919
+ ? finishReasonFromJSON(object.finishReason)
2817
2920
  : isSet(object.finish_reason)
2818
- ? inferenceFinishReasonFromJSON(object.finish_reason)
2921
+ ? finishReasonFromJSON(object.finish_reason)
2819
2922
  : 0,
2820
- usage: isSet(object.usage) ? exports.InferenceUsage.fromJSON(object.usage) : undefined,
2923
+ usage: isSet(object.usage) ? exports.Usage.fromJSON(object.usage) : undefined,
2821
2924
  done: isSet(object.done) ? globalThis.Boolean(object.done) : false,
2822
2925
  structuredOutput: isObject(object.structuredOutput)
2823
2926
  ? object.structuredOutput
@@ -2829,7 +2932,7 @@ exports.StreamChatCompletionResponse = {
2829
2932
  toJSON(message) {
2830
2933
  const obj = {};
2831
2934
  if (message.context !== undefined) {
2832
- obj.context = exports.ResolvedInferenceContext.toJSON(message.context);
2935
+ obj.context = exports.ResolvedModelRoute.toJSON(message.context);
2833
2936
  }
2834
2937
  if (message.deltaText !== "") {
2835
2938
  obj.deltaText = message.deltaText;
@@ -2838,13 +2941,13 @@ exports.StreamChatCompletionResponse = {
2838
2941
  obj.deltaMessage = exports.ChatMessage.toJSON(message.deltaMessage);
2839
2942
  }
2840
2943
  if (message.toolCallDelta !== undefined) {
2841
- obj.toolCallDelta = exports.ToolCall.toJSON(message.toolCallDelta);
2944
+ obj.toolCallDelta = exports.ToolCallDelta.toJSON(message.toolCallDelta);
2842
2945
  }
2843
2946
  if (message.finishReason !== 0) {
2844
- obj.finishReason = inferenceFinishReasonToJSON(message.finishReason);
2947
+ obj.finishReason = finishReasonToJSON(message.finishReason);
2845
2948
  }
2846
2949
  if (message.usage !== undefined) {
2847
- obj.usage = exports.InferenceUsage.toJSON(message.usage);
2950
+ obj.usage = exports.Usage.toJSON(message.usage);
2848
2951
  }
2849
2952
  if (message.done !== false) {
2850
2953
  obj.done = message.done;
@@ -2861,19 +2964,17 @@ exports.StreamChatCompletionResponse = {
2861
2964
  var _a, _b, _c, _d;
2862
2965
  const message = createBaseStreamChatCompletionResponse();
2863
2966
  message.context = (object.context !== undefined && object.context !== null)
2864
- ? exports.ResolvedInferenceContext.fromPartial(object.context)
2967
+ ? exports.ResolvedModelRoute.fromPartial(object.context)
2865
2968
  : undefined;
2866
2969
  message.deltaText = (_a = object.deltaText) !== null && _a !== void 0 ? _a : "";
2867
2970
  message.deltaMessage = (object.deltaMessage !== undefined && object.deltaMessage !== null)
2868
2971
  ? exports.ChatMessage.fromPartial(object.deltaMessage)
2869
2972
  : undefined;
2870
2973
  message.toolCallDelta = (object.toolCallDelta !== undefined && object.toolCallDelta !== null)
2871
- ? exports.ToolCall.fromPartial(object.toolCallDelta)
2974
+ ? exports.ToolCallDelta.fromPartial(object.toolCallDelta)
2872
2975
  : undefined;
2873
2976
  message.finishReason = (_b = object.finishReason) !== null && _b !== void 0 ? _b : 0;
2874
- message.usage = (object.usage !== undefined && object.usage !== null)
2875
- ? exports.InferenceUsage.fromPartial(object.usage)
2876
- : undefined;
2977
+ message.usage = (object.usage !== undefined && object.usage !== null) ? exports.Usage.fromPartial(object.usage) : undefined;
2877
2978
  message.done = (_c = object.done) !== null && _c !== void 0 ? _c : false;
2878
2979
  message.structuredOutput = (_d = object.structuredOutput) !== null && _d !== void 0 ? _d : undefined;
2879
2980
  return message;
@@ -2893,7 +2994,7 @@ function createBaseCallToolsRequest() {
2893
2994
  exports.CallToolsRequest = {
2894
2995
  encode(message, writer = new wire_1.BinaryWriter()) {
2895
2996
  if (message.context !== undefined) {
2896
- exports.InferenceRequestContext.encode(message.context, writer.uint32(10).fork()).join();
2997
+ exports.RequestContext.encode(message.context, writer.uint32(10).fork()).join();
2897
2998
  }
2898
2999
  if (message.model !== "") {
2899
3000
  writer.uint32(18).string(message.model);
@@ -2911,7 +3012,7 @@ exports.CallToolsRequest = {
2911
3012
  writer.uint32(48).int32(message.toolChoiceMode);
2912
3013
  }
2913
3014
  if (message.generationConfig !== undefined) {
2914
- exports.InferenceGenerationConfig.encode(message.generationConfig, writer.uint32(58).fork()).join();
3015
+ exports.GenerationConfig.encode(message.generationConfig, writer.uint32(58).fork()).join();
2915
3016
  }
2916
3017
  return writer;
2917
3018
  },
@@ -2926,7 +3027,7 @@ exports.CallToolsRequest = {
2926
3027
  if (tag !== 10) {
2927
3028
  break;
2928
3029
  }
2929
- message.context = exports.InferenceRequestContext.decode(reader, reader.uint32());
3030
+ message.context = exports.RequestContext.decode(reader, reader.uint32());
2930
3031
  continue;
2931
3032
  }
2932
3033
  case 2: {
@@ -2968,7 +3069,7 @@ exports.CallToolsRequest = {
2968
3069
  if (tag !== 58) {
2969
3070
  break;
2970
3071
  }
2971
- message.generationConfig = exports.InferenceGenerationConfig.decode(reader, reader.uint32());
3072
+ message.generationConfig = exports.GenerationConfig.decode(reader, reader.uint32());
2972
3073
  continue;
2973
3074
  }
2974
3075
  }
@@ -2981,7 +3082,7 @@ exports.CallToolsRequest = {
2981
3082
  },
2982
3083
  fromJSON(object) {
2983
3084
  return {
2984
- context: isSet(object.context) ? exports.InferenceRequestContext.fromJSON(object.context) : undefined,
3085
+ context: isSet(object.context) ? exports.RequestContext.fromJSON(object.context) : undefined,
2985
3086
  model: isSet(object.model) ? globalThis.String(object.model) : "",
2986
3087
  messages: globalThis.Array.isArray(object === null || object === void 0 ? void 0 : object.messages)
2987
3088
  ? object.messages.map((e) => exports.ChatMessage.fromJSON(e))
@@ -2998,9 +3099,9 @@ exports.CallToolsRequest = {
2998
3099
  ? toolChoiceModeFromJSON(object.tool_choice_mode)
2999
3100
  : 0,
3000
3101
  generationConfig: isSet(object.generationConfig)
3001
- ? exports.InferenceGenerationConfig.fromJSON(object.generationConfig)
3102
+ ? exports.GenerationConfig.fromJSON(object.generationConfig)
3002
3103
  : isSet(object.generation_config)
3003
- ? exports.InferenceGenerationConfig.fromJSON(object.generation_config)
3104
+ ? exports.GenerationConfig.fromJSON(object.generation_config)
3004
3105
  : undefined,
3005
3106
  };
3006
3107
  },
@@ -3008,7 +3109,7 @@ exports.CallToolsRequest = {
3008
3109
  var _a, _b;
3009
3110
  const obj = {};
3010
3111
  if (message.context !== undefined) {
3011
- obj.context = exports.InferenceRequestContext.toJSON(message.context);
3112
+ obj.context = exports.RequestContext.toJSON(message.context);
3012
3113
  }
3013
3114
  if (message.model !== "") {
3014
3115
  obj.model = message.model;
@@ -3026,7 +3127,7 @@ exports.CallToolsRequest = {
3026
3127
  obj.toolChoiceMode = toolChoiceModeToJSON(message.toolChoiceMode);
3027
3128
  }
3028
3129
  if (message.generationConfig !== undefined) {
3029
- obj.generationConfig = exports.InferenceGenerationConfig.toJSON(message.generationConfig);
3130
+ obj.generationConfig = exports.GenerationConfig.toJSON(message.generationConfig);
3030
3131
  }
3031
3132
  return obj;
3032
3133
  },
@@ -3038,7 +3139,7 @@ exports.CallToolsRequest = {
3038
3139
  var _c, _d, _e;
3039
3140
  const message = createBaseCallToolsRequest();
3040
3141
  message.context = (object.context !== undefined && object.context !== null)
3041
- ? exports.InferenceRequestContext.fromPartial(object.context)
3142
+ ? exports.RequestContext.fromPartial(object.context)
3042
3143
  : undefined;
3043
3144
  message.model = (_c = object.model) !== null && _c !== void 0 ? _c : "";
3044
3145
  message.messages = ((_a = object.messages) === null || _a === void 0 ? void 0 : _a.map((e) => exports.ChatMessage.fromPartial(e))) || [];
@@ -3046,7 +3147,7 @@ exports.CallToolsRequest = {
3046
3147
  message.tools = ((_b = object.tools) === null || _b === void 0 ? void 0 : _b.map((e) => exports.ToolDefinition.fromPartial(e))) || [];
3047
3148
  message.toolChoiceMode = (_e = object.toolChoiceMode) !== null && _e !== void 0 ? _e : 0;
3048
3149
  message.generationConfig = (object.generationConfig !== undefined && object.generationConfig !== null)
3049
- ? exports.InferenceGenerationConfig.fromPartial(object.generationConfig)
3150
+ ? exports.GenerationConfig.fromPartial(object.generationConfig)
3050
3151
  : undefined;
3051
3152
  return message;
3052
3153
  },
@@ -3057,7 +3158,7 @@ function createBaseCallToolsResponse() {
3057
3158
  exports.CallToolsResponse = {
3058
3159
  encode(message, writer = new wire_1.BinaryWriter()) {
3059
3160
  if (message.context !== undefined) {
3060
- exports.ResolvedInferenceContext.encode(message.context, writer.uint32(10).fork()).join();
3161
+ exports.ResolvedModelRoute.encode(message.context, writer.uint32(10).fork()).join();
3061
3162
  }
3062
3163
  if (message.message !== undefined) {
3063
3164
  exports.ChatMessage.encode(message.message, writer.uint32(18).fork()).join();
@@ -3069,7 +3170,7 @@ exports.CallToolsResponse = {
3069
3170
  writer.uint32(32).int32(message.finishReason);
3070
3171
  }
3071
3172
  if (message.usage !== undefined) {
3072
- exports.InferenceUsage.encode(message.usage, writer.uint32(42).fork()).join();
3173
+ exports.Usage.encode(message.usage, writer.uint32(42).fork()).join();
3073
3174
  }
3074
3175
  return writer;
3075
3176
  },
@@ -3084,7 +3185,7 @@ exports.CallToolsResponse = {
3084
3185
  if (tag !== 10) {
3085
3186
  break;
3086
3187
  }
3087
- message.context = exports.ResolvedInferenceContext.decode(reader, reader.uint32());
3188
+ message.context = exports.ResolvedModelRoute.decode(reader, reader.uint32());
3088
3189
  continue;
3089
3190
  }
3090
3191
  case 2: {
@@ -3112,7 +3213,7 @@ exports.CallToolsResponse = {
3112
3213
  if (tag !== 42) {
3113
3214
  break;
3114
3215
  }
3115
- message.usage = exports.InferenceUsage.decode(reader, reader.uint32());
3216
+ message.usage = exports.Usage.decode(reader, reader.uint32());
3116
3217
  continue;
3117
3218
  }
3118
3219
  }
@@ -3125,7 +3226,7 @@ exports.CallToolsResponse = {
3125
3226
  },
3126
3227
  fromJSON(object) {
3127
3228
  return {
3128
- context: isSet(object.context) ? exports.ResolvedInferenceContext.fromJSON(object.context) : undefined,
3229
+ context: isSet(object.context) ? exports.ResolvedModelRoute.fromJSON(object.context) : undefined,
3129
3230
  message: isSet(object.message) ? exports.ChatMessage.fromJSON(object.message) : undefined,
3130
3231
  toolCalls: globalThis.Array.isArray(object === null || object === void 0 ? void 0 : object.toolCalls)
3131
3232
  ? object.toolCalls.map((e) => exports.ToolCall.fromJSON(e))
@@ -3133,18 +3234,18 @@ exports.CallToolsResponse = {
3133
3234
  ? object.tool_calls.map((e) => exports.ToolCall.fromJSON(e))
3134
3235
  : [],
3135
3236
  finishReason: isSet(object.finishReason)
3136
- ? inferenceFinishReasonFromJSON(object.finishReason)
3237
+ ? finishReasonFromJSON(object.finishReason)
3137
3238
  : isSet(object.finish_reason)
3138
- ? inferenceFinishReasonFromJSON(object.finish_reason)
3239
+ ? finishReasonFromJSON(object.finish_reason)
3139
3240
  : 0,
3140
- usage: isSet(object.usage) ? exports.InferenceUsage.fromJSON(object.usage) : undefined,
3241
+ usage: isSet(object.usage) ? exports.Usage.fromJSON(object.usage) : undefined,
3141
3242
  };
3142
3243
  },
3143
3244
  toJSON(message) {
3144
3245
  var _a;
3145
3246
  const obj = {};
3146
3247
  if (message.context !== undefined) {
3147
- obj.context = exports.ResolvedInferenceContext.toJSON(message.context);
3248
+ obj.context = exports.ResolvedModelRoute.toJSON(message.context);
3148
3249
  }
3149
3250
  if (message.message !== undefined) {
3150
3251
  obj.message = exports.ChatMessage.toJSON(message.message);
@@ -3153,10 +3254,10 @@ exports.CallToolsResponse = {
3153
3254
  obj.toolCalls = message.toolCalls.map((e) => exports.ToolCall.toJSON(e));
3154
3255
  }
3155
3256
  if (message.finishReason !== 0) {
3156
- obj.finishReason = inferenceFinishReasonToJSON(message.finishReason);
3257
+ obj.finishReason = finishReasonToJSON(message.finishReason);
3157
3258
  }
3158
3259
  if (message.usage !== undefined) {
3159
- obj.usage = exports.InferenceUsage.toJSON(message.usage);
3260
+ obj.usage = exports.Usage.toJSON(message.usage);
3160
3261
  }
3161
3262
  return obj;
3162
3263
  },
@@ -3168,16 +3269,14 @@ exports.CallToolsResponse = {
3168
3269
  var _b;
3169
3270
  const message = createBaseCallToolsResponse();
3170
3271
  message.context = (object.context !== undefined && object.context !== null)
3171
- ? exports.ResolvedInferenceContext.fromPartial(object.context)
3272
+ ? exports.ResolvedModelRoute.fromPartial(object.context)
3172
3273
  : undefined;
3173
3274
  message.message = (object.message !== undefined && object.message !== null)
3174
3275
  ? exports.ChatMessage.fromPartial(object.message)
3175
3276
  : undefined;
3176
3277
  message.toolCalls = ((_a = object.toolCalls) === null || _a === void 0 ? void 0 : _a.map((e) => exports.ToolCall.fromPartial(e))) || [];
3177
3278
  message.finishReason = (_b = object.finishReason) !== null && _b !== void 0 ? _b : 0;
3178
- message.usage = (object.usage !== undefined && object.usage !== null)
3179
- ? exports.InferenceUsage.fromPartial(object.usage)
3180
- : undefined;
3279
+ message.usage = (object.usage !== undefined && object.usage !== null) ? exports.Usage.fromPartial(object.usage) : undefined;
3181
3280
  return message;
3182
3281
  },
3183
3282
  };
@@ -3187,7 +3286,7 @@ function createBaseCreateEmbeddingsRequest() {
3187
3286
  exports.CreateEmbeddingsRequest = {
3188
3287
  encode(message, writer = new wire_1.BinaryWriter()) {
3189
3288
  if (message.context !== undefined) {
3190
- exports.InferenceRequestContext.encode(message.context, writer.uint32(10).fork()).join();
3289
+ exports.RequestContext.encode(message.context, writer.uint32(10).fork()).join();
3191
3290
  }
3192
3291
  if (message.model !== "") {
3193
3292
  writer.uint32(18).string(message.model);
@@ -3217,7 +3316,7 @@ exports.CreateEmbeddingsRequest = {
3217
3316
  if (tag !== 10) {
3218
3317
  break;
3219
3318
  }
3220
- message.context = exports.InferenceRequestContext.decode(reader, reader.uint32());
3319
+ message.context = exports.RequestContext.decode(reader, reader.uint32());
3221
3320
  continue;
3222
3321
  }
3223
3322
  case 2: {
@@ -3265,7 +3364,7 @@ exports.CreateEmbeddingsRequest = {
3265
3364
  },
3266
3365
  fromJSON(object) {
3267
3366
  return {
3268
- context: isSet(object.context) ? exports.InferenceRequestContext.fromJSON(object.context) : undefined,
3367
+ context: isSet(object.context) ? exports.RequestContext.fromJSON(object.context) : undefined,
3269
3368
  model: isSet(object.model) ? globalThis.String(object.model) : "",
3270
3369
  inputs: globalThis.Array.isArray(object === null || object === void 0 ? void 0 : object.inputs) ? object.inputs.map((e) => exports.EmbeddingInput.fromJSON(e)) : [],
3271
3370
  dimensions: isSet(object.dimensions) ? globalThis.Number(object.dimensions) : 0,
@@ -3281,7 +3380,7 @@ exports.CreateEmbeddingsRequest = {
3281
3380
  var _a;
3282
3381
  const obj = {};
3283
3382
  if (message.context !== undefined) {
3284
- obj.context = exports.InferenceRequestContext.toJSON(message.context);
3383
+ obj.context = exports.RequestContext.toJSON(message.context);
3285
3384
  }
3286
3385
  if (message.model !== "") {
3287
3386
  obj.model = message.model;
@@ -3308,7 +3407,7 @@ exports.CreateEmbeddingsRequest = {
3308
3407
  var _b, _c, _d, _e;
3309
3408
  const message = createBaseCreateEmbeddingsRequest();
3310
3409
  message.context = (object.context !== undefined && object.context !== null)
3311
- ? exports.InferenceRequestContext.fromPartial(object.context)
3410
+ ? exports.RequestContext.fromPartial(object.context)
3312
3411
  : undefined;
3313
3412
  message.model = (_b = object.model) !== null && _b !== void 0 ? _b : "";
3314
3413
  message.inputs = ((_a = object.inputs) === null || _a === void 0 ? void 0 : _a.map((e) => exports.EmbeddingInput.fromPartial(e))) || [];
@@ -3324,13 +3423,13 @@ function createBaseCreateEmbeddingsResponse() {
3324
3423
  exports.CreateEmbeddingsResponse = {
3325
3424
  encode(message, writer = new wire_1.BinaryWriter()) {
3326
3425
  if (message.context !== undefined) {
3327
- exports.ResolvedInferenceContext.encode(message.context, writer.uint32(10).fork()).join();
3426
+ exports.ResolvedModelRoute.encode(message.context, writer.uint32(10).fork()).join();
3328
3427
  }
3329
3428
  for (const v of message.embeddings) {
3330
3429
  exports.EmbeddingVector.encode(v, writer.uint32(18).fork()).join();
3331
3430
  }
3332
3431
  if (message.usage !== undefined) {
3333
- exports.InferenceUsage.encode(message.usage, writer.uint32(26).fork()).join();
3432
+ exports.Usage.encode(message.usage, writer.uint32(26).fork()).join();
3334
3433
  }
3335
3434
  return writer;
3336
3435
  },
@@ -3345,7 +3444,7 @@ exports.CreateEmbeddingsResponse = {
3345
3444
  if (tag !== 10) {
3346
3445
  break;
3347
3446
  }
3348
- message.context = exports.ResolvedInferenceContext.decode(reader, reader.uint32());
3447
+ message.context = exports.ResolvedModelRoute.decode(reader, reader.uint32());
3349
3448
  continue;
3350
3449
  }
3351
3450
  case 2: {
@@ -3359,7 +3458,7 @@ exports.CreateEmbeddingsResponse = {
3359
3458
  if (tag !== 26) {
3360
3459
  break;
3361
3460
  }
3362
- message.usage = exports.InferenceUsage.decode(reader, reader.uint32());
3461
+ message.usage = exports.Usage.decode(reader, reader.uint32());
3363
3462
  continue;
3364
3463
  }
3365
3464
  }
@@ -3372,24 +3471,24 @@ exports.CreateEmbeddingsResponse = {
3372
3471
  },
3373
3472
  fromJSON(object) {
3374
3473
  return {
3375
- context: isSet(object.context) ? exports.ResolvedInferenceContext.fromJSON(object.context) : undefined,
3474
+ context: isSet(object.context) ? exports.ResolvedModelRoute.fromJSON(object.context) : undefined,
3376
3475
  embeddings: globalThis.Array.isArray(object === null || object === void 0 ? void 0 : object.embeddings)
3377
3476
  ? object.embeddings.map((e) => exports.EmbeddingVector.fromJSON(e))
3378
3477
  : [],
3379
- usage: isSet(object.usage) ? exports.InferenceUsage.fromJSON(object.usage) : undefined,
3478
+ usage: isSet(object.usage) ? exports.Usage.fromJSON(object.usage) : undefined,
3380
3479
  };
3381
3480
  },
3382
3481
  toJSON(message) {
3383
3482
  var _a;
3384
3483
  const obj = {};
3385
3484
  if (message.context !== undefined) {
3386
- obj.context = exports.ResolvedInferenceContext.toJSON(message.context);
3485
+ obj.context = exports.ResolvedModelRoute.toJSON(message.context);
3387
3486
  }
3388
3487
  if ((_a = message.embeddings) === null || _a === void 0 ? void 0 : _a.length) {
3389
3488
  obj.embeddings = message.embeddings.map((e) => exports.EmbeddingVector.toJSON(e));
3390
3489
  }
3391
3490
  if (message.usage !== undefined) {
3392
- obj.usage = exports.InferenceUsage.toJSON(message.usage);
3491
+ obj.usage = exports.Usage.toJSON(message.usage);
3393
3492
  }
3394
3493
  return obj;
3395
3494
  },
@@ -3400,12 +3499,10 @@ exports.CreateEmbeddingsResponse = {
3400
3499
  var _a;
3401
3500
  const message = createBaseCreateEmbeddingsResponse();
3402
3501
  message.context = (object.context !== undefined && object.context !== null)
3403
- ? exports.ResolvedInferenceContext.fromPartial(object.context)
3502
+ ? exports.ResolvedModelRoute.fromPartial(object.context)
3404
3503
  : undefined;
3405
3504
  message.embeddings = ((_a = object.embeddings) === null || _a === void 0 ? void 0 : _a.map((e) => exports.EmbeddingVector.fromPartial(e))) || [];
3406
- message.usage = (object.usage !== undefined && object.usage !== null)
3407
- ? exports.InferenceUsage.fromPartial(object.usage)
3408
- : undefined;
3505
+ message.usage = (object.usage !== undefined && object.usage !== null) ? exports.Usage.fromPartial(object.usage) : undefined;
3409
3506
  return message;
3410
3507
  },
3411
3508
  };
@@ -3426,7 +3523,7 @@ function createBaseGenerateImagesRequest() {
3426
3523
  exports.GenerateImagesRequest = {
3427
3524
  encode(message, writer = new wire_1.BinaryWriter()) {
3428
3525
  if (message.context !== undefined) {
3429
- exports.InferenceRequestContext.encode(message.context, writer.uint32(10).fork()).join();
3526
+ exports.RequestContext.encode(message.context, writer.uint32(10).fork()).join();
3430
3527
  }
3431
3528
  if (message.model !== "") {
3432
3529
  writer.uint32(18).string(message.model);
@@ -3468,7 +3565,7 @@ exports.GenerateImagesRequest = {
3468
3565
  if (tag !== 10) {
3469
3566
  break;
3470
3567
  }
3471
- message.context = exports.InferenceRequestContext.decode(reader, reader.uint32());
3568
+ message.context = exports.RequestContext.decode(reader, reader.uint32());
3472
3569
  continue;
3473
3570
  }
3474
3571
  case 2: {
@@ -3544,7 +3641,7 @@ exports.GenerateImagesRequest = {
3544
3641
  },
3545
3642
  fromJSON(object) {
3546
3643
  return {
3547
- context: isSet(object.context) ? exports.InferenceRequestContext.fromJSON(object.context) : undefined,
3644
+ context: isSet(object.context) ? exports.RequestContext.fromJSON(object.context) : undefined,
3548
3645
  model: isSet(object.model) ? globalThis.String(object.model) : "",
3549
3646
  prompt: isSet(object.prompt) ? globalThis.String(object.prompt) : "",
3550
3647
  negativePrompt: isSet(object.negativePrompt)
@@ -3571,7 +3668,7 @@ exports.GenerateImagesRequest = {
3571
3668
  toJSON(message) {
3572
3669
  const obj = {};
3573
3670
  if (message.context !== undefined) {
3574
- obj.context = exports.InferenceRequestContext.toJSON(message.context);
3671
+ obj.context = exports.RequestContext.toJSON(message.context);
3575
3672
  }
3576
3673
  if (message.model !== "") {
3577
3674
  obj.model = message.model;
@@ -3609,7 +3706,7 @@ exports.GenerateImagesRequest = {
3609
3706
  var _a, _b, _c, _d, _e, _f, _g, _h, _j;
3610
3707
  const message = createBaseGenerateImagesRequest();
3611
3708
  message.context = (object.context !== undefined && object.context !== null)
3612
- ? exports.InferenceRequestContext.fromPartial(object.context)
3709
+ ? exports.RequestContext.fromPartial(object.context)
3613
3710
  : undefined;
3614
3711
  message.model = (_a = object.model) !== null && _a !== void 0 ? _a : "";
3615
3712
  message.prompt = (_b = object.prompt) !== null && _b !== void 0 ? _b : "";
@@ -3629,7 +3726,7 @@ function createBaseGenerateImagesResponse() {
3629
3726
  exports.GenerateImagesResponse = {
3630
3727
  encode(message, writer = new wire_1.BinaryWriter()) {
3631
3728
  if (message.context !== undefined) {
3632
- exports.ResolvedInferenceContext.encode(message.context, writer.uint32(10).fork()).join();
3729
+ exports.ResolvedModelRoute.encode(message.context, writer.uint32(10).fork()).join();
3633
3730
  }
3634
3731
  for (const v of message.images) {
3635
3732
  exports.GeneratedImage.encode(v, writer.uint32(18).fork()).join();
@@ -3647,7 +3744,7 @@ exports.GenerateImagesResponse = {
3647
3744
  if (tag !== 10) {
3648
3745
  break;
3649
3746
  }
3650
- message.context = exports.ResolvedInferenceContext.decode(reader, reader.uint32());
3747
+ message.context = exports.ResolvedModelRoute.decode(reader, reader.uint32());
3651
3748
  continue;
3652
3749
  }
3653
3750
  case 2: {
@@ -3667,7 +3764,7 @@ exports.GenerateImagesResponse = {
3667
3764
  },
3668
3765
  fromJSON(object) {
3669
3766
  return {
3670
- context: isSet(object.context) ? exports.ResolvedInferenceContext.fromJSON(object.context) : undefined,
3767
+ context: isSet(object.context) ? exports.ResolvedModelRoute.fromJSON(object.context) : undefined,
3671
3768
  images: globalThis.Array.isArray(object === null || object === void 0 ? void 0 : object.images) ? object.images.map((e) => exports.GeneratedImage.fromJSON(e)) : [],
3672
3769
  };
3673
3770
  },
@@ -3675,7 +3772,7 @@ exports.GenerateImagesResponse = {
3675
3772
  var _a;
3676
3773
  const obj = {};
3677
3774
  if (message.context !== undefined) {
3678
- obj.context = exports.ResolvedInferenceContext.toJSON(message.context);
3775
+ obj.context = exports.ResolvedModelRoute.toJSON(message.context);
3679
3776
  }
3680
3777
  if ((_a = message.images) === null || _a === void 0 ? void 0 : _a.length) {
3681
3778
  obj.images = message.images.map((e) => exports.GeneratedImage.toJSON(e));
@@ -3689,7 +3786,7 @@ exports.GenerateImagesResponse = {
3689
3786
  var _a;
3690
3787
  const message = createBaseGenerateImagesResponse();
3691
3788
  message.context = (object.context !== undefined && object.context !== null)
3692
- ? exports.ResolvedInferenceContext.fromPartial(object.context)
3789
+ ? exports.ResolvedModelRoute.fromPartial(object.context)
3693
3790
  : undefined;
3694
3791
  message.images = ((_a = object.images) === null || _a === void 0 ? void 0 : _a.map((e) => exports.GeneratedImage.fromPartial(e))) || [];
3695
3792
  return message;
@@ -3701,7 +3798,7 @@ function createBaseCallMCPRequest() {
3701
3798
  exports.CallMCPRequest = {
3702
3799
  encode(message, writer = new wire_1.BinaryWriter()) {
3703
3800
  if (message.context !== undefined) {
3704
- exports.InferenceRequestContext.encode(message.context, writer.uint32(10).fork()).join();
3801
+ exports.RequestContext.encode(message.context, writer.uint32(10).fork()).join();
3705
3802
  }
3706
3803
  if (message.model !== "") {
3707
3804
  writer.uint32(18).string(message.model);
@@ -3731,7 +3828,7 @@ exports.CallMCPRequest = {
3731
3828
  if (tag !== 10) {
3732
3829
  break;
3733
3830
  }
3734
- message.context = exports.InferenceRequestContext.decode(reader, reader.uint32());
3831
+ message.context = exports.RequestContext.decode(reader, reader.uint32());
3735
3832
  continue;
3736
3833
  }
3737
3834
  case 2: {
@@ -3779,7 +3876,7 @@ exports.CallMCPRequest = {
3779
3876
  },
3780
3877
  fromJSON(object) {
3781
3878
  return {
3782
- context: isSet(object.context) ? exports.InferenceRequestContext.fromJSON(object.context) : undefined,
3879
+ context: isSet(object.context) ? exports.RequestContext.fromJSON(object.context) : undefined,
3783
3880
  model: isSet(object.model) ? globalThis.String(object.model) : "",
3784
3881
  serverName: isSet(object.serverName)
3785
3882
  ? globalThis.String(object.serverName)
@@ -3798,7 +3895,7 @@ exports.CallMCPRequest = {
3798
3895
  toJSON(message) {
3799
3896
  const obj = {};
3800
3897
  if (message.context !== undefined) {
3801
- obj.context = exports.InferenceRequestContext.toJSON(message.context);
3898
+ obj.context = exports.RequestContext.toJSON(message.context);
3802
3899
  }
3803
3900
  if (message.model !== "") {
3804
3901
  obj.model = message.model;
@@ -3824,7 +3921,7 @@ exports.CallMCPRequest = {
3824
3921
  var _a, _b, _c, _d, _e;
3825
3922
  const message = createBaseCallMCPRequest();
3826
3923
  message.context = (object.context !== undefined && object.context !== null)
3827
- ? exports.InferenceRequestContext.fromPartial(object.context)
3924
+ ? exports.RequestContext.fromPartial(object.context)
3828
3925
  : undefined;
3829
3926
  message.model = (_a = object.model) !== null && _a !== void 0 ? _a : "";
3830
3927
  message.serverName = (_b = object.serverName) !== null && _b !== void 0 ? _b : "";
@@ -3840,7 +3937,7 @@ function createBaseCallMCPResponse() {
3840
3937
  exports.CallMCPResponse = {
3841
3938
  encode(message, writer = new wire_1.BinaryWriter()) {
3842
3939
  if (message.context !== undefined) {
3843
- exports.ResolvedInferenceContext.encode(message.context, writer.uint32(10).fork()).join();
3940
+ exports.ResolvedModelRoute.encode(message.context, writer.uint32(10).fork()).join();
3844
3941
  }
3845
3942
  if (message.result !== undefined) {
3846
3943
  struct_pb_1.Struct.encode(struct_pb_1.Struct.wrap(message.result), writer.uint32(18).fork()).join();
@@ -3858,7 +3955,7 @@ exports.CallMCPResponse = {
3858
3955
  if (tag !== 10) {
3859
3956
  break;
3860
3957
  }
3861
- message.context = exports.ResolvedInferenceContext.decode(reader, reader.uint32());
3958
+ message.context = exports.ResolvedModelRoute.decode(reader, reader.uint32());
3862
3959
  continue;
3863
3960
  }
3864
3961
  case 2: {
@@ -3878,14 +3975,14 @@ exports.CallMCPResponse = {
3878
3975
  },
3879
3976
  fromJSON(object) {
3880
3977
  return {
3881
- context: isSet(object.context) ? exports.ResolvedInferenceContext.fromJSON(object.context) : undefined,
3978
+ context: isSet(object.context) ? exports.ResolvedModelRoute.fromJSON(object.context) : undefined,
3882
3979
  result: isObject(object.result) ? object.result : undefined,
3883
3980
  };
3884
3981
  },
3885
3982
  toJSON(message) {
3886
3983
  const obj = {};
3887
3984
  if (message.context !== undefined) {
3888
- obj.context = exports.ResolvedInferenceContext.toJSON(message.context);
3985
+ obj.context = exports.ResolvedModelRoute.toJSON(message.context);
3889
3986
  }
3890
3987
  if (message.result !== undefined) {
3891
3988
  obj.result = message.result;
@@ -3899,7 +3996,7 @@ exports.CallMCPResponse = {
3899
3996
  var _a;
3900
3997
  const message = createBaseCallMCPResponse();
3901
3998
  message.context = (object.context !== undefined && object.context !== null)
3902
- ? exports.ResolvedInferenceContext.fromPartial(object.context)
3999
+ ? exports.ResolvedModelRoute.fromPartial(object.context)
3903
4000
  : undefined;
3904
4001
  message.result = (_a = object.result) !== null && _a !== void 0 ? _a : undefined;
3905
4002
  return message;
@@ -4807,7 +4904,7 @@ exports.OpenAICompatibilityServiceCreateChatCompletionResponse = {
4807
4904
  exports.OpenAIChatChoice.encode(v, writer.uint32(34).fork()).join();
4808
4905
  }
4809
4906
  if (message.usage !== undefined) {
4810
- exports.InferenceUsage.encode(message.usage, writer.uint32(42).fork()).join();
4907
+ exports.Usage.encode(message.usage, writer.uint32(42).fork()).join();
4811
4908
  }
4812
4909
  return writer;
4813
4910
  },
@@ -4850,7 +4947,7 @@ exports.OpenAICompatibilityServiceCreateChatCompletionResponse = {
4850
4947
  if (tag !== 42) {
4851
4948
  break;
4852
4949
  }
4853
- message.usage = exports.InferenceUsage.decode(reader, reader.uint32());
4950
+ message.usage = exports.Usage.decode(reader, reader.uint32());
4854
4951
  continue;
4855
4952
  }
4856
4953
  }
@@ -4869,7 +4966,7 @@ exports.OpenAICompatibilityServiceCreateChatCompletionResponse = {
4869
4966
  choices: globalThis.Array.isArray(object === null || object === void 0 ? void 0 : object.choices)
4870
4967
  ? object.choices.map((e) => exports.OpenAIChatChoice.fromJSON(e))
4871
4968
  : [],
4872
- usage: isSet(object.usage) ? exports.InferenceUsage.fromJSON(object.usage) : undefined,
4969
+ usage: isSet(object.usage) ? exports.Usage.fromJSON(object.usage) : undefined,
4873
4970
  };
4874
4971
  },
4875
4972
  toJSON(message) {
@@ -4888,7 +4985,7 @@ exports.OpenAICompatibilityServiceCreateChatCompletionResponse = {
4888
4985
  obj.choices = message.choices.map((e) => exports.OpenAIChatChoice.toJSON(e));
4889
4986
  }
4890
4987
  if (message.usage !== undefined) {
4891
- obj.usage = exports.InferenceUsage.toJSON(message.usage);
4988
+ obj.usage = exports.Usage.toJSON(message.usage);
4892
4989
  }
4893
4990
  return obj;
4894
4991
  },
@@ -4903,9 +5000,7 @@ exports.OpenAICompatibilityServiceCreateChatCompletionResponse = {
4903
5000
  message.object = (_c = object.object) !== null && _c !== void 0 ? _c : "";
4904
5001
  message.model = (_d = object.model) !== null && _d !== void 0 ? _d : "";
4905
5002
  message.choices = ((_a = object.choices) === null || _a === void 0 ? void 0 : _a.map((e) => exports.OpenAIChatChoice.fromPartial(e))) || [];
4906
- message.usage = (object.usage !== undefined && object.usage !== null)
4907
- ? exports.InferenceUsage.fromPartial(object.usage)
4908
- : undefined;
5003
+ message.usage = (object.usage !== undefined && object.usage !== null) ? exports.Usage.fromPartial(object.usage) : undefined;
4909
5004
  return message;
4910
5005
  },
4911
5006
  };
@@ -5255,7 +5350,7 @@ exports.OpenAICompatibilityServiceStreamChatCompletionResponse = {
5255
5350
  exports.OpenAIChatDeltaChoice.encode(v, writer.uint32(34).fork()).join();
5256
5351
  }
5257
5352
  if (message.usage !== undefined) {
5258
- exports.InferenceUsage.encode(message.usage, writer.uint32(42).fork()).join();
5353
+ exports.Usage.encode(message.usage, writer.uint32(42).fork()).join();
5259
5354
  }
5260
5355
  if (message.done !== false) {
5261
5356
  writer.uint32(48).bool(message.done);
@@ -5301,7 +5396,7 @@ exports.OpenAICompatibilityServiceStreamChatCompletionResponse = {
5301
5396
  if (tag !== 42) {
5302
5397
  break;
5303
5398
  }
5304
- message.usage = exports.InferenceUsage.decode(reader, reader.uint32());
5399
+ message.usage = exports.Usage.decode(reader, reader.uint32());
5305
5400
  continue;
5306
5401
  }
5307
5402
  case 6: {
@@ -5327,7 +5422,7 @@ exports.OpenAICompatibilityServiceStreamChatCompletionResponse = {
5327
5422
  choices: globalThis.Array.isArray(object === null || object === void 0 ? void 0 : object.choices)
5328
5423
  ? object.choices.map((e) => exports.OpenAIChatDeltaChoice.fromJSON(e))
5329
5424
  : [],
5330
- usage: isSet(object.usage) ? exports.InferenceUsage.fromJSON(object.usage) : undefined,
5425
+ usage: isSet(object.usage) ? exports.Usage.fromJSON(object.usage) : undefined,
5331
5426
  done: isSet(object.done) ? globalThis.Boolean(object.done) : false,
5332
5427
  };
5333
5428
  },
@@ -5347,7 +5442,7 @@ exports.OpenAICompatibilityServiceStreamChatCompletionResponse = {
5347
5442
  obj.choices = message.choices.map((e) => exports.OpenAIChatDeltaChoice.toJSON(e));
5348
5443
  }
5349
5444
  if (message.usage !== undefined) {
5350
- obj.usage = exports.InferenceUsage.toJSON(message.usage);
5445
+ obj.usage = exports.Usage.toJSON(message.usage);
5351
5446
  }
5352
5447
  if (message.done !== false) {
5353
5448
  obj.done = message.done;
@@ -5365,9 +5460,7 @@ exports.OpenAICompatibilityServiceStreamChatCompletionResponse = {
5365
5460
  message.object = (_c = object.object) !== null && _c !== void 0 ? _c : "";
5366
5461
  message.model = (_d = object.model) !== null && _d !== void 0 ? _d : "";
5367
5462
  message.choices = ((_a = object.choices) === null || _a === void 0 ? void 0 : _a.map((e) => exports.OpenAIChatDeltaChoice.fromPartial(e))) || [];
5368
- message.usage = (object.usage !== undefined && object.usage !== null)
5369
- ? exports.InferenceUsage.fromPartial(object.usage)
5370
- : undefined;
5463
+ message.usage = (object.usage !== undefined && object.usage !== null) ? exports.Usage.fromPartial(object.usage) : undefined;
5371
5464
  message.done = (_e = object.done) !== null && _e !== void 0 ? _e : false;
5372
5465
  return message;
5373
5466
  },
@@ -5604,7 +5697,7 @@ exports.OpenAICompatibilityServiceCreateEmbeddingResponse = {
5604
5697
  writer.uint32(26).string(message.model);
5605
5698
  }
5606
5699
  if (message.usage !== undefined) {
5607
- exports.InferenceUsage.encode(message.usage, writer.uint32(34).fork()).join();
5700
+ exports.Usage.encode(message.usage, writer.uint32(34).fork()).join();
5608
5701
  }
5609
5702
  return writer;
5610
5703
  },
@@ -5640,7 +5733,7 @@ exports.OpenAICompatibilityServiceCreateEmbeddingResponse = {
5640
5733
  if (tag !== 34) {
5641
5734
  break;
5642
5735
  }
5643
- message.usage = exports.InferenceUsage.decode(reader, reader.uint32());
5736
+ message.usage = exports.Usage.decode(reader, reader.uint32());
5644
5737
  continue;
5645
5738
  }
5646
5739
  }
@@ -5656,7 +5749,7 @@ exports.OpenAICompatibilityServiceCreateEmbeddingResponse = {
5656
5749
  object: isSet(object.object) ? globalThis.String(object.object) : "",
5657
5750
  data: globalThis.Array.isArray(object === null || object === void 0 ? void 0 : object.data) ? object.data.map((e) => exports.OpenAIEmbeddingData.fromJSON(e)) : [],
5658
5751
  model: isSet(object.model) ? globalThis.String(object.model) : "",
5659
- usage: isSet(object.usage) ? exports.InferenceUsage.fromJSON(object.usage) : undefined,
5752
+ usage: isSet(object.usage) ? exports.Usage.fromJSON(object.usage) : undefined,
5660
5753
  };
5661
5754
  },
5662
5755
  toJSON(message) {
@@ -5672,7 +5765,7 @@ exports.OpenAICompatibilityServiceCreateEmbeddingResponse = {
5672
5765
  obj.model = message.model;
5673
5766
  }
5674
5767
  if (message.usage !== undefined) {
5675
- obj.usage = exports.InferenceUsage.toJSON(message.usage);
5768
+ obj.usage = exports.Usage.toJSON(message.usage);
5676
5769
  }
5677
5770
  return obj;
5678
5771
  },
@@ -5686,9 +5779,7 @@ exports.OpenAICompatibilityServiceCreateEmbeddingResponse = {
5686
5779
  message.object = (_b = object.object) !== null && _b !== void 0 ? _b : "";
5687
5780
  message.data = ((_a = object.data) === null || _a === void 0 ? void 0 : _a.map((e) => exports.OpenAIEmbeddingData.fromPartial(e))) || [];
5688
5781
  message.model = (_c = object.model) !== null && _c !== void 0 ? _c : "";
5689
- message.usage = (object.usage !== undefined && object.usage !== null)
5690
- ? exports.InferenceUsage.fromPartial(object.usage)
5691
- : undefined;
5782
+ message.usage = (object.usage !== undefined && object.usage !== null) ? exports.Usage.fromPartial(object.usage) : undefined;
5692
5783
  return message;
5693
5784
  },
5694
5785
  };