liter_llm 1.0.0.pre.rc.6
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/README.md +239 -0
- data/ext/liter_llm_rb/extconf.rb +65 -0
- data/ext/liter_llm_rb/native/.cargo/config.toml +23 -0
- data/ext/liter_llm_rb/native/Cargo.lock +3713 -0
- data/ext/liter_llm_rb/native/Cargo.toml +32 -0
- data/ext/liter_llm_rb/native/build.rs +15 -0
- data/ext/liter_llm_rb/native/src/lib.rs +1079 -0
- data/lib/liter_llm.rb +8 -0
- data/sig/liter_llm.rbs +416 -0
- data/vendor/Cargo.toml +54 -0
- data/vendor/liter-llm/Cargo.toml +92 -0
- data/vendor/liter-llm/README.md +252 -0
- data/vendor/liter-llm/schemas/pricing.json +40 -0
- data/vendor/liter-llm/schemas/providers.json +1662 -0
- data/vendor/liter-llm/src/auth/azure_ad.rs +264 -0
- data/vendor/liter-llm/src/auth/bedrock_sts.rs +353 -0
- data/vendor/liter-llm/src/auth/mod.rs +68 -0
- data/vendor/liter-llm/src/auth/vertex_oauth.rs +353 -0
- data/vendor/liter-llm/src/client/config.rs +351 -0
- data/vendor/liter-llm/src/client/managed.rs +622 -0
- data/vendor/liter-llm/src/client/mod.rs +864 -0
- data/vendor/liter-llm/src/cost.rs +212 -0
- data/vendor/liter-llm/src/error.rs +190 -0
- data/vendor/liter-llm/src/http/eventstream.rs +860 -0
- data/vendor/liter-llm/src/http/mod.rs +12 -0
- data/vendor/liter-llm/src/http/request.rs +438 -0
- data/vendor/liter-llm/src/http/retry.rs +72 -0
- data/vendor/liter-llm/src/http/streaming.rs +289 -0
- data/vendor/liter-llm/src/lib.rs +37 -0
- data/vendor/liter-llm/src/provider/anthropic.rs +2250 -0
- data/vendor/liter-llm/src/provider/azure.rs +579 -0
- data/vendor/liter-llm/src/provider/bedrock.rs +1543 -0
- data/vendor/liter-llm/src/provider/cohere.rs +654 -0
- data/vendor/liter-llm/src/provider/custom.rs +404 -0
- data/vendor/liter-llm/src/provider/google_ai.rs +281 -0
- data/vendor/liter-llm/src/provider/mistral.rs +188 -0
- data/vendor/liter-llm/src/provider/mod.rs +616 -0
- data/vendor/liter-llm/src/provider/vertex.rs +1504 -0
- data/vendor/liter-llm/src/tests.rs +1425 -0
- data/vendor/liter-llm/src/tokenizer.rs +281 -0
- data/vendor/liter-llm/src/tower/budget.rs +599 -0
- data/vendor/liter-llm/src/tower/cache.rs +502 -0
- data/vendor/liter-llm/src/tower/cache_opendal.rs +270 -0
- data/vendor/liter-llm/src/tower/cooldown.rs +231 -0
- data/vendor/liter-llm/src/tower/cost.rs +404 -0
- data/vendor/liter-llm/src/tower/fallback.rs +121 -0
- data/vendor/liter-llm/src/tower/health.rs +219 -0
- data/vendor/liter-llm/src/tower/hooks.rs +369 -0
- data/vendor/liter-llm/src/tower/mod.rs +77 -0
- data/vendor/liter-llm/src/tower/rate_limit.rs +300 -0
- data/vendor/liter-llm/src/tower/router.rs +436 -0
- data/vendor/liter-llm/src/tower/service.rs +181 -0
- data/vendor/liter-llm/src/tower/tests.rs +539 -0
- data/vendor/liter-llm/src/tower/tests_common.rs +252 -0
- data/vendor/liter-llm/src/tower/tracing.rs +209 -0
- data/vendor/liter-llm/src/tower/types.rs +170 -0
- data/vendor/liter-llm/src/types/audio.rs +52 -0
- data/vendor/liter-llm/src/types/batch.rs +77 -0
- data/vendor/liter-llm/src/types/chat.rs +214 -0
- data/vendor/liter-llm/src/types/common.rs +244 -0
- data/vendor/liter-llm/src/types/embedding.rs +84 -0
- data/vendor/liter-llm/src/types/files.rs +58 -0
- data/vendor/liter-llm/src/types/image.rs +40 -0
- data/vendor/liter-llm/src/types/mod.rs +27 -0
- data/vendor/liter-llm/src/types/models.rs +21 -0
- data/vendor/liter-llm/src/types/moderation.rs +80 -0
- data/vendor/liter-llm/src/types/ocr.rs +87 -0
- data/vendor/liter-llm/src/types/rerank.rs +46 -0
- data/vendor/liter-llm/src/types/responses.rs +55 -0
- data/vendor/liter-llm/src/types/search.rs +45 -0
- data/vendor/liter-llm/tests/contract.rs +332 -0
- data/vendor/liter-llm-ffi/Cargo.toml +30 -0
- data/vendor/liter-llm-ffi/build.rs +66 -0
- data/vendor/liter-llm-ffi/cbindgen.toml +60 -0
- data/vendor/liter-llm-ffi/liter_llm.h +850 -0
- data/vendor/liter-llm-ffi/src/lib.rs +2488 -0
- metadata +286 -0
|
@@ -0,0 +1,404 @@
|
|
|
1
|
+
//! Runtime registration of custom LLM providers.
|
|
2
|
+
//!
|
|
3
|
+
//! Allows users to register providers that are not part of the built-in
|
|
4
|
+
//! `providers.json` registry. Custom providers are checked **first** during
|
|
5
|
+
//! model detection, so they can override built-in routing.
|
|
6
|
+
|
|
7
|
+
use std::borrow::Cow;
|
|
8
|
+
use std::sync::RwLock;
|
|
9
|
+
|
|
10
|
+
use serde::{Deserialize, Serialize};
|
|
11
|
+
|
|
12
|
+
use super::Provider;
|
|
13
|
+
use crate::error::{LiterLlmError, Result};
|
|
14
|
+
|
|
15
|
+
// ── Global custom-provider registry ──────────────────────────────────────────
|
|
16
|
+
|
|
17
|
+
/// Thread-safe registry of runtime-registered custom providers.
|
|
18
|
+
///
|
|
19
|
+
/// Uses `RwLock` so that reads (the hot path inside `detect_provider`) only
|
|
20
|
+
/// take a shared lock, while mutations (`register` / `unregister`) take an
|
|
21
|
+
/// exclusive lock.
|
|
22
|
+
static CUSTOM_PROVIDERS: RwLock<Vec<CustomProviderConfig>> = RwLock::new(Vec::new());
|
|
23
|
+
|
|
24
|
+
/// Configuration for registering a custom LLM provider at runtime.
|
|
25
|
+
#[derive(Debug, Clone, Serialize, Deserialize)]
|
|
26
|
+
pub struct CustomProviderConfig {
|
|
27
|
+
/// Unique name for this provider (e.g., "my-provider").
|
|
28
|
+
pub name: String,
|
|
29
|
+
/// Base URL for the provider's API (e.g., "https://api.my-provider.com/v1").
|
|
30
|
+
pub base_url: String,
|
|
31
|
+
/// Authentication header format.
|
|
32
|
+
pub auth_header: AuthHeaderFormat,
|
|
33
|
+
/// Model name prefixes that route to this provider (e.g., ["my-"]).
|
|
34
|
+
pub model_prefixes: Vec<String>,
|
|
35
|
+
}
|
|
36
|
+
|
|
37
|
+
/// How the API key is sent in the HTTP request.
|
|
38
|
+
#[derive(Debug, Clone, Serialize, Deserialize)]
|
|
39
|
+
pub enum AuthHeaderFormat {
|
|
40
|
+
/// Bearer token: `Authorization: Bearer <key>`
|
|
41
|
+
Bearer,
|
|
42
|
+
/// Custom header: e.g., `X-Api-Key: <key>`
|
|
43
|
+
ApiKey(String),
|
|
44
|
+
/// No authentication required.
|
|
45
|
+
None,
|
|
46
|
+
}
|
|
47
|
+
|
|
48
|
+
// ── Public API ───────────────────────────────────────────────────────────────
|
|
49
|
+
|
|
50
|
+
/// Register a custom provider in the global runtime registry.
|
|
51
|
+
///
|
|
52
|
+
/// The provider will be checked **before** all built-in providers during model
|
|
53
|
+
/// detection. If a provider with the same `name` already exists it is replaced.
|
|
54
|
+
///
|
|
55
|
+
/// # Errors
|
|
56
|
+
///
|
|
57
|
+
/// Returns an error if the config is invalid (empty name, empty base_url, or
|
|
58
|
+
/// no model prefixes).
|
|
59
|
+
pub fn register_custom_provider(config: CustomProviderConfig) -> Result<()> {
|
|
60
|
+
validate_config(&config)?;
|
|
61
|
+
|
|
62
|
+
let mut providers = CUSTOM_PROVIDERS.write().map_err(|e| LiterLlmError::ServerError {
|
|
63
|
+
message: format!("custom provider registry lock poisoned: {e}"),
|
|
64
|
+
})?;
|
|
65
|
+
|
|
66
|
+
// Replace existing entry with the same name, or append.
|
|
67
|
+
if let Some(existing) = providers.iter_mut().find(|p| p.name == config.name) {
|
|
68
|
+
*existing = config;
|
|
69
|
+
} else {
|
|
70
|
+
providers.push(config);
|
|
71
|
+
}
|
|
72
|
+
|
|
73
|
+
Ok(())
|
|
74
|
+
}
|
|
75
|
+
|
|
76
|
+
/// Remove a previously registered custom provider by name.
|
|
77
|
+
///
|
|
78
|
+
/// Returns `true` if a provider with the given name was found and removed,
|
|
79
|
+
/// `false` if no such provider existed.
|
|
80
|
+
///
|
|
81
|
+
/// # Errors
|
|
82
|
+
///
|
|
83
|
+
/// Returns an error only if the internal lock is poisoned.
|
|
84
|
+
pub fn unregister_custom_provider(name: &str) -> Result<bool> {
|
|
85
|
+
let mut providers = CUSTOM_PROVIDERS.write().map_err(|e| LiterLlmError::ServerError {
|
|
86
|
+
message: format!("custom provider registry lock poisoned: {e}"),
|
|
87
|
+
})?;
|
|
88
|
+
|
|
89
|
+
let before = providers.len();
|
|
90
|
+
providers.retain(|p| p.name != name);
|
|
91
|
+
Ok(providers.len() < before)
|
|
92
|
+
}
|
|
93
|
+
|
|
94
|
+
/// Try to match a model name against the custom-provider registry.
|
|
95
|
+
///
|
|
96
|
+
/// Returns a boxed [`Provider`] if a custom provider claims the model,
|
|
97
|
+
/// `None` otherwise. This is called at the **top** of `detect_provider`
|
|
98
|
+
/// so custom providers always take priority over built-in ones.
|
|
99
|
+
pub(crate) fn detect_custom_provider(model: &str) -> Option<Box<dyn Provider>> {
|
|
100
|
+
let providers = CUSTOM_PROVIDERS.read().ok()?;
|
|
101
|
+
|
|
102
|
+
for cfg in providers.iter() {
|
|
103
|
+
let matches = cfg
|
|
104
|
+
.model_prefixes
|
|
105
|
+
.iter()
|
|
106
|
+
.any(|prefix| model.starts_with(prefix.as_str()));
|
|
107
|
+
|
|
108
|
+
if matches {
|
|
109
|
+
return Some(Box::new(CustomProvider { config: cfg.clone() }));
|
|
110
|
+
}
|
|
111
|
+
}
|
|
112
|
+
|
|
113
|
+
None
|
|
114
|
+
}
|
|
115
|
+
|
|
116
|
+
/// Empty the custom-provider registry. Exists purely for test isolation.
#[cfg(test)]
pub(crate) fn clear_custom_providers() {
    match CUSTOM_PROVIDERS.write() {
        Ok(mut registry) => registry.clear(),
        Err(_) => {
            // Poisoned lock: deliberately ignored, the registry is left untouched.
        }
    }
}
|
|
123
|
+
|
|
124
|
+
// ── Validation ───────────────────────────────────────────────────────────────
|
|
125
|
+
|
|
126
|
+
fn validate_config(config: &CustomProviderConfig) -> Result<()> {
|
|
127
|
+
if config.name.trim().is_empty() {
|
|
128
|
+
return Err(LiterLlmError::BadRequest {
|
|
129
|
+
message: "custom provider name must not be empty or whitespace-only".into(),
|
|
130
|
+
});
|
|
131
|
+
}
|
|
132
|
+
if config.base_url.trim().is_empty() {
|
|
133
|
+
return Err(LiterLlmError::BadRequest {
|
|
134
|
+
message: "custom provider base_url must not be empty or whitespace-only".into(),
|
|
135
|
+
});
|
|
136
|
+
}
|
|
137
|
+
if config.model_prefixes.is_empty() {
|
|
138
|
+
return Err(LiterLlmError::BadRequest {
|
|
139
|
+
message: "custom provider must have at least one model prefix".into(),
|
|
140
|
+
});
|
|
141
|
+
}
|
|
142
|
+
for prefix in &config.model_prefixes {
|
|
143
|
+
if prefix.is_empty() {
|
|
144
|
+
return Err(LiterLlmError::BadRequest {
|
|
145
|
+
message: "custom provider model prefix must not be empty (would match all models)".into(),
|
|
146
|
+
});
|
|
147
|
+
}
|
|
148
|
+
}
|
|
149
|
+
Ok(())
|
|
150
|
+
}
|
|
151
|
+
|
|
152
|
+
// ── Provider implementation ──────────────────────────────────────────────────
|
|
153
|
+
|
|
154
|
+
/// A runtime-registered custom provider.
|
|
155
|
+
///
|
|
156
|
+
/// Wraps a [`CustomProviderConfig`] and implements the [`Provider`] trait so
|
|
157
|
+
/// the client can use it exactly like a built-in provider.
|
|
158
|
+
struct CustomProvider {
|
|
159
|
+
config: CustomProviderConfig,
|
|
160
|
+
}
|
|
161
|
+
|
|
162
|
+
impl Provider for CustomProvider {
|
|
163
|
+
fn name(&self) -> &str {
|
|
164
|
+
&self.config.name
|
|
165
|
+
}
|
|
166
|
+
|
|
167
|
+
fn base_url(&self) -> &str {
|
|
168
|
+
&self.config.base_url
|
|
169
|
+
}
|
|
170
|
+
|
|
171
|
+
fn auth_header<'a>(&'a self, api_key: &'a str) -> Option<(Cow<'static, str>, Cow<'a, str>)> {
|
|
172
|
+
match &self.config.auth_header {
|
|
173
|
+
AuthHeaderFormat::Bearer => Some((Cow::Borrowed("Authorization"), Cow::Owned(format!("Bearer {api_key}")))),
|
|
174
|
+
AuthHeaderFormat::ApiKey(header_name) => Some((Cow::Owned(header_name.clone()), Cow::Borrowed(api_key))),
|
|
175
|
+
AuthHeaderFormat::None => None,
|
|
176
|
+
}
|
|
177
|
+
}
|
|
178
|
+
|
|
179
|
+
fn matches_model(&self, model: &str) -> bool {
|
|
180
|
+
self.config
|
|
181
|
+
.model_prefixes
|
|
182
|
+
.iter()
|
|
183
|
+
.any(|prefix| model.starts_with(prefix.as_str()))
|
|
184
|
+
}
|
|
185
|
+
}
|
|
186
|
+
|
|
187
|
+
// ── Tests ────────────────────────────────────────────────────────────────────
|
|
188
|
+
|
|
189
|
+
#[cfg(test)]
mod tests {
    use super::*;

    /// Serializes the tests, because they all mutate the one global registry.
    static TEST_LOCK: std::sync::Mutex<()> = std::sync::Mutex::new(());

    /// Take the test lock (recovering it if an earlier test panicked while
    /// holding it) and empty the registry. Keep the guard alive for the whole test.
    fn setup() -> std::sync::MutexGuard<'static, ()> {
        let guard = match TEST_LOCK.lock() {
            Ok(guard) => guard,
            Err(poisoned) => poisoned.into_inner(),
        };
        clear_custom_providers();
        guard
    }

    /// Assemble a config from borrowed parts.
    fn make_config(name: &str, base_url: &str, auth_header: AuthHeaderFormat, prefixes: &[&str]) -> CustomProviderConfig {
        CustomProviderConfig {
            name: name.to_owned(),
            base_url: base_url.to_owned(),
            auth_header,
            model_prefixes: prefixes.iter().map(|prefix| (*prefix).to_owned()).collect(),
        }
    }

    #[test]
    fn register_and_detect_by_model_prefix() {
        let _guard = setup();

        register_custom_provider(make_config(
            "my-provider",
            "https://api.my-provider.com/v1",
            AuthHeaderFormat::Bearer,
            &["my-", "my-provider/"],
        ))
        .expect("registration should succeed");

        let by_prefix = detect_custom_provider("my-model-7b");
        assert!(by_prefix.is_some(), "should detect custom provider by prefix 'my-'");
        let by_prefix = by_prefix.unwrap();
        assert_eq!(by_prefix.name(), "my-provider");
        assert_eq!(by_prefix.base_url(), "https://api.my-provider.com/v1");

        // The slash-style prefix routes to the same provider.
        assert!(
            detect_custom_provider("my-provider/llama-70b").is_some(),
            "should detect custom provider by slash prefix"
        );

        // A model with an unrelated name is not claimed.
        assert!(
            detect_custom_provider("gpt-4").is_none(),
            "should not match unrelated model"
        );
    }

    #[test]
    fn unregister_removes_provider() {
        let _guard = setup();

        register_custom_provider(make_config(
            "ephemeral",
            "https://api.ephemeral.com/v1",
            AuthHeaderFormat::Bearer,
            &["eph-"],
        ))
        .expect("registration should succeed");
        assert!(detect_custom_provider("eph-model").is_some());

        let first_removal = unregister_custom_provider("ephemeral").expect("unregister should succeed");
        assert!(first_removal, "should return true when provider was found");

        assert!(
            detect_custom_provider("eph-model").is_none(),
            "should no longer detect after unregister"
        );

        // A second removal finds nothing.
        let second_removal = unregister_custom_provider("ephemeral").expect("unregister should succeed");
        assert!(!second_removal, "should return false when provider not found");
    }

    #[test]
    fn custom_provider_with_api_key_auth() {
        let _guard = setup();

        register_custom_provider(make_config(
            "secure-provider",
            "https://api.secure.com/v1",
            AuthHeaderFormat::ApiKey("X-Custom-Auth".into()),
            &["secure/"],
        ))
        .expect("registration should succeed");

        let provider = detect_custom_provider("secure/model-1").expect("should detect provider");
        let (header_name, header_value) = provider
            .auth_header("my-secret-key")
            .expect("should return auth header");
        assert_eq!(header_name.as_ref(), "X-Custom-Auth");
        assert_eq!(header_value.as_ref(), "my-secret-key");
    }

    #[test]
    fn custom_provider_with_no_auth() {
        let _guard = setup();

        register_custom_provider(make_config(
            "local-provider",
            "http://localhost:8080/v1",
            AuthHeaderFormat::None,
            &["local/"],
        ))
        .expect("registration should succeed");

        let provider = detect_custom_provider("local/model").expect("should detect provider");
        assert!(
            provider.auth_header("unused").is_none(),
            "no-auth provider should return None"
        );
    }

    #[test]
    fn custom_provider_bearer_auth() {
        let _guard = setup();

        register_custom_provider(make_config(
            "bearer-provider",
            "https://api.bearer.com/v1",
            AuthHeaderFormat::Bearer,
            &["bearer/"],
        ))
        .expect("registration should succeed");

        let provider = detect_custom_provider("bearer/model").expect("should detect provider");
        let (header_name, header_value) = provider.auth_header("my-token").expect("should return auth header");
        assert_eq!(header_name.as_ref(), "Authorization");
        assert_eq!(header_value.as_ref(), "Bearer my-token");
    }

    #[test]
    fn register_replaces_existing_provider() {
        let _guard = setup();

        let original = make_config(
            "updatable",
            "https://old.example.com/v1",
            AuthHeaderFormat::Bearer,
            &["upd/"],
        );
        register_custom_provider(original).expect("first registration should succeed");

        let replacement = make_config(
            "updatable",
            "https://new.example.com/v1",
            AuthHeaderFormat::Bearer,
            &["upd/"],
        );
        register_custom_provider(replacement).expect("second registration should succeed");

        let provider = detect_custom_provider("upd/model").expect("should detect provider");
        assert_eq!(
            provider.base_url(),
            "https://new.example.com/v1",
            "should use the updated config"
        );
    }

    #[test]
    fn validation_rejects_empty_name() {
        let _guard = setup();

        let outcome = register_custom_provider(make_config(
            "",
            "https://example.com",
            AuthHeaderFormat::Bearer,
            &["x/"],
        ));
        assert!(outcome.is_err(), "should reject empty name");
    }

    #[test]
    fn validation_rejects_empty_base_url() {
        let _guard = setup();

        let outcome = register_custom_provider(make_config("valid-name", "", AuthHeaderFormat::Bearer, &["x/"]));
        assert!(outcome.is_err(), "should reject empty base_url");
    }

    #[test]
    fn validation_rejects_no_prefixes() {
        let _guard = setup();

        let outcome = register_custom_provider(make_config(
            "valid-name",
            "https://example.com",
            AuthHeaderFormat::Bearer,
            &[],
        ));
        assert!(outcome.is_err(), "should reject empty model_prefixes");
    }

    #[test]
    fn config_serde_round_trip() {
        let original = make_config(
            "serde-test",
            "https://example.com/v1",
            AuthHeaderFormat::ApiKey("X-Api-Key".into()),
            &["serde/"],
        );

        let json = serde_json::to_string(&original).expect("should serialize");
        let parsed: CustomProviderConfig = serde_json::from_str(&json).expect("should deserialize");

        assert_eq!(parsed.name, "serde-test");
        assert_eq!(parsed.base_url, "https://example.com/v1");
        assert_eq!(parsed.model_prefixes, vec!["serde/"]);
    }
}
|
|
@@ -0,0 +1,281 @@
|
|
|
1
|
+
use std::borrow::Cow;
|
|
2
|
+
|
|
3
|
+
use crate::error::Result;
|
|
4
|
+
use crate::provider::Provider;
|
|
5
|
+
use crate::types::ChatCompletionChunk;
|
|
6
|
+
|
|
7
|
+
use super::vertex::{parse_gemini_stream_event, transform_gemini_request, transform_gemini_response};
|
|
8
|
+
|
|
9
|
+
/// Root endpoint of the Gemini API as exposed by Google AI Studio (API-key access).
const BASE_URL: &str = "https://generativelanguage.googleapis.com/v1beta";
|
|
11
|
+
|
|
12
|
+
/// Provider for Google AI Studio (the Gemini API accessed with an API key).
///
/// Speaks the Gemini `generateContent` format and:
/// - targets `https://generativelanguage.googleapis.com/v1beta`,
/// - authenticates with the `x-goog-api-key` header (not OAuth2),
/// - claims models named with a `gemini/` or `google_ai/` prefix.
///
/// Request, response and stream-event translation is delegated to the Gemini
/// transform functions of the Vertex AI provider module (`super::vertex`).
///
/// # Configuration
///
/// ```rust,ignore
/// let config = ClientConfigBuilder::new("AIza...your-api-key").build();
/// let client = DefaultClient::new(config, Some("gemini/gemini-2.0-flash"))?;
///
/// // Or using the google_ai/ prefix:
/// let client = DefaultClient::new(config, Some("google_ai/gemini-2.0-flash"))?;
/// ```
pub struct GoogleAiProvider;
|
|
32
|
+
|
|
33
|
+
impl Provider for GoogleAiProvider {
|
|
34
|
+
fn name(&self) -> &str {
|
|
35
|
+
"google_ai"
|
|
36
|
+
}
|
|
37
|
+
|
|
38
|
+
fn base_url(&self) -> &str {
|
|
39
|
+
BASE_URL
|
|
40
|
+
}
|
|
41
|
+
|
|
42
|
+
/// Google AI Studio uses `x-goog-api-key` header for authentication.
|
|
43
|
+
fn auth_header<'a>(&'a self, api_key: &'a str) -> Option<(Cow<'static, str>, Cow<'a, str>)> {
|
|
44
|
+
Some((Cow::Borrowed("x-goog-api-key"), Cow::Borrowed(api_key)))
|
|
45
|
+
}
|
|
46
|
+
|
|
47
|
+
fn matches_model(&self, model: &str) -> bool {
|
|
48
|
+
model.starts_with("gemini/") || model.starts_with("google_ai/")
|
|
49
|
+
}
|
|
50
|
+
|
|
51
|
+
fn strip_model_prefix<'m>(&self, model: &'m str) -> &'m str {
|
|
52
|
+
model
|
|
53
|
+
.strip_prefix("gemini/")
|
|
54
|
+
.or_else(|| model.strip_prefix("google_ai/"))
|
|
55
|
+
.unwrap_or(model)
|
|
56
|
+
}
|
|
57
|
+
|
|
58
|
+
/// Build the full URL for a Google AI Studio request.
|
|
59
|
+
///
|
|
60
|
+
/// Chat completions → `{base}/models/{model}:generateContent`
|
|
61
|
+
/// Embeddings → `{base}/models/{model}:embedContent`
|
|
62
|
+
/// Other paths → `{base}{endpoint_path}`
|
|
63
|
+
fn build_url(&self, endpoint_path: &str, model: &str) -> String {
|
|
64
|
+
let base = self.base_url().trim_end_matches('/');
|
|
65
|
+
if endpoint_path.contains("chat/completions") {
|
|
66
|
+
format!("{base}/models/{model}:generateContent")
|
|
67
|
+
} else if endpoint_path.contains("embeddings") {
|
|
68
|
+
format!("{base}/models/{model}:embedContent")
|
|
69
|
+
} else {
|
|
70
|
+
format!("{base}{endpoint_path}")
|
|
71
|
+
}
|
|
72
|
+
}
|
|
73
|
+
|
|
74
|
+
fn transform_request(&self, body: &mut serde_json::Value) -> Result<()> {
|
|
75
|
+
transform_gemini_request(body)
|
|
76
|
+
}
|
|
77
|
+
|
|
78
|
+
fn transform_response(&self, body: &mut serde_json::Value) -> Result<()> {
|
|
79
|
+
transform_gemini_response(body)
|
|
80
|
+
}
|
|
81
|
+
|
|
82
|
+
/// Build the streaming URL: appends `?alt=sse` to enable SSE streaming.
|
|
83
|
+
fn build_stream_url(&self, endpoint_path: &str, model: &str) -> String {
|
|
84
|
+
let url = self.build_url(endpoint_path, model);
|
|
85
|
+
format!("{url}?alt=sse")
|
|
86
|
+
}
|
|
87
|
+
|
|
88
|
+
fn parse_stream_event(&self, event_data: &str) -> Result<Option<ChatCompletionChunk>> {
|
|
89
|
+
parse_gemini_stream_event(event_data)
|
|
90
|
+
}
|
|
91
|
+
}
|
|
92
|
+
|
|
93
|
+
// ── Unit tests ────────────────────────────────────────────────────────────────
|
|
94
|
+
|
|
95
|
+
#[cfg(test)]
mod tests {
    use serde_json::json;

    use super::*;
    use crate::provider::Provider;

    // ── base_url ──────────────────────────────────────────────────────────────

    #[test]
    fn base_url_is_generative_language_api() {
        assert_eq!(
            GoogleAiProvider.base_url(),
            "https://generativelanguage.googleapis.com/v1beta"
        );
    }

    // ── auth_header ──────────────────────────────────────────────────────────

    #[test]
    fn auth_header_uses_x_goog_api_key() {
        let google = GoogleAiProvider;
        let (header, key) = google.auth_header("test-key").unwrap();
        assert_eq!(header.as_ref(), "x-goog-api-key");
        assert_eq!(key.as_ref(), "test-key");
    }

    // ── model matching ───────────────────────────────────────────────────────

    #[test]
    fn matches_gemini_prefix() {
        let google = GoogleAiProvider;
        assert!(google.matches_model("gemini/gemini-2.0-flash"));
        assert!(google.matches_model("google_ai/gemini-2.0-flash"));
        assert!(!google.matches_model("vertex_ai/gemini-2.0-flash"));
        assert!(!google.matches_model("gpt-4"));
    }

    #[test]
    fn strip_model_prefix_gemini() {
        let google = GoogleAiProvider;
        assert_eq!(google.strip_model_prefix("gemini/gemini-2.0-flash"), "gemini-2.0-flash");
        assert_eq!(google.strip_model_prefix("google_ai/gemini-pro"), "gemini-pro");
        assert_eq!(google.strip_model_prefix("gemini-2.0-flash"), "gemini-2.0-flash");
    }

    // ── build_url ─────────────────────────────────────────────────────────────

    #[test]
    fn build_url_chat_completions() {
        let chat_url = GoogleAiProvider.build_url("/chat/completions", "gemini-2.0-flash");
        assert_eq!(
            chat_url,
            "https://generativelanguage.googleapis.com/v1beta/models/gemini-2.0-flash:generateContent"
        );
    }

    #[test]
    fn build_url_embeddings() {
        let embed_url = GoogleAiProvider.build_url("/embeddings", "text-embedding-004");
        assert_eq!(
            embed_url,
            "https://generativelanguage.googleapis.com/v1beta/models/text-embedding-004:embedContent"
        );
    }

    #[test]
    fn build_stream_url_appends_alt_sse() {
        let stream_url = GoogleAiProvider.build_stream_url("/chat/completions", "gemini-2.0-flash");
        assert!(stream_url.ends_with("?alt=sse"));
        assert!(stream_url.contains(":generateContent"));
    }

    // ── transform_request (delegates to shared Gemini logic) ─────────────────

    #[test]
    fn transform_request_basic_chat() {
        let mut request = json!({
            "messages": [
                {"role": "system", "content": "You are helpful."},
                {"role": "user", "content": "Hello!"}
            ],
            "max_tokens": 100
        });

        GoogleAiProvider.transform_request(&mut request).unwrap();

        assert_eq!(request["systemInstruction"]["parts"][0]["text"], "You are helpful.");
        assert_eq!(request["contents"][0]["role"], "user");
        assert_eq!(request["contents"][0]["parts"][0]["text"], "Hello!");
        assert_eq!(request["generationConfig"]["maxOutputTokens"], 100);
    }

    #[test]
    fn transform_request_safety_settings() {
        let mut request = json!({
            "messages": [{"role": "user", "content": "hi"}],
            "extra_body": {
                "safety_settings": [
                    {"category": "HARM_CATEGORY_HATE_SPEECH", "threshold": "BLOCK_MEDIUM_AND_ABOVE"}
                ]
            }
        });

        GoogleAiProvider.transform_request(&mut request).unwrap();

        let safety = request["safetySettings"].as_array().unwrap();
        assert_eq!(safety.len(), 1);
        assert_eq!(safety[0]["category"], "HARM_CATEGORY_HATE_SPEECH");
    }

    #[test]
    fn transform_request_cached_content() {
        let mut request = json!({
            "messages": [{"role": "user", "content": "hi"}],
            "extra_body": {
                "cached_content": "cachedContents/abc123"
            }
        });

        GoogleAiProvider.transform_request(&mut request).unwrap();

        assert_eq!(request["cachedContent"], "cachedContents/abc123");
    }

    // ── transform_response (delegates to shared Gemini logic) ────────────────

    #[test]
    fn transform_response_basic() {
        let mut response = json!({
            "candidates": [{
                "content": {
                    "role": "model",
                    "parts": [{"text": "Hello from Google AI!"}]
                },
                "finishReason": "STOP"
            }],
            "usageMetadata": {
                "promptTokenCount": 5,
                "candidatesTokenCount": 4
            }
        });

        GoogleAiProvider.transform_response(&mut response).unwrap();

        assert_eq!(response["object"], "chat.completion");
        assert_eq!(response["choices"][0]["message"]["content"], "Hello from Google AI!");
        assert_eq!(response["choices"][0]["finish_reason"], "stop");
        assert_eq!(response["usage"]["prompt_tokens"], 5);
        assert_eq!(response["usage"]["completion_tokens"], 4);
    }

    // ── parse_stream_event (delegates to shared Gemini logic) ────────────────

    #[test]
    fn parse_stream_event_empty_returns_none() {
        let parsed = GoogleAiProvider.parse_stream_event("").unwrap();
        assert!(parsed.is_none());
    }

    #[test]
    fn parse_stream_event_basic_chunk() {
        let payload = r#"{
            "candidates": [{
                "content": {"role": "model", "parts": [{"text": "Hi"}]},
                "finishReason": "STOP"
            }],
            "usageMetadata": {"promptTokenCount": 3, "candidatesTokenCount": 1}
        }"#;

        let chunk = GoogleAiProvider.parse_stream_event(payload).unwrap().unwrap();

        assert_eq!(chunk.object, "chat.completion.chunk");
        assert_eq!(chunk.choices[0].delta.content.as_deref(), Some("Hi"));
    }
}
|