RubyGems - liter_llm - Versions diffs - 1.0.0.pre.rc.6 - Mend

liter_llm 1.0.0.pre.rc.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (78) hide show

checksums.yaml +7 -0
data/README.md +239 -0
data/ext/liter_llm_rb/extconf.rb +65 -0
data/ext/liter_llm_rb/native/.cargo/config.toml +23 -0
data/ext/liter_llm_rb/native/Cargo.lock +3713 -0
data/ext/liter_llm_rb/native/Cargo.toml +32 -0
data/ext/liter_llm_rb/native/build.rs +15 -0
data/ext/liter_llm_rb/native/src/lib.rs +1079 -0
data/lib/liter_llm.rb +8 -0
data/sig/liter_llm.rbs +416 -0
data/vendor/Cargo.toml +54 -0
data/vendor/liter-llm/Cargo.toml +92 -0
data/vendor/liter-llm/README.md +252 -0
data/vendor/liter-llm/schemas/pricing.json +40 -0
data/vendor/liter-llm/schemas/providers.json +1662 -0
data/vendor/liter-llm/src/auth/azure_ad.rs +264 -0
data/vendor/liter-llm/src/auth/bedrock_sts.rs +353 -0
data/vendor/liter-llm/src/auth/mod.rs +68 -0
data/vendor/liter-llm/src/auth/vertex_oauth.rs +353 -0
data/vendor/liter-llm/src/client/config.rs +351 -0
data/vendor/liter-llm/src/client/managed.rs +622 -0
data/vendor/liter-llm/src/client/mod.rs +864 -0
data/vendor/liter-llm/src/cost.rs +212 -0
data/vendor/liter-llm/src/error.rs +190 -0
data/vendor/liter-llm/src/http/eventstream.rs +860 -0
data/vendor/liter-llm/src/http/mod.rs +12 -0
data/vendor/liter-llm/src/http/request.rs +438 -0
data/vendor/liter-llm/src/http/retry.rs +72 -0
data/vendor/liter-llm/src/http/streaming.rs +289 -0
data/vendor/liter-llm/src/lib.rs +37 -0
data/vendor/liter-llm/src/provider/anthropic.rs +2250 -0
data/vendor/liter-llm/src/provider/azure.rs +579 -0
data/vendor/liter-llm/src/provider/bedrock.rs +1543 -0
data/vendor/liter-llm/src/provider/cohere.rs +654 -0
data/vendor/liter-llm/src/provider/custom.rs +404 -0
data/vendor/liter-llm/src/provider/google_ai.rs +281 -0
data/vendor/liter-llm/src/provider/mistral.rs +188 -0
data/vendor/liter-llm/src/provider/mod.rs +616 -0
data/vendor/liter-llm/src/provider/vertex.rs +1504 -0
data/vendor/liter-llm/src/tests.rs +1425 -0
data/vendor/liter-llm/src/tokenizer.rs +281 -0
data/vendor/liter-llm/src/tower/budget.rs +599 -0
data/vendor/liter-llm/src/tower/cache.rs +502 -0
data/vendor/liter-llm/src/tower/cache_opendal.rs +270 -0
data/vendor/liter-llm/src/tower/cooldown.rs +231 -0
data/vendor/liter-llm/src/tower/cost.rs +404 -0
data/vendor/liter-llm/src/tower/fallback.rs +121 -0
data/vendor/liter-llm/src/tower/health.rs +219 -0
data/vendor/liter-llm/src/tower/hooks.rs +369 -0
data/vendor/liter-llm/src/tower/mod.rs +77 -0
data/vendor/liter-llm/src/tower/rate_limit.rs +300 -0
data/vendor/liter-llm/src/tower/router.rs +436 -0
data/vendor/liter-llm/src/tower/service.rs +181 -0
data/vendor/liter-llm/src/tower/tests.rs +539 -0
data/vendor/liter-llm/src/tower/tests_common.rs +252 -0
data/vendor/liter-llm/src/tower/tracing.rs +209 -0
data/vendor/liter-llm/src/tower/types.rs +170 -0
data/vendor/liter-llm/src/types/audio.rs +52 -0
data/vendor/liter-llm/src/types/batch.rs +77 -0
data/vendor/liter-llm/src/types/chat.rs +214 -0
data/vendor/liter-llm/src/types/common.rs +244 -0
data/vendor/liter-llm/src/types/embedding.rs +84 -0
data/vendor/liter-llm/src/types/files.rs +58 -0
data/vendor/liter-llm/src/types/image.rs +40 -0
data/vendor/liter-llm/src/types/mod.rs +27 -0
data/vendor/liter-llm/src/types/models.rs +21 -0
data/vendor/liter-llm/src/types/moderation.rs +80 -0
data/vendor/liter-llm/src/types/ocr.rs +87 -0
data/vendor/liter-llm/src/types/rerank.rs +46 -0
data/vendor/liter-llm/src/types/responses.rs +55 -0
data/vendor/liter-llm/src/types/search.rs +45 -0
data/vendor/liter-llm/tests/contract.rs +332 -0
data/vendor/liter-llm-ffi/Cargo.toml +30 -0
data/vendor/liter-llm-ffi/build.rs +66 -0
data/vendor/liter-llm-ffi/cbindgen.toml +60 -0
data/vendor/liter-llm-ffi/liter_llm.h +850 -0
data/vendor/liter-llm-ffi/src/lib.rs +2488 -0
metadata +286 -0

data/vendor/liter-llm/src/client/config.rs ADDED Viewed

@@ -0,0 +1,351 @@
+use std::sync::Arc;
+use std::time::Duration;
+use secrecy::SecretString;
+use crate::auth::CredentialProvider;
+#[cfg(feature = "native-http")]
+use crate::error::{LiterLlmError, Result};
+#[cfg(feature = "tower")]
+use crate::tower::{BudgetConfig, CacheConfig, CacheStore, LlmHook, RateLimitConfig};
+/// Configuration for an LLM client.
+///
+/// `api_key` is stored as a [`SecretString`] so it is zeroed on drop; read it via
+/// [`secrecy::ExposeSecret`].  `Debug` output redacts the key and all header values.
+#[derive(Clone)]
+pub struct ClientConfig {
+    /// API key for authentication (stored as a secret).
+    pub api_key: SecretString,
+    /// Override base URL.  When set, all requests go here regardless of model
+    /// name, and provider auto-detection is skipped.
+    pub base_url: Option<String>,
+    /// Request timeout ([`ClientConfig::new`] defaults this to 60 seconds).
+    pub timeout: Duration,
+    /// Maximum number of retries on 429 / 5xx responses ([`ClientConfig::new`] defaults this to 3).
+    pub max_retries: u32,
+    /// Extra headers sent on every request, in the order they were added.
+    ///
+    /// Stored as `Vec<(String, String)>` rather than `HashMap` to preserve
+    /// insertion order and avoid non-deterministic iteration when building the
+    /// reqwest `HeaderMap`.  Read via [`ClientConfig::headers`]; the field is
+    /// `pub(crate)`, so code outside this crate cannot mutate it directly.
+    pub(crate) extra_headers: Vec<(String, String)>,
+    /// Optional dynamic credential provider for token-based auth
+    /// (Azure AD, Vertex OAuth2) or refreshable credentials (AWS STS).
+    ///
+    /// When set, the client calls `resolve()` before each request to obtain
+    /// a fresh credential.  When `None`, the static `api_key` is used.
+    pub credential_provider: Option<Arc<dyn CredentialProvider>>,
+    /// Configuration for the response cache Tower middleware layer.
+    ///
+    /// When set, bindings and advanced Rust users can use this to construct
+    /// a [`CacheLayer`](crate::tower::CacheLayer) in their Tower stack.
+    #[cfg(feature = "tower")]
+    pub cache_config: Option<CacheConfig>,
+    /// Custom cache store backend for the cache Tower middleware layer.
+    ///
+    /// When set alongside `cache_config`, the cache layer will use this
+    /// store instead of the default in-memory LRU.
+    #[cfg(feature = "tower")]
+    pub cache_store: Option<Arc<dyn CacheStore>>,
+    /// Configuration for the budget enforcement Tower middleware layer.
+    ///
+    /// When set, bindings and advanced Rust users can use this to construct
+    /// a [`BudgetLayer`](crate::tower::BudgetLayer) in their Tower stack.
+    #[cfg(feature = "tower")]
+    pub budget_config: Option<BudgetConfig>,
+    /// User-defined hooks for the hooks Tower middleware layer.
+    ///
+    /// These hooks are invoked at request lifecycle points (pre-request,
+    /// post-response, on-error) when a
+    /// [`HooksLayer`](crate::tower::HooksLayer) is constructed from this
+    /// config.
+    #[cfg(feature = "tower")]
+    pub hooks: Vec<Arc<dyn LlmHook>>,
+    /// Cooldown duration after transient errors (rate limit, timeout, server error).
+    /// When set, the client rejects requests with `ServiceUnavailable` during cooldown.
+    #[cfg(feature = "tower")]
+    pub cooldown_duration: Option<Duration>,
+    /// Per-model rate limiting configuration (RPM/TPM).
+    #[cfg(feature = "tower")]
+    pub rate_limit_config: Option<RateLimitConfig>,
+    /// Background health check interval. When set, periodically probes the provider
+    /// and rejects requests when the provider is unhealthy.
+    #[cfg(feature = "tower")]
+    pub health_check_interval: Option<Duration>,
+    /// Enable per-request cost tracking. Costs are accumulated atomically and
+    /// logged via `tracing::info`. NOTE(review): builder docs cite span field `gen_ai.usage.cost` instead — confirm.
+    #[cfg(feature = "tower")]
+    pub enable_cost_tracking: bool,
+    /// Enable OpenTelemetry-compatible tracing spans for every request.
+    #[cfg(feature = "tower")]
+    pub enable_tracing: bool,
+}
+impl ClientConfig {
+    /// Build a configuration from an API key, leaving everything else at its
+    /// default: no base-URL override, a 60-second timeout, 3 retries, no extra
+    /// headers and no credential provider.  With the `tower` feature enabled,
+    /// every middleware setting starts unset, empty, or switched off.
+    pub fn new(api_key: impl Into<String>) -> Self {
+        // Wrap the key immediately so the plain `String` does not outlive this call.
+        let secret_key = SecretString::from(api_key.into());
+        let default_timeout = Duration::from_secs(60);
+        Self {
+            api_key: secret_key,
+            base_url: None,
+            timeout: default_timeout,
+            max_retries: 3,
+            extra_headers: Vec::new(),
+            credential_provider: None,
+            #[cfg(feature = "tower")]
+            cache_config: None,
+            #[cfg(feature = "tower")]
+            cache_store: None,
+            #[cfg(feature = "tower")]
+            budget_config: None,
+            #[cfg(feature = "tower")]
+            hooks: Vec::new(),
+            #[cfg(feature = "tower")]
+            cooldown_duration: None,
+            #[cfg(feature = "tower")]
+            rate_limit_config: None,
+            #[cfg(feature = "tower")]
+            health_check_interval: None,
+            #[cfg(feature = "tower")]
+            enable_cost_tracking: false,
+            #[cfg(feature = "tower")]
+            enable_tracing: false,
+        }
+    }
+    /// Borrow the extra headers as `(name, value)` pairs, in the order stored.
+    pub fn headers(&self) -> &[(String, String)] {
+        self.extra_headers.as_slice()
+    }
+}
+/// Hand-written `Debug` implementation that keeps secrets out of `{:?}` output.
+///
+/// `Debug` is implemented manually rather than derived: `api_key` and every
+/// extra-header value are printed as `[redacted]`, the credential provider and
+/// (with the `tower` feature) the cache store appear only as `[configured]`
+/// when present, and hooks are summarised by their count (`hooks_count`).
+/// All remaining fields are printed with their own `Debug` output.
+impl std::fmt::Debug for ClientConfig {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        // Redact all header values — they may contain API keys or secrets.
+        // Header names are kept so the output still shows which headers are set.
+        let redacted_headers: Vec<(&str, &str)> = self
+            .extra_headers
+            .iter()
+            .map(|(k, _v)| (k.as_str(), "[redacted]"))
+            .collect();
+        let mut dbg = f.debug_struct("ClientConfig");
+        dbg.field("api_key", &"[redacted]")
+            .field("base_url", &self.base_url)
+            .field("timeout", &self.timeout)
+            .field("max_retries", &self.max_retries)
+            .field("extra_headers", &redacted_headers)
+            .field(
+                "credential_provider",
+                // Trait object: report only whether one is configured.
+                &self.credential_provider.as_ref().map(|_| "[configured]"),
+            );
+        // Middleware fields exist only when the `tower` feature is compiled in.
+        #[cfg(feature = "tower")]
+        {
+            dbg.field("cache_config", &self.cache_config)
+                .field("cache_store", &self.cache_store.as_ref().map(|_| "[configured]"))
+                .field("budget_config", &self.budget_config)
+                .field("hooks_count", &self.hooks.len())
+                .field("cooldown_duration", &self.cooldown_duration)
+                .field("rate_limit_config", &self.rate_limit_config)
+                .field("health_check_interval", &self.health_check_interval)
+                .field("enable_cost_tracking", &self.enable_cost_tracking)
+                .field("enable_tracing", &self.enable_tracing);
+        }
+        dbg.finish()
+    }
+}
+/// Fluent, by-value builder for [`ClientConfig`].
+///
+/// Start with [`ClientConfigBuilder::new`], chain setters (they consume the
+/// builder and return it; `header` wraps it in a `Result`), then call
+/// [`ClientConfigBuilder::build`] to obtain the finished [`ClientConfig`].
+#[must_use]
+pub struct ClientConfigBuilder {
+    config: ClientConfig,
+}
+impl ClientConfigBuilder {
+    /// Start a builder whose configuration is [`ClientConfig::new`] applied to
+    /// `api_key`; every other setting keeps that constructor's default.
+    pub fn new(api_key: impl Into<String>) -> Self {
+        let config = ClientConfig::new(api_key);
+        Self { config }
+    }
+    /// Apply one in-place edit to the wrapped configuration and hand the
+    /// builder back, so each public setter reads as a single expression.
+    fn map_config(mut self, edit: impl FnOnce(&mut ClientConfig)) -> Self {
+        edit(&mut self.config);
+        self
+    }
+    /// Route all requests to `url` instead of the provider's own base URL.
+    pub fn base_url(self, url: impl Into<String>) -> Self {
+        self.map_config(|cfg| cfg.base_url = Some(url.into()))
+    }
+    /// Set the per-request timeout (default: 60 s).
+    pub fn timeout(self, timeout: Duration) -> Self {
+        self.map_config(|cfg| cfg.timeout = timeout)
+    }
+    /// Set how many times a request is retried on 429 / 5xx responses
+    /// (default: 3).
+    pub fn max_retries(self, retries: u32) -> Self {
+        self.map_config(|cfg| cfg.max_retries = retries)
+    }
+    /// Install a dynamic credential provider for token-based or refreshable
+    /// auth.
+    ///
+    /// Once configured, the client calls `resolve()` before each request
+    /// rather than authenticating with the static `api_key`.
+    pub fn credential_provider(self, provider: Arc<dyn CredentialProvider>) -> Self {
+        self.map_config(|cfg| cfg.credential_provider = Some(provider))
+    }
+    /// Append a custom header that is sent on every request.
+    ///
+    /// # Errors
+    ///
+    /// Returns [`LiterLlmError::InvalidHeader`] when `key` is not a valid HTTP
+    /// header name or `value` is not a valid HTTP header value.  The name is
+    /// checked first; in both cases the error carries the header name.
+    ///
+    /// Only available with the `native-http` feature, because validation
+    /// relies on `reqwest`'s header types.
+    #[cfg(feature = "native-http")]
+    pub fn header(self, key: impl Into<String>, value: impl Into<String>) -> Result<Self> {
+        let name: String = key.into();
+        let content: String = value.into();
+        // Both checks report failures under the header *name*; the name is
+        // cloned only on the error path.
+        let invalid = |reason: String| LiterLlmError::InvalidHeader {
+            name: name.clone(),
+            reason,
+        };
+        reqwest::header::HeaderName::from_bytes(name.as_bytes()).map_err(|e| invalid(e.to_string()))?;
+        reqwest::header::HeaderValue::from_str(&content).map_err(|e| invalid(e.to_string()))?;
+        Ok(self.map_config(|cfg| cfg.extra_headers.push((name, content))))
+    }
+    /// Store the response-cache configuration for the Tower middleware stack.
+    ///
+    /// Bindings and advanced Rust users can read it back from the built
+    /// [`ClientConfig`] to construct a
+    /// [`CacheLayer`](crate::tower::CacheLayer).
+    #[cfg(feature = "tower")]
+    pub fn cache(self, config: CacheConfig) -> Self {
+        self.map_config(|cfg| cfg.cache_config = Some(config))
+    }
+    /// Store a custom cache backend for the Tower cache middleware.
+    ///
+    /// Combined with [`cache`](Self::cache), the cache layer uses this store
+    /// in place of the default in-memory LRU.
+    #[cfg(feature = "tower")]
+    pub fn cache_store(self, store: Arc<dyn CacheStore>) -> Self {
+        self.map_config(|cfg| cfg.cache_store = Some(store))
+    }
+    /// Store the budget-enforcement configuration for the Tower middleware
+    /// stack.
+    ///
+    /// Bindings and advanced Rust users can read it back from the built
+    /// [`ClientConfig`] to construct a
+    /// [`BudgetLayer`](crate::tower::BudgetLayer).
+    #[cfg(feature = "tower")]
+    pub fn budget(self, config: BudgetConfig) -> Self {
+        self.map_config(|cfg| cfg.budget_config = Some(config))
+    }
+    /// Register one more hook for the Tower hooks middleware stack.
+    ///
+    /// Hooks run sequentially, in registration order, at request lifecycle
+    /// points (pre-request, post-response, on-error).
+    #[cfg(feature = "tower")]
+    pub fn hook(self, hook: Arc<dyn LlmHook>) -> Self {
+        self.map_config(|cfg| cfg.hooks.push(hook))
+    }
+    /// Replace the whole hook list for the Tower hooks middleware stack,
+    /// discarding any hooks registered earlier.
+    ///
+    /// Hooks run sequentially in the order given.
+    #[cfg(feature = "tower")]
+    pub fn hooks(self, hooks: Vec<Arc<dyn LlmHook>>) -> Self {
+        self.map_config(|cfg| cfg.hooks = hooks)
+    }
+    /// Set how long the client cools down after a transient error.
+    ///
+    /// For that duration after a transient error (rate limit, timeout, server
+    /// error) the client rejects requests with `ServiceUnavailable`.
+    #[cfg(feature = "tower")]
+    pub fn cooldown(self, duration: Duration) -> Self {
+        self.map_config(|cfg| cfg.cooldown_duration = Some(duration))
+    }
+    /// Set the per-model rate limiting configuration.
+    ///
+    /// Requests that exceed the configured RPM or TPM limits are rejected
+    /// with [`LiterLlmError::RateLimited`](crate::error::LiterLlmError::RateLimited).
+    #[cfg(feature = "tower")]
+    pub fn rate_limit(self, config: RateLimitConfig) -> Self {
+        self.map_config(|cfg| cfg.rate_limit_config = Some(config))
+    }
+    /// Set the interval of the background health check.
+    ///
+    /// The client then probes the provider periodically and rejects requests
+    /// while the provider is unhealthy.
+    #[cfg(feature = "tower")]
+    pub fn health_check(self, interval: Duration) -> Self {
+        self.map_config(|cfg| cfg.health_check_interval = Some(interval))
+    }
+    /// Turn per-request cost tracking on or off.
+    ///
+    /// When on, the estimated USD cost is recorded on the current tracing
+    /// span as `gen_ai.usage.cost`.
+    #[cfg(feature = "tower")]
+    pub fn cost_tracking(self, enabled: bool) -> Self {
+        self.map_config(|cfg| cfg.enable_cost_tracking = enabled)
+    }
+    /// Turn OpenTelemetry-compatible tracing spans on or off.
+    ///
+    /// When on, every request is wrapped in a `gen_ai` tracing span carrying
+    /// semantic convention attributes.
+    #[cfg(feature = "tower")]
+    pub fn tracing(self, enabled: bool) -> Self {
+        self.map_config(|cfg| cfg.enable_tracing = enabled)
+    }
+    /// Finish building: consume the builder and return its [`ClientConfig`].
+    #[must_use]
+    pub fn build(self) -> ClientConfig {
+        let Self { config } = self;
+        config
+    }
+}