RubyGems - ruby_llm-agents - Versions diffs - 0.4.0 → 0.5.0 - Mend

ruby_llm-agents 0.4.0 → 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (33) hide show

checksums.yaml +4 -4
data/README.md +46 -13
data/app/controllers/ruby_llm/agents/api_configurations_controller.rb +214 -0
data/app/controllers/ruby_llm/agents/{settings_controller.rb → system_config_controller.rb} +3 -3
data/app/controllers/ruby_llm/agents/tenants_controller.rb +109 -0
data/app/models/ruby_llm/agents/api_configuration.rb +386 -0
data/app/models/ruby_llm/agents/tenant_budget.rb +62 -7
data/app/views/layouts/ruby_llm/agents/application.html.erb +3 -1
data/app/views/ruby_llm/agents/api_configurations/_api_key_field.html.erb +34 -0
data/app/views/ruby_llm/agents/api_configurations/_form.html.erb +288 -0
data/app/views/ruby_llm/agents/api_configurations/edit.html.erb +95 -0
data/app/views/ruby_llm/agents/api_configurations/edit_tenant.html.erb +97 -0
data/app/views/ruby_llm/agents/api_configurations/show.html.erb +211 -0
data/app/views/ruby_llm/agents/api_configurations/tenant.html.erb +179 -0
data/app/views/ruby_llm/agents/dashboard/_action_center.html.erb +1 -1
data/app/views/ruby_llm/agents/executions/show.html.erb +82 -0
data/app/views/ruby_llm/agents/{settings → system_config}/show.html.erb +1 -1
data/app/views/ruby_llm/agents/tenants/_form.html.erb +150 -0
data/app/views/ruby_llm/agents/tenants/edit.html.erb +13 -0
data/app/views/ruby_llm/agents/tenants/index.html.erb +129 -0
data/app/views/ruby_llm/agents/tenants/show.html.erb +374 -0
data/config/routes.rb +12 -1
data/lib/generators/ruby_llm_agents/api_configuration_generator.rb +100 -0
data/lib/generators/ruby_llm_agents/templates/create_api_configurations_migration.rb.tt +90 -0
data/lib/ruby_llm/agents/base/execution.rb +83 -0
data/lib/ruby_llm/agents/base.rb +1 -0
data/lib/ruby_llm/agents/budget_tracker.rb +285 -23
data/lib/ruby_llm/agents/configuration.rb +38 -1
data/lib/ruby_llm/agents/engine.rb +1 -0
data/lib/ruby_llm/agents/instrumentation.rb +71 -3
data/lib/ruby_llm/agents/resolved_config.rb +348 -0
data/lib/ruby_llm/agents/version.rb +1 -1
metadata +19 -3

data/lib/generators/ruby_llm_agents/templates/create_api_configurations_migration.rb.tt ADDED Viewed

@@ -0,0 +1,90 @@
+# frozen_string_literal: true
+# Migration to create the api_configurations table
+#
+# This table stores API key configurations that can be managed via the dashboard.
+# Supports both global settings and per-tenant overrides.
+#
+# Resolution priority: per-tenant DB > global DB > config file (RubyLLM.configure)
+#
+# Features:
+# - Encrypted storage for all API keys (using Rails encrypted attributes)
+# - Support for all major LLM providers
+# - Custom endpoint configuration
+# - Connection settings
+# - Default model configuration
+#
+# Run with: rails db:migrate
+class CreateRubyLLMAgentsApiConfigurations < ActiveRecord::Migration<%= migration_version %>
+  def change
+    create_table :ruby_llm_agents_api_configurations do |t|
+      # Scope type: 'global' or 'tenant'
+      # NOTE(review): no database-level constraint restricts this to those two values
+      t.string :scope_type, null: false, default: 'global'
+      # Tenant ID when scope_type='tenant'
+      t.string :scope_id
+      # === Encrypted API Keys ===
+      # Rails `encrypts` stores the encrypted data in the same-named column
+      # Primary providers
+      t.text :openai_api_key
+      t.text :anthropic_api_key
+      t.text :gemini_api_key
+      # Additional providers
+      t.text :deepseek_api_key
+      t.text :mistral_api_key
+      t.text :perplexity_api_key
+      t.text :openrouter_api_key
+      t.text :gpustack_api_key
+      t.text :xai_api_key
+      t.text :ollama_api_key
+      # AWS Bedrock
+      t.text :bedrock_api_key
+      t.text :bedrock_secret_key
+      t.text :bedrock_session_token
+      t.string :bedrock_region
+      # Google Vertex AI
+      t.text :vertexai_credentials
+      t.string :vertexai_project_id
+      t.string :vertexai_location
+      # === Custom Endpoints ===
+      t.string :openai_api_base
+      t.string :gemini_api_base
+      t.string :ollama_api_base
+      t.string :gpustack_api_base
+      t.string :xai_api_base
+      # === OpenAI Options ===
+      t.string :openai_organization_id
+      t.string :openai_project_id
+      # === Default Models ===
+      t.string :default_model
+      t.string :default_embedding_model
+      t.string :default_image_model
+      t.string :default_moderation_model
+      # === Connection Settings ===
+      # All nullable; the retry decimals hold at most 999.99 (precision 5, scale 2)
+      t.integer :request_timeout
+      t.integer :max_retries
+      t.decimal :retry_interval, precision: 5, scale: 2
+      t.decimal :retry_backoff_factor, precision: 5, scale: 2
+      t.decimal :retry_interval_randomness, precision: 5, scale: 2
+      t.string :http_proxy
+      # Whether to inherit from global config for unset values
+      t.boolean :inherit_global_defaults, default: true
+      t.timestamps
+    end
+    # Ensure unique scope_type + scope_id combinations
+    # NOTE(review): rows whose scope_id is NULL (presumably the global row) may not be
+    # de-duplicated by this index on databases that treat NULLs as distinct - confirm
+    # that a single global row is enforced elsewhere.
+    add_index :ruby_llm_agents_api_configurations, [:scope_type, :scope_id], unique: true, name: 'idx_api_configs_scope'
+    # Index for faster tenant lookups
+    add_index :ruby_llm_agents_api_configurations, :scope_id, name: 'idx_api_configs_scope_id'
+  end
+end

data/lib/ruby_llm/agents/base/execution.rb CHANGED Viewed

@@ -17,6 +17,9 @@ module RubyLLM
         # @yieldparam chunk [RubyLLM::Chunk] A streaming chunk with content
         # @return [Object] The processed LLM response
         def call(&block)
+          # Resolve tenant configuration before execution
+          resolve_tenant_context!
           return dry_run_response if @options[:dry_run]
           return uncached_call(&block) if @options[:skip_cache] || !self.class.cache_enabled?
@@ -36,6 +39,52 @@ module RubyLLM
           end
         end
+        # Resolves tenant context from the :tenant option
+        #
+        # Sets @tenant_id and @tenant_config from @options[:tenant]. The option can be:
+        # - Hash: the value under :id becomes the tenant id (stringified); every
+        #   other key is kept as the runtime tenant config
+        # - Anything else (e.g. a String): stringified and used as the tenant id,
+        #   with no runtime config
+        #
+        # Does nothing when no :tenant option was given.
+        #
+        # @return [void]
+        def resolve_tenant_context!
+          # Idempotency guard - only resolve once
+          # (the flag is only set once a tenant option has actually been processed)
+          return if defined?(@tenant_context_resolved) && @tenant_context_resolved
+          tenant_option = @options[:tenant]
+          return unless tenant_option
+          if tenant_option.is_a?(Hash)
+            # Full config passed - extract id and store config
+            # NOTE(review): only the symbol key :id is read; a string-keyed hash
+            # ("id" => ...) yields a nil tenant id - confirm callers pass symbol keys
+            @tenant_id = tenant_option[:id]&.to_s
+            @tenant_config = tenant_option.except(:id)
+          else
+            # Just tenant_id passed
+            @tenant_id = tenant_option.to_s
+            @tenant_config = nil
+          end
+          @tenant_context_resolved = true
+        end
+        # Returns the resolved tenant ID
+        #
+        # @return [String, nil] The tenant identifier
+        def resolved_tenant_id
+          return @tenant_id if defined?(@tenant_id) && @tenant_id.present?
+          config = RubyLLM::Agents.configuration
+          return nil unless config.multi_tenancy_enabled?
+          config.current_tenant_id
+        end
+        # Returns the runtime tenant config (if passed via :tenant option)
+        #
+        # This is the value stored in @tenant_config; nil when the instance
+        # variable has never been assigned or was assigned nil.
+        #
+        # @return [Hash, nil] Runtime tenant configuration
+        def runtime_tenant_config
+          # defined? guard avoids reading an instance variable that was never set
+          @tenant_config if defined?(@tenant_config)
+        end
         # Executes the agent without caching
         #
         # Routes to reliability-enabled execution if configured, otherwise
@@ -226,6 +275,9 @@ module RubyLLM
         #
         # @return [RubyLLM::Chat] Configured chat client
         def build_client
+          # Apply database-backed API configuration if available
+          apply_api_configuration!
           client = RubyLLM.chat
             .with_model(model)
             .with_temperature(temperature)
@@ -236,11 +288,42 @@ module RubyLLM
           client
         end
+        # Applies database-backed API configuration to RubyLLM
+        #
+        # Resolution priority: per-tenant DB > global DB > RubyLLM.configure
+        # Only applies if the api_configurations table exists.
+        #
+        # Best-effort: any StandardError raised while resolving or applying the
+        # configuration is logged as a warning and swallowed, so the caller
+        # continues with whatever RubyLLM configuration is already in place.
+        #
+        # NOTE(review): apply_to_ruby_llm! presumably mutates process-wide RubyLLM
+        # settings - confirm this is safe when different tenants run concurrently.
+        #
+        # @return [void]
+        def apply_api_configuration!
+          return unless api_configuration_available?
+          resolved_config = ApiConfiguration.resolve(tenant_id: resolved_tenant_id)
+          resolved_config.apply_to_ruby_llm!
+        rescue StandardError => e
+          # Deliberately non-fatal: a broken DB config must not prevent execution
+          Rails.logger.warn("[RubyLLM::Agents] Failed to apply API config: #{e.message}")
+        end
+        # Checks if API configuration table is available
+        #
+        # The answer is memoized in @api_config_available (including a false
+        # answer), so the table check runs at most once per instance.
+        #
+        # @return [Boolean] true if table exists and is accessible
+        def api_configuration_available?
+          # defined? rather than ||= so that a cached false is not re-evaluated
+          return @api_config_available if defined?(@api_config_available)
+          @api_config_available = begin
+            ApiConfiguration.table_exists?
+          rescue StandardError
+            # Any failure while checking is treated as "not available"
+            false
+          end
+        end
         # Builds a client with a specific model
         #
         # @param model_id [String] The model identifier
         # @return [RubyLLM::Chat] Configured chat client
         def build_client_with_model(model_id)
+          # Apply database-backed API configuration if available
+          apply_api_configuration!
           client = RubyLLM.chat
             .with_model(model_id)
             .with_temperature(temperature)

data/lib/ruby_llm/agents/base.rb CHANGED Viewed

@@ -136,6 +136,7 @@ module RubyLLM
         @options = options
         @accumulated_tool_calls = []
         validate_required_params!
+        resolve_tenant_context!  # Resolve tenant before building client for API key resolution
         @client = build_client
       end

data/lib/ruby_llm/agents/budget_tracker.rb CHANGED Viewed

@@ -36,11 +36,12 @@ module RubyLLM
         #
         # @param agent_type [String] The agent class name
         # @param tenant_id [String, nil] Optional tenant identifier (uses resolver if not provided)
+        # @param tenant_config [Hash, nil] Optional runtime tenant config (takes priority over resolver/DB)
         # @raise [Reliability::BudgetExceededError] If hard cap is exceeded
         # @return [void]
-        def check_budget!(agent_type, tenant_id: nil)
+        def check_budget!(agent_type, tenant_id: nil, tenant_config: nil)
           tenant_id = resolve_tenant_id(tenant_id)
-          budget_config = resolve_budget_config(tenant_id)
+          budget_config = resolve_budget_config(tenant_id, runtime_config: tenant_config)
           return unless budget_config[:enabled]
           return unless budget_config[:enforcement] == :hard
@@ -48,13 +49,31 @@ module RubyLLM
           check_budget_limits!(agent_type, tenant_id, budget_config)
         end
+        # Checks if the current token usage exceeds budget limits
+        #
+        # @param agent_type [String] The agent class name
+        # @param tenant_id [String, nil] Optional tenant identifier (uses resolver if not provided)
+        # @param tenant_config [Hash, nil] Optional runtime tenant config (takes priority over resolver/DB)
+        # @raise [Reliability::BudgetExceededError] If hard cap is exceeded
+        # @return [void]
+        def check_token_budget!(agent_type, tenant_id: nil, tenant_config: nil)
+          tenant_id = resolve_tenant_id(tenant_id)
+          budget_config = resolve_budget_config(tenant_id, runtime_config: tenant_config)
+          return unless budget_config[:enabled]
+          return unless budget_config[:enforcement] == :hard
+          check_token_limits!(agent_type, tenant_id, budget_config)
+        end
         # Records spend and checks for soft cap alerts
         #
         # @param agent_type [String] The agent class name
         # @param amount [Float] The amount spent in USD
         # @param tenant_id [String, nil] Optional tenant identifier (uses resolver if not provided)
+        # @param tenant_config [Hash, nil] Optional runtime tenant config (takes priority over resolver/DB)
         # @return [void]
-        def record_spend!(agent_type, amount, tenant_id: nil)
+        def record_spend!(agent_type, amount, tenant_id: nil, tenant_config: nil)
           return if amount.nil? || amount <= 0
           tenant_id = resolve_tenant_id(tenant_id)
@@ -66,10 +85,33 @@ module RubyLLM
           increment_spend(:agent, :monthly, amount, agent_type: agent_type, tenant_id: tenant_id)
           # Check for soft cap alerts
-          budget_config = resolve_budget_config(tenant_id)
+          budget_config = resolve_budget_config(tenant_id, runtime_config: tenant_config)
           check_soft_cap_alerts(agent_type, tenant_id, budget_config) if budget_config[:enabled]
         end
+        # Records token usage and checks for soft cap alerts
+        #
+        # @param agent_type [String] The agent class name
+        # @param tokens [Integer] The number of tokens used
+        # @param tenant_id [String, nil] Optional tenant identifier (uses resolver if not provided)
+        # @param tenant_config [Hash, nil] Optional runtime tenant config (takes priority over resolver/DB)
+        # @return [void]
+        def record_tokens!(agent_type, tokens, tenant_id: nil, tenant_config: nil)
+          return if tokens.nil? || tokens <= 0
+          tenant_id = resolve_tenant_id(tenant_id)
+          # Increment all relevant token counters
+          increment_tokens(:global, :daily, tokens, tenant_id: tenant_id)
+          increment_tokens(:global, :monthly, tokens, tenant_id: tenant_id)
+          increment_tokens(:agent, :daily, tokens, agent_type: agent_type, tenant_id: tenant_id)
+          increment_tokens(:agent, :monthly, tokens, agent_type: agent_type, tenant_id: tenant_id)
+          # Check for soft cap alerts
+          budget_config = resolve_budget_config(tenant_id, runtime_config: tenant_config)
+          check_soft_token_alerts(agent_type, tenant_id, budget_config) if budget_config[:enabled]
+        end
         # Returns the current spend for a scope and period
         #
         # @param scope [Symbol] :global or :agent
@@ -83,6 +125,17 @@ module RubyLLM
           (BudgetTracker.cache_read(key) || 0).to_f
         end
+        # Returns the current token usage for a period (global only)
+        #
+        # Reads the counter stored under token_cache_key for the resolved tenant.
+        #
+        # @param period [Symbol] :daily or :monthly
+        # @param tenant_id [String, nil] Optional tenant identifier (uses resolver if not provided)
+        # @return [Integer] Current token usage (0 when nothing is cached)
+        def current_tokens(period, tenant_id: nil)
+          tenant_id = resolve_tenant_id(tenant_id)
+          key = token_cache_key(period, tenant_id: tenant_id)
+          # A missing cache entry counts as zero usage
+          (BudgetTracker.cache_read(key) || 0).to_i
+        end
         # Returns the remaining budget for a scope and period
         #
         # @param scope [Symbol] :global or :agent
@@ -110,6 +163,27 @@ module RubyLLM
           [limit - current_spend(scope, period, agent_type: agent_type, tenant_id: tenant_id), 0].max
         end
+        # Returns the remaining token budget for a period (global only)
+        #
+        # @param period [Symbol] :daily or :monthly
+        # @param tenant_id [String, nil] Optional tenant identifier (uses resolver if not provided)
+        # @return [Integer, nil] Remaining token budget, or nil if no limit configured
+        def remaining_token_budget(period, tenant_id: nil)
+          tenant_id = resolve_tenant_id(tenant_id)
+          budget_config = resolve_budget_config(tenant_id)
+          limit = case period
+          when :daily
+            budget_config[:global_daily_tokens]
+          when :monthly
+            budget_config[:global_monthly_tokens]
+          end
+          return nil unless limit
+          [limit - current_tokens(period, tenant_id: tenant_id), 0].max
+        end
         # Returns a summary of all budget statuses
         #
         # @param agent_type [String, nil] Optional agent type for per-agent budgets
@@ -123,10 +197,14 @@ module RubyLLM
             tenant_id: tenant_id,
             enabled: budget_config[:enabled],
             enforcement: budget_config[:enforcement],
+            # Cost budgets
             global_daily: budget_status(:global, :daily, budget_config[:global_daily], tenant_id: tenant_id),
             global_monthly: budget_status(:global, :monthly, budget_config[:global_monthly], tenant_id: tenant_id),
             per_agent_daily: agent_type ? budget_status(:agent, :daily, budget_config[:per_agent_daily]&.dig(agent_type), agent_type: agent_type, tenant_id: tenant_id) : nil,
             per_agent_monthly: agent_type ? budget_status(:agent, :monthly, budget_config[:per_agent_monthly]&.dig(agent_type), agent_type: agent_type, tenant_id: tenant_id) : nil,
+            # Token budgets (global only)
+            global_daily_tokens: token_status(:daily, budget_config[:global_daily_tokens], tenant_id: tenant_id),
+            global_monthly_tokens: token_status(:monthly, budget_config[:global_monthly_tokens], tenant_id: tenant_id),
             forecast: calculate_forecast(tenant_id: tenant_id)
           }.compact
         end
@@ -225,41 +303,86 @@ module RubyLLM
         # Resolves budget configuration for a tenant
         #
+        # Priority order:
+        # 1. runtime_config (passed to run())
+        # 2. tenant_config_resolver (configured lambda)
+        # 3. TenantBudget database record
+        # 4. Global configuration
+        #
         # @param tenant_id [String, nil] The tenant identifier
+        # @param runtime_config [Hash, nil] Runtime config passed to run()
         # @return [Hash] Budget configuration
-        def resolve_budget_config(tenant_id)
+        def resolve_budget_config(tenant_id, runtime_config: nil)
           config = RubyLLM::Agents.configuration
+          # Priority 1: Runtime config passed directly to run()
+          if runtime_config.present?
+            return normalize_budget_config(runtime_config, config)
+          end
           # If multi-tenancy is disabled or no tenant, use global config
           if tenant_id.nil? || !config.multi_tenancy_enabled?
-            return {
-              enabled: config.budgets_enabled?,
-              enforcement: config.budget_enforcement,
-              global_daily: config.budgets&.dig(:global_daily),
-              global_monthly: config.budgets&.dig(:global_monthly),
-              per_agent_daily: config.budgets&.dig(:per_agent_daily),
-              per_agent_monthly: config.budgets&.dig(:per_agent_monthly)
-            }
+            return global_budget_config(config)
+          end
+          # Priority 2: tenant_config_resolver lambda
+          if config.tenant_config_resolver.present?
+            resolved_config = config.tenant_config_resolver.call(tenant_id)
+            if resolved_config.present?
+              return normalize_budget_config(resolved_config, config)
+            end
           end
-          # Look up tenant-specific budget from database (if table exists)
+          # Priority 3: Look up tenant-specific budget from database
           tenant_budget = lookup_tenant_budget(tenant_id)
           if tenant_budget
             tenant_budget.to_budget_config
           else
-            # Fall back to global config for unknown tenants
-            {
-              enabled: config.budgets_enabled?,
-              enforcement: config.budget_enforcement,
-              global_daily: config.budgets&.dig(:global_daily),
-              global_monthly: config.budgets&.dig(:global_monthly),
-              per_agent_daily: config.budgets&.dig(:per_agent_daily),
-              per_agent_monthly: config.budgets&.dig(:per_agent_monthly)
-            }
+            # Priority 4: Fall back to global config for unknown tenants
+            global_budget_config(config)
           end
         end
+        # Builds global budget config from configuration
+        #
+        # Produces the same hash shape as normalize_budget_config: the enabled
+        # flag, the enforcement mode, cost limits and token limits. Every limit
+        # is read from config.budgets and is nil when budgets is nil or the key
+        # is absent.
+        #
+        # @param config [Configuration] The configuration object
+        # @return [Hash] Budget configuration
+        def global_budget_config(config)
+          {
+            enabled: config.budgets_enabled?,
+            enforcement: config.budget_enforcement,
+            # Cost limits
+            global_daily: config.budgets&.dig(:global_daily),
+            global_monthly: config.budgets&.dig(:global_monthly),
+            per_agent_daily: config.budgets&.dig(:per_agent_daily),
+            per_agent_monthly: config.budgets&.dig(:per_agent_monthly),
+            # Token limits
+            global_daily_tokens: config.budgets&.dig(:global_daily_tokens),
+            global_monthly_tokens: config.budgets&.dig(:global_monthly_tokens)
+          }
+        end
+        # Normalizes runtime/resolver config to standard budget config format
+        #
+        # @param raw_config [Hash] Raw config from runtime or resolver
+        # @param global_config [Configuration] Global config for fallbacks
+        # @return [Hash] Normalized budget configuration
+        def normalize_budget_config(raw_config, global_config)
+          enforcement = raw_config[:enforcement]&.to_sym || global_config.budget_enforcement
+          {
+            enabled: enforcement != :none,
+            enforcement: enforcement,
+            # Cost/budget limits (USD)
+            global_daily: raw_config[:daily_budget_limit],
+            global_monthly: raw_config[:monthly_budget_limit],
+            per_agent_daily: raw_config[:per_agent_daily] || {},
+            per_agent_monthly: raw_config[:per_agent_monthly] || {},
+            # Token limits
+            global_daily_tokens: raw_config[:daily_token_limit],
+            global_monthly_tokens: raw_config[:monthly_token_limit]
+          }
+        end
         # Safely looks up tenant budget, handling missing table
         #
         # @param tenant_id [String] The tenant identifier
@@ -465,6 +588,145 @@ module RubyLLM
             timestamp: Date.current.to_s
           })
         end
+        # Increments the token counter for a period
+        #
+        # The counter is identified by period and tenant only (see
+        # token_cache_key); scope and agent_type are accepted but do not
+        # influence which counter is updated.
+        #
+        # @param scope [Symbol] :global (only global supported for tokens; currently unused)
+        # @param period [Symbol] :daily or :monthly
+        # @param tokens [Integer] Tokens to add
+        # @param agent_type [String, nil] Currently unused
+        # @param tenant_id [String, nil] The tenant identifier
+        # @return [Integer] New total
+        def increment_tokens(scope, period, tokens, agent_type: nil, tenant_id: nil)
+          # For now, we only track global token usage (not per-agent)
+          key = token_cache_key(period, tenant_id: tenant_id)
+          # Any period other than :daily gets the 31-day expiry
+          ttl = period == :daily ? 1.day : 31.days
+          # Read-then-write update.
+          # NOTE(review): concurrent writers could overwrite each other's increment -
+          # confirm whether the cache layer offers an atomic increment
+          current = (BudgetTracker.cache_read(key) || 0).to_i
+          new_total = current + tokens
+          BudgetTracker.cache_write(key, new_total, expires_in: ttl)
+          new_total
+        end
+        # Generates a cache key for token tracking
+        #
+        # @param period [Symbol] :daily or :monthly
+        # @param tenant_id [String, nil] The tenant identifier
+        # @return [String] Cache key
+        def token_cache_key(period, tenant_id: nil)
+          date_part = period == :daily ? Date.current.to_s : Date.current.strftime("%Y-%m")
+          tenant_part = tenant_id.present? ? "tenant:#{tenant_id}" : "global"
+          BudgetTracker.cache_key("tokens", tenant_part, date_part)
+        end
+        # Checks token limits and raises error if exceeded
+        #
+        # @param agent_type [String] The agent class name
+        # @param tenant_id [String, nil] The tenant identifier
+        # @param budget_config [Hash] The budget configuration
+        # @raise [Reliability::BudgetExceededError] If limit exceeded
+        # @return [void]
+        def check_token_limits!(agent_type, tenant_id, budget_config)
+          # Check global daily token budget
+          if budget_config[:global_daily_tokens]
+            current = current_tokens(:daily, tenant_id: tenant_id)
+            if current >= budget_config[:global_daily_tokens]
+              raise Reliability::BudgetExceededError.new(
+                :global_daily_tokens,
+                budget_config[:global_daily_tokens],
+                current,
+                tenant_id: tenant_id
+              )
+            end
+          end
+          # Check global monthly token budget
+          if budget_config[:global_monthly_tokens]
+            current = current_tokens(:monthly, tenant_id: tenant_id)
+            if current >= budget_config[:global_monthly_tokens]
+              raise Reliability::BudgetExceededError.new(
+                :global_monthly_tokens,
+                budget_config[:global_monthly_tokens],
+                current,
+                tenant_id: tenant_id
+              )
+            end
+          end
+        end
+        # Checks for soft cap token alerts after recording usage
+        #
+        # Skipped entirely when alerts are disabled or when neither
+        # :token_soft_cap nor :token_hard_cap is among the configured alert
+        # events. Otherwise the daily and monthly limits are each handed to
+        # check_token_alert, which decides whether to notify.
+        #
+        # @param agent_type [String] The agent class name
+        # @param tenant_id [String, nil] The tenant identifier
+        # @param budget_config [Hash] Budget configuration
+        # @return [void]
+        def check_soft_token_alerts(agent_type, tenant_id, budget_config)
+          config = RubyLLM::Agents.configuration
+          return unless config.alerts_enabled?
+          # Cheap pre-check: nothing to do unless at least one token event is subscribed
+          return unless config.alert_events.include?(:token_soft_cap) || config.alert_events.include?(:token_hard_cap)
+          # Check global daily tokens
+          check_token_alert(:global_daily_tokens, budget_config[:global_daily_tokens],
+                           current_tokens(:daily, tenant_id: tenant_id),
+                           agent_type, tenant_id, budget_config)
+          # Check global monthly tokens
+          check_token_alert(:global_monthly_tokens, budget_config[:global_monthly_tokens],
+                           current_tokens(:monthly, tenant_id: tenant_id),
+                           agent_type, tenant_id, budget_config)
+        end
+        # Checks if a token alert should be fired
+        #
+        # Notifies AlertManager when usage is strictly above the limit, the
+        # matching event (:token_hard_cap under :hard enforcement, otherwise
+        # :token_soft_cap) is among the configured alert events, and no
+        # de-duplication marker exists for this scope, tenant and day.
+        #
+        # @param scope [Symbol] Token scope
+        # @param limit [Integer, nil] Token limit
+        # @param current [Integer] Current token usage
+        # @param agent_type [String] Agent type
+        # @param tenant_id [String, nil] The tenant identifier
+        # @param budget_config [Hash] Budget configuration
+        # @return [void]
+        def check_token_alert(scope, limit, current, agent_type, tenant_id, budget_config)
+          return unless limit
+          # Usage exactly at the limit does not alert; only usage above it does
+          return if current <= limit
+          event = budget_config[:enforcement] == :hard ? :token_hard_cap : :token_soft_cap
+          config = RubyLLM::Agents.configuration
+          return unless config.alert_events.include?(event)
+          # Prevent duplicate alerts
+          # The marker key is per day but is written with a one-hour expiry.
+          # NOTE(review): the same alert can presumably fire again once the
+          # marker expires - confirm hourly repetition is intended
+          tenant_part = tenant_id.present? ? "tenant:#{tenant_id}" : "global"
+          alert_key = BudgetTracker.cache_key("token_alert", tenant_part, scope, Date.current.to_s)
+          return if BudgetTracker.cache_exist?(alert_key)
+          BudgetTracker.cache_write(alert_key, true, expires_in: 1.hour)
+          AlertManager.notify(event, {
+            scope: scope,
+            limit: limit,
+            total: current,
+            agent_type: agent_type,
+            tenant_id: tenant_id,
+            timestamp: Date.current.to_s
+          })
+        end
+        # Returns token status for a period
+        #
+        # @param period [Symbol] :daily or :monthly
+        # @param limit [Integer, nil] The token limit
+        # @param tenant_id [String, nil] The tenant identifier
+        # @return [Hash, nil] Status hash or nil if no limit
+        def token_status(period, limit, tenant_id: nil)
+          return nil unless limit
+          current = current_tokens(period, tenant_id: tenant_id)
+          {
+            limit: limit,
+            current: current,
+            remaining: [limit - current, 0].max,
+            percentage_used: ((current.to_f / limit) * 100).round(2)
+          }
+        end
       end
     end
   end

data/lib/ruby_llm/agents/configuration.rb CHANGED Viewed

@@ -195,6 +195,35 @@ module RubyLLM
       #   @example Using request store
       #     config.tenant_resolver = -> { RequestStore[:tenant_id] }
+      # @!attribute [rw] tenant_config_resolver
+      #   Lambda that returns tenant configuration without querying the database.
+      #   Called when resolving tenant budget config. If set, this takes priority
+      #   over the TenantBudget database lookup.
+      #   @return [Proc, nil] Tenant config resolver lambda (default: nil)
+      #   @example Using an external tenant service
+      #     config.tenant_config_resolver = ->(tenant_id) {
+      #       tenant = Tenant.find(tenant_id)
+      #       {
+      #         name: tenant.name,
+      #         daily_limit: tenant.subscription.daily_budget,
+      #         monthly_limit: tenant.subscription.monthly_budget,
+      #         daily_token_limit: tenant.subscription.daily_tokens,
+      #         monthly_token_limit: tenant.subscription.monthly_tokens,
+      #         enforcement: tenant.subscription.hard_limits? ? :hard : :soft
+      #       }
+      #     }
+      # @!attribute [rw] persist_messages_summary
+      #   Whether to persist a summary of conversation messages in execution records.
+      #   When true, stores message count and first/last messages (truncated).
+      #   Set to false to disable message summary persistence.
+      #   @return [Boolean] Enable messages summary persistence (default: true)
+      # @!attribute [rw] messages_summary_max_length
+      #   Maximum character length for message content in the summary.
+      #   Content exceeding this length will be truncated with "...".
+      #   @return [Integer] Max length for message content (default: 500)
       attr_accessor :default_model,
                     :default_temperature,
                     :default_timeout,
@@ -220,7 +249,10 @@ module RubyLLM
                     :persist_responses,
                     :redaction,
                     :multi_tenancy_enabled,
-                    :tenant_resolver
+                    :tenant_resolver,
+                    :tenant_config_resolver,
+                    :persist_messages_summary,
+                    :messages_summary_max_length
       attr_writer :cache_store
@@ -264,6 +296,11 @@ module RubyLLM
         # Multi-tenancy defaults (disabled for backward compatibility)
         @multi_tenancy_enabled = false
         @tenant_resolver = -> { nil }
+        @tenant_config_resolver = nil
+        # Messages summary defaults
+        @persist_messages_summary = true
+        @messages_summary_max_length = 500
       end
       # Returns the configured cache store, falling back to Rails.cache

data/lib/ruby_llm/agents/engine.rb CHANGED Viewed

@@ -34,6 +34,7 @@ module RubyLLM
       config.to_prepare do
         require_relative "execution_logger_job"
         require_relative "instrumentation"
+        require_relative "resolved_config"
         require_relative "base"
         require_relative "workflow"