llm_cost_tracker 0.5.0 → 0.5.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +38 -0
- data/README.md +116 -467
- data/app/controllers/llm_cost_tracker/calls_controller.rb +2 -1
- data/app/controllers/llm_cost_tracker/dashboard_controller.rb +3 -15
- data/app/controllers/llm_cost_tracker/tags_controller.rb +7 -6
- data/app/helpers/llm_cost_tracker/application_helper.rb +21 -6
- data/app/helpers/llm_cost_tracker/dashboard_filter_options_helper.rb +3 -1
- data/app/services/llm_cost_tracker/dashboard/date_range.rb +42 -0
- data/app/services/llm_cost_tracker/dashboard/filter.rb +6 -8
- data/app/services/llm_cost_tracker/dashboard/spend_anomaly.rb +6 -5
- data/app/services/llm_cost_tracker/dashboard/tag_breakdown.rb +74 -18
- data/app/services/llm_cost_tracker/dashboard/tag_key_explorer.rb +15 -4
- data/app/views/llm_cost_tracker/shared/_tag_chips.html.erb +1 -1
- data/app/views/llm_cost_tracker/tags/show.html.erb +4 -0
- data/lib/llm_cost_tracker/configuration.rb +22 -16
- data/lib/llm_cost_tracker/doctor.rb +1 -1
- data/lib/llm_cost_tracker/generators/llm_cost_tracker/install_generator.rb +1 -0
- data/lib/llm_cost_tracker/generators/llm_cost_tracker/templates/initializer.rb.erb +8 -2
- data/lib/llm_cost_tracker/integrations/anthropic.rb +12 -3
- data/lib/llm_cost_tracker/integrations/base.rb +77 -6
- data/lib/llm_cost_tracker/integrations/object_reader.rb +1 -1
- data/lib/llm_cost_tracker/integrations/openai.rb +14 -5
- data/lib/llm_cost_tracker/integrations/registry.rb +3 -1
- data/lib/llm_cost_tracker/integrations/ruby_llm.rb +171 -0
- data/lib/llm_cost_tracker/llm_api_call.rb +10 -9
- data/lib/llm_cost_tracker/middleware/faraday.rb +10 -6
- data/lib/llm_cost_tracker/parsers/gemini.rb +8 -1
- data/lib/llm_cost_tracker/parsers/openai_usage.rb +11 -2
- data/lib/llm_cost_tracker/price_freshness.rb +3 -3
- data/lib/llm_cost_tracker/price_registry.rb +3 -0
- data/lib/llm_cost_tracker/price_sync/fetcher.rb +43 -12
- data/lib/llm_cost_tracker/price_sync/registry_diff.rb +51 -0
- data/lib/llm_cost_tracker/price_sync/registry_loader.rb +6 -0
- data/lib/llm_cost_tracker/price_sync/registry_writer.rb +5 -1
- data/lib/llm_cost_tracker/price_sync.rb +103 -111
- data/lib/llm_cost_tracker/prices.json +225 -229
- data/lib/llm_cost_tracker/pricing.rb +27 -15
- data/lib/llm_cost_tracker/report.rb +8 -1
- data/lib/llm_cost_tracker/report_data.rb +25 -9
- data/lib/llm_cost_tracker/retention.rb +30 -7
- data/lib/llm_cost_tracker/storage/dispatcher.rb +68 -0
- data/lib/llm_cost_tracker/stream_capture.rb +7 -0
- data/lib/llm_cost_tracker/stream_collector.rb +25 -1
- data/lib/llm_cost_tracker/tag_sanitizer.rb +81 -0
- data/lib/llm_cost_tracker/tracker.rb +7 -59
- data/lib/llm_cost_tracker/version.rb +1 -1
- data/lib/llm_cost_tracker.rb +1 -0
- data/lib/tasks/llm_cost_tracker.rake +24 -78
- metadata +26 -15
- data/lib/llm_cost_tracker/price_sync/merger.rb +0 -72
- data/lib/llm_cost_tracker/price_sync/model_catalog.rb +0 -77
- data/lib/llm_cost_tracker/price_sync/raw_price.rb +0 -33
- data/lib/llm_cost_tracker/price_sync/refresh_plan_builder.rb +0 -164
- data/lib/llm_cost_tracker/price_sync/source.rb +0 -29
- data/lib/llm_cost_tracker/price_sync/source_result.rb +0 -7
- data/lib/llm_cost_tracker/price_sync/sources/litellm.rb +0 -90
- data/lib/llm_cost_tracker/price_sync/sources/open_router.rb +0 -93
- data/lib/llm_cost_tracker/price_sync/validator.rb +0 -66
|
# frozen_string_literal: true

require "json"

module LlmCostTracker
  module PriceSync
    module Sources
      # Pulls per-token pricing from the community-maintained LiteLLM price
      # catalog and converts matching entries into per-million-token RawPrice
      # records for the models we already track.
      class Litellm < Source
        PER_TOKEN_TO_PER_MILLION = 1_000_000
        SUPPORTED_MODES = %w[chat completion embedding responses].freeze
        SUPPORTED_PROVIDERS = %w[openai anthropic gemini text-completion-openai].freeze
        URL = "https://raw.githubusercontent.com/BerriAI/litellm/main/model_prices_and_context_window.json"

        def priority = 10

        def url = URL

        # Downloads the catalog and returns a SourceResult containing the
        # prices that were found plus the (sorted) models that had no usable
        # catalog entry. Raises Error when the payload is not valid JSON.
        def fetch(current_models:, fetcher:)
          response = fetcher.get(url)
          catalog = JSON.parse(response.body.to_s)

          prices = []
          unmatched = []

          current_models.each_key do |model_name|
            entry = supported_entry_for(model_name, catalog)
            if entry
              prices << build_raw_price(model_name, entry, response)
            else
              unmatched << model_name
            end
          end

          SourceResult.new(
            prices: prices,
            missing_models: unmatched.sort,
            source_version: response_version(response)
          )
        rescue JSON::ParserError => e
          raise Error, "Unable to parse #{url}: #{e.message}"
        end

        private

        # Resolves one of our model names to a catalog entry; returns nil when
        # no entry matches or the entry's provider/mode is outside our support.
        def supported_entry_for(model_name, catalog)
          entry_id = ModelCatalog.resolve_from_litellm(model_name, catalog)
          entry = entry_id && catalog[entry_id]
          entry if entry && supported_entry?(entry)
        end

        def supported_entry?(entry)
          SUPPORTED_PROVIDERS.include?(entry["litellm_provider"]) &&
            SUPPORTED_MODES.include?(entry["mode"]) &&
            entry.key?("input_cost_per_token") &&
            entry.key?("output_cost_per_token")
        end

        def build_raw_price(model, entry, response)
          RawPrice.new(
            model: model,
            provider: normalize_provider(entry["litellm_provider"]),
            input: price_per_million(entry["input_cost_per_token"]),
            output: price_per_million(entry["output_cost_per_token"]),
            cache_read_input: price_per_million(entry["cache_read_input_token_cost"]),
            cache_write_input: price_per_million(entry["cache_creation_input_token_cost"]),
            source: name,
            source_version: response_version(response),
            fetched_at: response.fetched_at
          )
        end

        # LiteLLM keeps legacy completion models under their own provider key;
        # fold those back into plain "openai".
        def normalize_provider(provider)
          provider == "text-completion-openai" ? "openai" : provider
        end

        # Catalog costs are USD per token; the registry stores USD per 1M tokens.
        def price_per_million(per_token_cost)
          return if per_token_cost.nil?

          per_token_cost.to_f * PER_TOKEN_TO_PER_MILLION
        end
      end
    end
  end
end
# frozen_string_literal: true

require "json"

module LlmCostTracker
  module PriceSync
    module Sources
      # Pulls model pricing from the public OpenRouter models API and converts
      # matching entries into per-million-token RawPrice records for the
      # models we already track.
      class OpenRouter < Source
        PER_TOKEN_TO_PER_MILLION = 1_000_000
        SUPPORTED_PREFIXES = %w[openai anthropic google].freeze
        URL = "https://openrouter.ai/api/v1/models"

        def priority = 20

        def url = URL

        # Downloads the model list and returns a SourceResult containing the
        # prices that were found plus the (sorted) models that had no usable
        # entry. Raises Error when the payload is not valid JSON.
        def fetch(current_models:, fetcher:)
          response = fetcher.get(url)
          payload = JSON.parse(response.body.to_s)
          entries_by_id = payload.fetch("data", []).to_h { |entry| [entry["id"], entry] }

          prices = []
          unmatched = []

          current_models.each_key do |model_name|
            entry = supported_entry_for(model_name, entries_by_id)
            if entry
              prices << build_raw_price(model_name, entry, response)
            else
              unmatched << model_name
            end
          end

          SourceResult.new(
            prices: prices,
            missing_models: unmatched.sort,
            source_version: response_version(response)
          )
        rescue JSON::ParserError => e
          raise Error, "Unable to parse #{url}: #{e.message}"
        end

        private

        # Resolves one of our model names to an API entry; returns nil when no
        # entry matches or the entry's provider prefix/pricing is unsupported.
        def supported_entry_for(model_name, entries_by_id)
          entry_id = ModelCatalog.resolve_from_openrouter(model_name, entries_by_id)
          entry = entry_id && entries_by_id[entry_id]
          entry if entry && supported_entry?(entry)
        end

        def supported_entry?(entry)
          pricing = entry["pricing"] || {}
          provider = entry["id"].to_s.split("/").first

          SUPPORTED_PREFIXES.include?(provider) &&
            pricing["prompt"] &&
            pricing["completion"]
        end

        def build_raw_price(model, entry, response)
          pricing = entry.fetch("pricing", {})

          RawPrice.new(
            model: model,
            provider: normalize_provider(entry.fetch("id").split("/").first),
            input: price_per_million(pricing["prompt"]),
            output: price_per_million(pricing["completion"]),
            cache_read_input: price_per_million(pricing["input_cache_read"]),
            cache_write_input: price_per_million(pricing["input_cache_write"]),
            source: name,
            source_version: response_version(response),
            fetched_at: response.fetched_at
          )
        end

        # OpenRouter namespaces Gemini models under "google"; the registry
        # uses "gemini" as the provider name.
        def normalize_provider(provider)
          provider == "google" ? "gemini" : provider
        end

        # API prices are USD per token; the registry stores USD per 1M tokens.
        def price_per_million(per_token_cost)
          return if per_token_cost.nil?

          per_token_cost.to_f * PER_TOKEN_TO_PER_MILLION
        end
      end
    end
  end
end
# frozen_string_literal: true

module LlmCostTracker
  module PriceSync
    # Sanity-checks a batch of freshly merged prices against the current
    # registry before they are written: rejects implausible absolute values
    # and flags suspiciously large relative changes for human review.
    class Validator
      Result = Data.define(:accepted, :rejected, :flagged)
      Issue = Data.define(:model, :reason, :old_price, :new_price)

      # Hard ceilings (USD per 1M tokens) beyond which a price is rejected.
      MAX_INPUT_PER_MILLION = 100.0
      MAX_OUTPUT_PER_MILLION = 500.0
      # A price moving by more than this factor (up or down) is flagged.
      MAX_RELATIVE_CHANGE = 3.0

      # Validates every model/price pair. Returns a Result whose +accepted+ is
      # a model => price hash (flagged prices are still accepted), and whose
      # +rejected+/+flagged+ are arrays of Issue records.
      def validate_batch(merged_prices, existing_registry:)
        outcome = Result.new(accepted: {}, rejected: [], flagged: [])

        merged_prices.each do |model, new_price|
          previous = normalize_entry(existing_registry[model])
          status, reason = validate(new_price: new_price, old_price: previous)
          issue = Issue.new(model: model, reason: reason, old_price: previous, new_price: new_price)

          case status
          when :rejected
            outcome.rejected << issue
          when :flagged
            outcome.flagged << issue
            outcome.accepted[model] = new_price
          else
            outcome.accepted[model] = new_price
          end
        end

        outcome
      end

      private

      # Classifies a single price as [:ok | :flagged | :rejected, reason-or-nil].
      def validate(new_price:, old_price:)
        # A "_validator_override" entry on the existing registry record can opt
        # a model out of the relative-change check (e.g. a known repricing).
        overrides = Array(normalize_entry(old_price)["_validator_override"])

        if new_price.input > MAX_INPUT_PER_MILLION
          [:rejected, "input > $#{MAX_INPUT_PER_MILLION}/1M"]
        elsif new_price.output > MAX_OUTPUT_PER_MILLION
          [:rejected, "output > $#{MAX_OUTPUT_PER_MILLION}/1M"]
        elsif overrides.include?("skip_relative_change")
          [:ok, nil]
        elsif old_price.any? && changed_too_much?(old_price, new_price)
          [:flagged, "price changed >#{MAX_RELATIVE_CHANGE}x"]
        else
          [:ok, nil]
        end
      end

      # True when input or output moved by more than MAX_RELATIVE_CHANGE in
      # either direction; zero values on either side are not comparable.
      def changed_too_much?(old_price, new_price)
        %i[input output].any? do |attribute|
          previous = old_price[attribute.to_s].to_f
          current = new_price.public_send(attribute).to_f
          next false if previous.zero? || current.zero?

          [current / previous, previous / current].max > MAX_RELATIVE_CHANGE
        end
      end

      # Coerces a registry entry (or nil) into a string-keyed hash.
      def normalize_entry(entry)
        (entry || {}).transform_keys(&:to_s)
      end
    end
  end
end