dspy 0.6.3 → 0.8.0

This diff shows the content of publicly available package versions released to a supported registry. It is provided for informational purposes only and reflects the changes between those versions as published.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
  ---
  SHA256:
- metadata.gz: ae1673ad31bc71e2573800124ebb74ea807cd94a1c14b9b58f3de94b7f62363a
- data.tar.gz: f52d96924b536e5941ff34b45f1080ddb08dc9243095df51f11352cb65979ba1
+ metadata.gz: cc32a4fe2ec14d442c2a0603b69992528ab81c67c4e61ceed6a6d337278d0220
+ data.tar.gz: f901d0336e0a4c912dfb37428bdd0e359b74de35b340eb769edcb5e811e257fe
  SHA512:
- metadata.gz: 98f1d7b285f9342b8dfc82cdc7606d2a4c8cbdb1df86713b7176a389893f7c652e7c5df473ddcf42335ab37a2cfffe35e9519310b45be396c9bfe8847c7fabc1
- data.tar.gz: cbee70fb3afc5b5b7dce3caf2efbca258d5cbd12680f950fe52be30bd84754369b620c21617315c04a62e2f982fe485b0c05f7ed30676007c19527715c3fc9c0
+ metadata.gz: db9477a7f7900559bb7c362104d9921d79c12b84f18ccfe0e51006adafd6e478624d20a930184e9e3dfacf9d1c88321ef54b6688f89ddf627fa0ecef3da12c53
+ data.tar.gz: 5ef621dfd8a8ef83f2bf0d3eabb32b07ae881636fe4c1826fddc3e544d3b5193448ff96bd28f970046d499dca69d23affa42596d41315e8c3245c4e7db5be0b3
data/README.md CHANGED
@@ -25,6 +25,9 @@ The result? LLM applications that actually scale and don't break when you sneeze
  - **Basic Optimization** - Simple prompt optimization techniques

  **Production Features:**
+ - **Reliable JSON Extraction** - Automatic strategy selection for OpenAI structured outputs, Anthropic patterns, and fallback modes
+ - **Smart Retry Logic** - Progressive fallback with exponential backoff for handling transient failures
+ - **Performance Caching** - Schema and capability caching for faster repeated operations
  - **File-based Storage** - Basic optimization result persistence
  - **Multi-Platform Observability** - OpenTelemetry, New Relic, and Langfuse integration
  - **Basic Instrumentation** - Event tracking and logging
@@ -78,7 +81,9 @@ end

  # Configure DSPy with your LLM
  DSPy.configure do |c|
- c.lm = DSPy::LM.new('openai/gpt-4o-mini', api_key: ENV['OPENAI_API_KEY'])
+ c.lm = DSPy::LM.new('openai/gpt-4o-mini',
+ api_key: ENV['OPENAI_API_KEY'],
+ structured_outputs: true) # Enable OpenAI's native JSON mode
  end

  # Create the predictor and run inference
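
With `structured_outputs: true` and a supported model, the predictor call routes through OpenAI's native JSON mode instead of relying on prompt-only parsing. A minimal usage sketch following the README's quick-start shape; the `QuestionAnswer` signature here is illustrative, not part of the diff:

    class QuestionAnswer < DSPy::Signature
      description "Answer the question in one short sentence."

      input do
        const :question, String
      end

      output do
        const :answer, String
      end
    end

    qa = DSPy::Predict.new(QuestionAnswer)
    result = qa.call(question: "What is the capital of France?")
    puts result.answer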
@@ -14,9 +14,10 @@ module DSPy

  # Chat interface that all adapters must implement
  # @param messages [Array<Hash>] Array of message hashes with :role and :content
+ # @param signature [DSPy::Signature, nil] Optional signature for structured outputs
  # @param block [Proc] Optional streaming block
  # @return [DSPy::LM::Response] Normalized response
- def chat(messages:, &block)
+ def chat(messages:, signature: nil, &block)
  raise NotImplementedError, "Subclasses must implement #chat method"
  end

@@ -24,7 +25,12 @@ module DSPy

  def validate_configuration!
  raise ConfigurationError, "Model is required" if model.nil? || model.empty?
- raise ConfigurationError, "API key is required" if api_key.nil? || api_key.empty?
+ end
+
+ def validate_api_key!(api_key, provider)
+ if api_key.nil? || api_key.to_s.strip.empty?
+ raise MissingAPIKeyError.new(provider)
+ end
  end

  # Helper method to normalize message format
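
The Adapter base class now passes an optional signature into `#chat` and moves API-key checks into `validate_api_key!`. A sketch of what a custom adapter would implement against the new contract; `EchoAdapter` is hypothetical, and the `Response` keyword arguments are assumed to match the OpenAI adapter shown further down in this diff:

    module DSPy
      class LM
        # Hypothetical adapter, shown only to illustrate the new #chat contract.
        class EchoAdapter < Adapter
          def initialize(model:, api_key:)
            super
            validate_api_key!(api_key, 'echo')  # raises MissingAPIKeyError when nil or blank
          end

          # `signature` may be nil; adapters that cannot use it can simply ignore it.
          def chat(messages:, signature: nil, &block)
            last = normalize_messages(messages).last
            Response.new(
              content: "echo: #{last[:content]}",
              usage: {},
              metadata: { provider: 'echo', model: model }
            )
          end
        end
      end
    end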
@@ -14,12 +14,17 @@ module DSPy
  # Creates an adapter instance based on model_id
  # @param model_id [String] Full model identifier (e.g., "openai/gpt-4")
  # @param api_key [String] API key for the provider
+ # @param options [Hash] Additional adapter-specific options
  # @return [DSPy::LM::Adapter] Appropriate adapter instance
- def create(model_id, api_key:)
+ def create(model_id, api_key:, **options)
  provider, model = parse_model_id(model_id)
  adapter_class = get_adapter_class(provider)

- adapter_class.new(model: model, api_key: api_key)
+ # Pass provider-specific options
+ adapter_options = { model: model, api_key: api_key }
+ adapter_options.merge!(options) if provider == 'openai' # Only OpenAI accepts structured_outputs for now
+
+ adapter_class.new(**adapter_options)
  end

  private
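
The factory now forwards extra keyword options, but only to the OpenAI adapter; for other providers they are silently dropped rather than raised on. A sketch of the resulting behavior, assuming `DSPy::LM.new` passes unknown options through to this factory as in the README example above (the Anthropic model id is illustrative):

    # Reaches OpenAIAdapter#initialize with structured_outputs: true
    lm = DSPy::LM.new('openai/gpt-4o-mini',
                      api_key: ENV['OPENAI_API_KEY'],
                      structured_outputs: true)

    # The same option is dropped by the factory for non-OpenAI providers
    lm = DSPy::LM.new('anthropic/claude-3-haiku-20240307',
                      api_key: ENV['ANTHROPIC_API_KEY'],
                      structured_outputs: true)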
@@ -7,10 +7,11 @@ module DSPy
  class AnthropicAdapter < Adapter
  def initialize(model:, api_key:)
  super
+ validate_api_key!(api_key, 'anthropic')
  @client = Anthropic::Client.new(api_key: api_key)
  end

- def chat(messages:, &block)
+ def chat(messages:, signature: nil, **extra_params, &block)
  # Anthropic requires system message to be separate from messages
  system_message, user_messages = extract_system_message(normalize_messages(messages))

@@ -0,0 +1,269 @@
+ # frozen_string_literal: true
+
+ require "sorbet-runtime"
+ require_relative "../../cache_manager"
+
+ module DSPy
+ class LM
+ module Adapters
+ module OpenAI
+ # Converts DSPy signatures to OpenAI structured output format
+ class SchemaConverter
+ extend T::Sig
+
+ # Models that support structured outputs as of July 2025
+ STRUCTURED_OUTPUT_MODELS = T.let([
+ "gpt-4o-mini",
+ "gpt-4o-2024-08-06",
+ "gpt-4o",
+ "gpt-4-turbo",
+ "gpt-4-turbo-2024-04-09"
+ ].freeze, T::Array[String])
+
+ sig { params(signature_class: T.class_of(DSPy::Signature), name: T.nilable(String), strict: T::Boolean).returns(T::Hash[Symbol, T.untyped]) }
+ def self.to_openai_format(signature_class, name: nil, strict: true)
+ # Build cache params from the method parameters
+ cache_params = { strict: strict }
+ cache_params[:name] = name if name
+
+ # Check cache first
+ cache_manager = DSPy::LM.cache_manager
+ cached_schema = cache_manager.get_schema(signature_class, "openai", cache_params)
+
+ if cached_schema
+ DSPy.logger.debug("Using cached schema for #{signature_class.name}")
+ return cached_schema
+ end
+
+ # Get the output JSON schema from the signature class
+ output_schema = signature_class.output_json_schema
+
+ # Build the complete schema
+ dspy_schema = {
+ "$schema": "http://json-schema.org/draft-06/schema#",
+ type: "object",
+ properties: output_schema[:properties] || {},
+ required: output_schema[:required] || []
+ }
+
+ # Generate a schema name if not provided
+ schema_name = name || generate_schema_name(signature_class)
+
+ # Remove the $schema field as OpenAI doesn't use it
+ openai_schema = dspy_schema.except(:$schema)
+
+ # Add additionalProperties: false for strict mode
+ if strict
+ openai_schema = add_additional_properties_recursively(openai_schema)
+ end
+
+ # Wrap in OpenAI's required format
+ result = {
+ type: "json_schema",
+ json_schema: {
+ name: schema_name,
+ strict: strict,
+ schema: openai_schema
+ }
+ }
+
+ # Cache the result with same params
+ cache_manager.cache_schema(signature_class, "openai", result, cache_params)
+
+ result
+ end
+
+ sig { params(model: String).returns(T::Boolean) }
+ def self.supports_structured_outputs?(model)
+ # Check cache first
+ cache_manager = DSPy::LM.cache_manager
+ cached_result = cache_manager.get_capability(model, "structured_outputs")
+
+ if !cached_result.nil?
+ DSPy.logger.debug("Using cached capability check for #{model}")
+ return cached_result
+ end
+
+ # Extract base model name without provider prefix
+ base_model = model.sub(/^openai\//, "")
+
+ # Check if it's a supported model or a newer version
+ result = STRUCTURED_OUTPUT_MODELS.any? { |supported| base_model.start_with?(supported) }
+
+ # Cache the result
+ cache_manager.cache_capability(model, "structured_outputs", result)
+
+ result
+ end
+
+ sig { params(schema: T::Hash[Symbol, T.untyped]).returns(T::Array[String]) }
+ def self.validate_compatibility(schema)
+ issues = []
+
+ # Check for deeply nested objects (OpenAI has depth limits)
+ depth = calculate_depth(schema)
+ if depth > 5
+ issues << "Schema depth (#{depth}) exceeds recommended limit of 5 levels"
+ end
+
+ # Check for unsupported JSON Schema features
+ if contains_pattern_properties?(schema)
+ issues << "Pattern properties are not supported in OpenAI structured outputs"
+ end
+
+ if contains_conditional_schemas?(schema)
+ issues << "Conditional schemas (if/then/else) are not supported"
+ end
+
+ issues
+ end
+
+ private
+
+ sig { params(schema: T::Hash[Symbol, T.untyped]).returns(T::Hash[Symbol, T.untyped]) }
+ def self.add_additional_properties_recursively(schema)
+ return schema unless schema.is_a?(Hash)
+
+ result = schema.dup
+
+ # Add additionalProperties: false if this is an object
+ if result[:type] == "object"
+ result[:additionalProperties] = false
+ end
+
+ # Process properties recursively
+ if result[:properties].is_a?(Hash)
+ result[:properties] = result[:properties].transform_values do |prop|
+ if prop.is_a?(Hash)
+ processed = add_additional_properties_recursively(prop)
+ # Special handling for arrays - ensure their items have additionalProperties if they're objects
+ if processed[:type] == "array" && processed[:items].is_a?(Hash)
+ processed[:items] = add_additional_properties_recursively(processed[:items])
+ end
+ processed
+ else
+ prop
+ end
+ end
+ end
+
+ # Process array items
+ if result[:items].is_a?(Hash)
+ processed_items = add_additional_properties_recursively(result[:items])
+ # OpenAI requires additionalProperties on all objects, even in array items
+ if processed_items.is_a?(Hash) && processed_items[:type] == "object" && !processed_items.key?(:additionalProperties)
+ processed_items[:additionalProperties] = false
+ end
+ result[:items] = processed_items
+ elsif result[:items].is_a?(Array)
+ # Handle tuple validation
+ result[:items] = result[:items].map do |item|
+ processed = item.is_a?(Hash) ? add_additional_properties_recursively(item) : item
+ if processed.is_a?(Hash) && processed[:type] == "object" && !processed.key?(:additionalProperties)
+ processed[:additionalProperties] = false
+ end
+ processed
+ end
+ end
+
+ # Process oneOf/anyOf/allOf
+ [:oneOf, :anyOf, :allOf].each do |key|
+ if result[key].is_a?(Array)
+ result[key] = result[key].map do |sub_schema|
+ sub_schema.is_a?(Hash) ? add_additional_properties_recursively(sub_schema) : sub_schema
+ end
+ end
+ end
+
+ result
+ end
+
+ sig { params(signature_class: T.class_of(DSPy::Signature)).returns(String) }
+ def self.generate_schema_name(signature_class)
+ # Use the signature class name
+ class_name = signature_class.name&.split("::")&.last
+ if class_name
+ class_name.gsub(/[^a-zA-Z0-9_]/, "_").downcase
+ else
+ # Fallback to a generic name
+ "dspy_output_#{Time.now.to_i}"
+ end
+ end
+
+ sig { params(schema: T::Hash[Symbol, T.untyped], current_depth: Integer).returns(Integer) }
+ def self.calculate_depth(schema, current_depth = 0)
+ return current_depth unless schema.is_a?(Hash)
+
+ max_depth = current_depth
+
+ # Check properties
+ if schema[:properties].is_a?(Hash)
+ schema[:properties].each_value do |prop|
+ if prop.is_a?(Hash)
+ prop_depth = calculate_depth(prop, current_depth + 1)
+ max_depth = [max_depth, prop_depth].max
+ end
+ end
+ end
+
+ # Check array items
+ if schema[:items].is_a?(Hash)
+ items_depth = calculate_depth(schema[:items], current_depth + 1)
+ max_depth = [max_depth, items_depth].max
+ end
+
+ # Check oneOf/anyOf/allOf
+ [:oneOf, :anyOf, :allOf].each do |key|
+ if schema[key].is_a?(Array)
+ schema[key].each do |sub_schema|
+ if sub_schema.is_a?(Hash)
+ sub_depth = calculate_depth(sub_schema, current_depth + 1)
+ max_depth = [max_depth, sub_depth].max
+ end
+ end
+ end
+ end
+
+ max_depth
+ end
+
+ sig { params(schema: T::Hash[Symbol, T.untyped]).returns(T::Boolean) }
+ def self.contains_pattern_properties?(schema)
+ return true if schema[:patternProperties]
+
+ # Recursively check nested schemas
+ [:properties, :items, :oneOf, :anyOf, :allOf].each do |key|
+ value = schema[key]
+ case value
+ when Hash
+ return true if contains_pattern_properties?(value)
+ when Array
+ return true if value.any? { |v| v.is_a?(Hash) && contains_pattern_properties?(v) }
+ end
+ end
+
+ false
+ end
+
+ sig { params(schema: T::Hash[Symbol, T.untyped]).returns(T::Boolean) }
+ def self.contains_conditional_schemas?(schema)
+ return true if schema[:if] || schema[:then] || schema[:else]
+
+ # Recursively check nested schemas
+ [:properties, :items, :oneOf, :anyOf, :allOf].each do |key|
+ value = schema[key]
+ case value
+ when Hash
+ return true if contains_conditional_schemas?(value)
+ when Array
+ return true if value.any? { |v| v.is_a?(Hash) && contains_conditional_schemas?(v) }
+ end
+ end
+
+ false
+ end
+ end
+ end
+ end
+ end
+ end
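
In use, `to_openai_format` wraps a signature's output schema in OpenAI's `json_schema` envelope (caching the result), while `supports_structured_outputs?` prefix-matches against the model list above. A short sketch; the `Summarize` signature is illustrative:

    class Summarize < DSPy::Signature
      description "Summarize the input text."

      input do
        const :text, String
      end

      output do
        const :summary, String
      end
    end

    converter = DSPy::LM::Adapters::OpenAI::SchemaConverter

    format = converter.to_openai_format(Summarize)
    # => { type: "json_schema", json_schema: { name: "summarize", strict: true, schema: { ... } } }

    converter.supports_structured_outputs?("openai/gpt-4o-mini")    # => true (prefix match, result cached)
    converter.validate_compatibility(format[:json_schema][:schema]) # => [] when nothing is flagged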
@@ -1,22 +1,34 @@
  # frozen_string_literal: true

  require 'openai'
+ require_relative 'openai/schema_converter'

  module DSPy
  class LM
  class OpenAIAdapter < Adapter
- def initialize(model:, api_key:)
- super
+ def initialize(model:, api_key:, structured_outputs: false)
+ super(model: model, api_key: api_key)
+ validate_api_key!(api_key, 'openai')
  @client = OpenAI::Client.new(api_key: api_key)
+ @structured_outputs_enabled = structured_outputs
  end

- def chat(messages:, &block)
+ def chat(messages:, signature: nil, response_format: nil, &block)
  request_params = {
  model: model,
  messages: normalize_messages(messages),
  temperature: 0.0 # DSPy default for deterministic responses
  }

+ # Add response format if provided by strategy
+ if response_format
+ request_params[:response_format] = response_format
+ elsif @structured_outputs_enabled && signature && supports_structured_outputs?
+ # Legacy behavior for backward compatibility
+ response_format = DSPy::LM::Adapters::OpenAI::SchemaConverter.to_openai_format(signature)
+ request_params[:response_format] = response_format
+ end
+
  # Add streaming if block provided
  if block_given?
  request_params[:stream] = proc do |chunk, _bytesize|
@@ -31,9 +43,15 @@ module DSPy
  raise AdapterError, "OpenAI API error: #{response.error}"
  end

- content = response.choices.first.message.content
+ message = response.choices.first.message
+ content = message.content
  usage = response.usage

+ # Handle structured output refusals
+ if message.respond_to?(:refusal) && message.refusal
+ raise AdapterError, "OpenAI refused to generate output: #{message.refusal}"
+ end
+
  Response.new(
  content: content,
  usage: usage.respond_to?(:to_h) ? usage.to_h : usage,
@@ -41,13 +59,20 @@ module DSPy
  provider: 'openai',
  model: model,
  response_id: response.id,
- created: response.created
+ created: response.created,
+ structured_output: @structured_outputs_enabled && signature && supports_structured_outputs?
  }
  )
  rescue => e
  raise AdapterError, "OpenAI adapter error: #{e.message}"
  end
  end
+
+ private
+
+ def supports_structured_outputs?
+ DSPy::LM::Adapters::OpenAI::SchemaConverter.supports_structured_outputs?(model)
+ end
  end
  end
  end
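
The adapter prefers a `response_format` handed in by a strategy; failing that, it derives one from the signature when structured outputs are enabled and the model qualifies, and surfaces refusals as `AdapterError`. A hedged sketch of driving it directly (normally `DSPy::LM` does this; `Summarize` is the illustrative signature from the SchemaConverter sketch above):

    adapter = DSPy::LM::OpenAIAdapter.new(
      model: 'gpt-4o-mini',
      api_key: ENV['OPENAI_API_KEY'],
      structured_outputs: true
    )

    # No explicit response_format, so the adapter builds one from the signature
    response = adapter.chat(
      messages: [{ role: 'user', content: 'Summarize: Ruby is a dynamic language.' }],
      signature: Summarize
    )
    puts response.content  # JSON string matching Summarize's output schema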
@@ -0,0 +1,151 @@
+ # frozen_string_literal: true
+
+ require "sorbet-runtime"
+
+ module DSPy
+ class LM
+ # Manages caching for schemas and capability detection
+ class CacheManager
+ extend T::Sig
+
+ # Cache entry with TTL
+ class CacheEntry < T::Struct
+ extend T::Sig
+
+ const :value, T.untyped
+ const :expires_at, Time
+
+ sig { returns(T::Boolean) }
+ def expired?
+ Time.now > expires_at
+ end
+ end
+
+ DEFAULT_TTL = 3600 # 1 hour
+
+ sig { void }
+ def initialize
+ @schema_cache = {}
+ @capability_cache = {}
+ @mutex = Mutex.new
+ end
+
+ # Cache a schema for a signature class
+ sig { params(signature_class: T.class_of(DSPy::Signature), provider: String, schema: T.untyped, cache_params: T::Hash[Symbol, T.untyped]).void }
+ def cache_schema(signature_class, provider, schema, cache_params = {})
+ key = schema_key(signature_class, provider, cache_params)
+
+ @mutex.synchronize do
+ @schema_cache[key] = CacheEntry.new(
+ value: schema,
+ expires_at: Time.now + DEFAULT_TTL
+ )
+ end
+
+ DSPy.logger.debug("Cached schema for #{signature_class.name} (#{provider})")
+ end
+
+ # Get cached schema if available
+ sig { params(signature_class: T.class_of(DSPy::Signature), provider: String, cache_params: T::Hash[Symbol, T.untyped]).returns(T.nilable(T.untyped)) }
+ def get_schema(signature_class, provider, cache_params = {})
+ key = schema_key(signature_class, provider, cache_params)
+
+ @mutex.synchronize do
+ entry = @schema_cache[key]
+
+ if entry.nil?
+ nil
+ elsif entry.expired?
+ @schema_cache.delete(key)
+ nil
+ else
+ entry.value
+ end
+ end
+ end
+
+ # Cache capability detection result
+ sig { params(model: String, capability: String, result: T::Boolean).void }
+ def cache_capability(model, capability, result)
+ key = capability_key(model, capability)
+
+ @mutex.synchronize do
+ @capability_cache[key] = CacheEntry.new(
+ value: result,
+ expires_at: Time.now + DEFAULT_TTL * 24 # Capabilities change less frequently
+ )
+ end
+
+ DSPy.logger.debug("Cached capability #{capability} for #{model}: #{result}")
+ end
+
+ # Get cached capability if available
+ sig { params(model: String, capability: String).returns(T.nilable(T::Boolean)) }
+ def get_capability(model, capability)
+ key = capability_key(model, capability)
+
+ @mutex.synchronize do
+ entry = @capability_cache[key]
+
+ if entry.nil?
+ nil
+ elsif entry.expired?
+ @capability_cache.delete(key)
+ nil
+ else
+ entry.value
+ end
+ end
+ end
+
+ # Clear all caches
+ sig { void }
+ def clear!
+ @mutex.synchronize do
+ @schema_cache.clear
+ @capability_cache.clear
+ end
+
+ DSPy.logger.debug("Cleared all caches")
+ end
+
+ # Get cache statistics
+ sig { returns(T::Hash[Symbol, Integer]) }
+ def stats
+ @mutex.synchronize do
+ {
+ schema_entries: @schema_cache.size,
+ capability_entries: @capability_cache.size,
+ total_entries: @schema_cache.size + @capability_cache.size
+ }
+ end
+ end
+
+ private
+
+ sig { params(signature_class: T.class_of(DSPy::Signature), provider: String, cache_params: T::Hash[Symbol, T.untyped]).returns(String) }
+ def schema_key(signature_class, provider, cache_params = {})
+ params_str = cache_params.sort.map { |k, v| "#{k}:#{v}" }.join(":")
+ base_key = "schema:#{provider}:#{signature_class.name}"
+ params_str.empty? ? base_key : "#{base_key}:#{params_str}"
+ end
+
+ sig { params(model: String, capability: String).returns(String) }
+ def capability_key(model, capability)
+ "capability:#{model}:#{capability}"
+ end
+ end
+
+ # Global cache instance
+ @cache_manager = T.let(nil, T.nilable(CacheManager))
+
+ class << self
+ extend T::Sig
+
+ sig { returns(CacheManager) }
+ def cache_manager
+ @cache_manager ||= CacheManager.new
+ end
+ end
+ end
+ end
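
The cache is a process-wide singleton exposed as `DSPy::LM.cache_manager`, with a one-hour TTL for schemas and 24 hours for capability checks. A short sketch of inspecting it, grounded in the methods above:

    cache = DSPy::LM.cache_manager   # process-wide singleton

    cache.stats
    # => { schema_entries: 0, capability_entries: 0, total_entries: 0 } in a fresh process

    # Entries appear as a side effect of SchemaConverter lookups:
    DSPy::LM::Adapters::OpenAI::SchemaConverter.supports_structured_outputs?("gpt-4o")
    cache.get_capability("gpt-4o", "structured_outputs")   # => true until the 24-hour TTL lapses

    cache.clear!   # handy between test examples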
@@ -6,5 +6,18 @@ module DSPy
  class AdapterError < Error; end
  class UnsupportedProviderError < Error; end
  class ConfigurationError < Error; end
+
+ # Raised when API key is missing or invalid
+ class MissingAPIKeyError < Error
+ def initialize(provider)
+ env_var = case provider
+ when 'openai' then 'OPENAI_API_KEY'
+ when 'anthropic' then 'ANTHROPIC_API_KEY'
+ else "#{provider.upcase}_API_KEY"
+ end
+
+ super("API key is required but was not provided. Set it via the api_key parameter or #{env_var} environment variable.")
+ end
+ end
  end
  end
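
`MissingAPIKeyError` replaces the generic `ConfigurationError` for blank keys and names the environment variable to set. A rough sketch of catching it, assuming the adapter is built eagerly and the class lives in the same `DSPy::LM` namespace as the other error classes in this file:

    begin
      DSPy::LM.new('openai/gpt-4o-mini', api_key: '')
    rescue DSPy::LM::MissingAPIKeyError => e
      warn e.message
      # "API key is required but was not provided. Set it via the api_key parameter
      #  or OPENAI_API_KEY environment variable."
    end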