RubyGems - ragdoll - Versions diffs - 0.1.11 → 0.1.12 - Mend

ragdoll 0.1.11 → 0.1.12

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16) hide show

checksums.yaml +4 -4
data/README.md +323 -384
data/app/models/ragdoll/document.rb +1 -1
data/app/models/ragdoll/unified_content.rb +216 -0
data/app/models/ragdoll/unified_document.rb +338 -0
data/app/services/ragdoll/audio_to_text_service.rb +200 -0
data/app/services/ragdoll/document_converter.rb +216 -0
data/app/services/ragdoll/document_processor.rb +197 -331
data/app/services/ragdoll/image_to_text_service.rb +322 -0
data/app/services/ragdoll/migration_service.rb +340 -0
data/app/services/ragdoll/text_extraction_service.rb +422 -0
data/app/services/ragdoll/unified_document_management.rb +300 -0
data/db/migrate/20250923000001_create_ragdoll_unified_contents.rb +87 -0
data/lib/ragdoll/core/version.rb +1 -1
data/lib/ragdoll/core.rb +7 -0
metadata +11 -2

data/app/services/ragdoll/image_to_text_service.rb ADDED Viewed

@@ -0,0 +1,322 @@
+# frozen_string_literal: true
+require "ruby_llm"
+require "base64"
+require "rmagick"
+module Ragdoll
+  class ImageToTextService
+    # Service-specific error type. Nothing in the code shown here raises it.
+    class DescriptionError < StandardError; end
+    # Default keyword options for the primary chat model; also merged with the
+    # caller's extra options in #initialize to pick the detail level.
+    DEFAULT_OPTIONS = {
+      model: "gemma3",
+      provider: :ollama,
+      assume_model_exists: true,
+      temperature: 0.2,
+      detail_level: :comprehensive
+    }.freeze
+    # Default keyword options for the fallback chat model, which #convert tries
+    # when the primary model yields no description.
+    DEFAULT_FALLBACK_OPTIONS = {
+      model: "smollm2",
+      provider: :ollama,
+      assume_model_exists: true,
+      temperature: 0.4
+    }.freeze
+    # Base instruction text per detail level; consumed by #build_prompt.
+    DETAIL_LEVELS = {
+      minimal: "Provide a brief, one-sentence description of the image.",
+      standard: "Describe the main elements, objects, and overall composition of the image.",
+      comprehensive: "Provide a detailed description including objects, people, settings, colors, mood, style, and any text visible in the image.",
+      analytical: "Analyze the image thoroughly, describing composition, lighting, subjects, background, context, and any symbolic or artistic elements."
+    }.freeze
+    def self.convert(file_path, **options)
+      new(**options).convert(file_path)
+    end
+    def initialize(primary: DEFAULT_OPTIONS, fallback: DEFAULT_FALLBACK_OPTIONS, **options)
+      @options = DEFAULT_OPTIONS.merge(options)
+      @detail_level = @options[:detail_level] || :comprehensive
+      configure_ruby_llm_globally
+      # Setup primary model
+      primary_opts = primary.dup
+      primary_temp = primary_opts.delete(:temperature) || 0.2
+      @primary_prompt = build_prompt(@detail_level)
+      begin
+        @primary = RubyLLM.chat(**primary_opts).with_temperature(primary_temp)
+      rescue StandardError => e
+        puts "❌ ImageToTextService: Primary model creation failed: #{e.message}"
+        @primary = nil
+      end
+      # Setup fallback model
+      fallback_opts = fallback.dup
+      fallback_temp = fallback_opts.delete(:temperature) || 0.4
+      begin
+        @fallback = RubyLLM.chat(**fallback_opts).with_temperature(fallback_temp)
+      rescue StandardError => e
+        puts "❌ ImageToTextService: Fallback model creation failed: #{e.message}"
+        @fallback = nil
+      end
+      if @primary.nil? && @fallback.nil?
+        puts "⚠️  ImageToTextService: WARNING - No models available! Service will return metadata-based descriptions only."
+      end
+    end
+    def convert(file_path)
+      return "" unless File.exist?(file_path)
+      return "" unless image_file?(file_path)
+      start_time = Time.now
+      @image_path = file_path
+      # Try to read image and prepare data
+      begin
+        @image = Magick::Image.read(@image_path).first
+        image_data = prepare_image_data
+        return generate_fallback_description unless image_data
+      rescue StandardError => e
+        puts "❌ ImageToTextService: Failed to read image: #{e.message}"
+        return generate_fallback_description
+      end
+      # Attempt vision model description
+      if @primary
+        description = attempt_vision_description(image_data)
+        if description && !description.empty?
+          elapsed = Time.now - start_time
+          puts "✅ ImageToTextService: Vision description generated (#{elapsed.round(2)}s)"
+          return description
+        end
+      end
+      # Attempt fallback model with metadata
+      if @fallback
+        description = attempt_fallback_description
+        if description && !description.empty?
+          elapsed = Time.now - start_time
+          puts "✅ ImageToTextService: Fallback description generated (#{elapsed.round(2)}s)"
+          return description
+        end
+      end
+      # Final fallback to metadata-based description
+      elapsed = Time.now - start_time
+      puts "🔚 ImageToTextService: Using metadata-based description (#{elapsed.round(2)}s)"
+      generate_fallback_description
+    end
+    def supported_formats
+      %w[.jpg .jpeg .png .gif .bmp .webp .svg .ico .tiff .tif]
+    end
+    private
+    # Applies provider credentials and endpoints to RubyLLM's configuration.
+    #
+    # Any StandardError raised here is logged and swallowed, so construction of
+    # the service continues.
+    #
+    # NOTE(review): this is called from #initialize and assigns every setting
+    # unconditionally (nil when the environment variable is unset), so values
+    # configured elsewhere on RubyLLM would be overwritten — confirm this is intended.
+    def configure_ruby_llm_globally
+      # Get Ragdoll configuration or use defaults
+      ragdoll_config = begin
+        Ragdoll.configuration
+      rescue StandardError
+        nil
+      end
+      # Endpoint precedence: Ragdoll config, then OLLAMA_API_BASE, then
+      # OLLAMA_ENDPOINT, then the localhost default.
+      ollama_endpoint = ragdoll_config&.ruby_llm_config&.dig(:ollama, :endpoint) ||
+                       ENV.fetch("OLLAMA_API_BASE", ENV.fetch("OLLAMA_ENDPOINT", "http://localhost:11434"))
+      RubyLLM.configure do |config|
+        config.openai_api_key         = ENV.fetch("OPENAI_API_KEY", nil)
+        config.openai_organization_id = ENV.fetch("OPENAI_ORGANIZATION_ID", nil)
+        config.openai_project_id      = ENV.fetch("OPENAI_PROJECT_ID", nil)
+        config.anthropic_api_key      = ENV.fetch("ANTHROPIC_API_KEY", nil)
+        config.gemini_api_key         = ENV.fetch("GEMINI_API_KEY", nil)
+        config.deepseek_api_key       = ENV.fetch("DEEPSEEK_API_KEY", nil)
+        config.openrouter_api_key     = ENV.fetch("OPENROUTER_API_KEY", nil)
+        config.bedrock_api_key        = ENV.fetch("BEDROCK_ACCESS_KEY_ID", nil)
+        config.bedrock_secret_key     = ENV.fetch("BEDROCK_SECRET_ACCESS_KEY", nil)
+        config.bedrock_region         = ENV.fetch("BEDROCK_REGION", nil)
+        config.bedrock_session_token  = ENV.fetch("BEDROCK_SESSION_TOKEN", nil)
+        config.ollama_api_base        = ollama_endpoint
+        config.openai_api_base        = ENV.fetch("OPENAI_API_BASE", nil)
+        config.log_level              = :error
+      end
+    rescue StandardError => e
+      puts "❌ ImageToTextService: Failed to configure RubyLLM: #{e.message}"
+    end
+    def build_prompt(detail_level)
+      base_instruction = DETAIL_LEVELS[detail_level] || DETAIL_LEVELS[:comprehensive]
+      case detail_level
+      when :analytical
+        <<~PROMPT
+          #{base_instruction}
+          Please organize your analysis into these sections:
+          1. Visual Elements: Objects, people, animals, and their relationships
+          2. Setting & Environment: Location, time of day, weather, atmosphere
+          3. Technical Aspects: Lighting, composition, colors, perspective
+          4. Text & Symbols: Any visible text, signs, logos, or symbolic elements
+          5. Context & Meaning: Possible purpose, story, or message conveyed
+          Provide a thorough but concise analysis suitable for search and retrieval.
+        PROMPT
+      when :comprehensive
+        <<~PROMPT
+          #{base_instruction}
+          Include details about:
+          - Main subjects and their actions or poses
+          - Setting, background, and environment
+          - Colors, lighting, and mood
+          - Any text, signs, or readable elements
+          - Style or artistic elements
+          - Objects and their relationships
+          Write in a natural, descriptive style that would help someone understand the image content for search purposes.
+        PROMPT
+      else
+        base_instruction
+      end
+    end
+    def attempt_vision_description(image_data)
+      begin
+        @primary.add_message(
+          role: "user",
+          content: [
+            { type: "text", text: @primary_prompt },
+            { type: "image_url", image_url: { url: "data:#{@image.mime_type};base64,#{image_data}" } }
+          ]
+        )
+        response = @primary.complete
+        description = extract_description(response)
+        clean_description(description)
+      rescue StandardError => e
+        puts "❌ ImageToTextService: Vision model failed: #{e.message}"
+        nil
+      end
+    end
+    def attempt_fallback_description
+      begin
+        prompt = build_fallback_prompt
+        response = @fallback.ask(prompt).content
+        clean_description(response)
+      rescue StandardError => e
+        puts "❌ ImageToTextService: Fallback model failed: #{e.message}"
+        nil
+      end
+    end
+    # Builds the prompt for the fallback model, which does not receive the
+    # image itself: it interpolates the path, filename, dimensions, MIME type,
+    # file size, colour count and aspect-ratio label read from @image.
+    #
+    # Expects @image and @image_path to be set (done in #convert).
+    #
+    # @return [String]
+    def build_fallback_prompt
+      <<~PROMPT
+        Based on the image file information below, generate a descriptive analysis of what this image likely contains:
+        **File Information:**
+        - Path: #{@image_path}
+        - Filename: #{File.basename(@image_path)}
+        - Dimensions: #{@image.columns}x#{@image.rows} pixels
+        - Format: #{@image.mime_type}
+        - File Size: #{@image.filesize} bytes
+        - Colors: #{@image.number_colors} unique colors
+        **Analysis Request:**
+        Consider the filename, aspect ratio (#{aspect_ratio_description}), file format, and size to make educated guesses about:
+        1. What type of image this might be (photo, diagram, artwork, screenshot, etc.)
+        2. Possible subject matter based on filename and characteristics
+        3. Likely content based on image properties
+        Provide a thoughtful description that could be useful for search and categorization, even without seeing the actual image content.
+      PROMPT
+    end
+    def image_file?(file_path)
+      extension = File.extname(file_path).downcase
+      supported_formats.include?(extension)
+    end
+    def prepare_image_data
+      Base64.strict_encode64(File.binread(@image_path))
+    rescue StandardError
+      nil
+    end
+    def extract_description(response)
+      if response.respond_to?(:content)
+        response.content
+      elsif response.is_a?(Hash) && response.dig("choices", 0, "message", "content")
+        response["choices"][0]["message"]["content"]
+      else
+        nil
+      end
+    end
+    def clean_description(description)
+      return nil unless description.is_a?(String)
+      cleaned = description
+                .strip
+                .sub(/\ADescription:?:?\s*/i, "")
+                .sub(/\AImage:?\s*/i, "")
+                .gsub(/\s+/, " ")
+                .gsub(@image_path, File.basename(@image_path))
+                .strip
+      # Ensure it ends with punctuation
+      cleaned << "." unless cleaned =~ /[.!?]\z/
+      cleaned
+    end
+    def generate_fallback_description
+      filename = File.basename(@image_path, File.extname(@image_path))
+      # Try to extract meaningful information from filename
+      descriptive_parts = filename
+                         .gsub(/[-_]+/, ' ')
+                         .gsub(/([a-z])([A-Z])/, '\1 \2')
+                         .split(' ')
+                         .reject { |part| part.match?(/^\d+$/) }  # Remove pure numbers
+                         .map(&:capitalize)
+      if descriptive_parts.any?
+        base_description = "Image: #{descriptive_parts.join(' ')}"
+      else
+        base_description = "Image file: #{File.basename(@image_path)}"
+      end
+      # Add technical details if available
+      if @image
+        details = []
+        details << "#{@image.columns}x#{@image.rows}"
+        details << aspect_ratio_description
+        details << File.extname(@image_path).upcase.sub('.', '') + " format"
+        "#{base_description} (#{details.join(', ')})"
+      else
+        base_description
+      end
+    end
+    def aspect_ratio_description
+      return "unknown aspect ratio" unless @image
+      ratio = @image.columns.to_f / @image.rows.to_f
+      case ratio
+      when 0.9..1.1 then "square"
+      when 1.1..1.5 then "landscape"
+      when 1.5..2.0 then "wide landscape"
+      when 2.0..Float::INFINITY then "panoramic"
+      when 0.5..0.9 then "portrait"
+      when 0.0..0.5 then "tall portrait"
+      else "unusual aspect ratio"
+      end
+    end
+  end
+end

data/app/services/ragdoll/migration_service.rb ADDED Viewed

@@ -0,0 +1,340 @@
+# frozen_string_literal: true
+module Ragdoll
+  # Migration service to transition from multi-modal to unified text-based RAG system
+  class MigrationService
+    class MigrationError < StandardError; end
+    def self.migrate_all_documents(**options)
+      new.migrate_all_documents(**options)
+    end
+    def self.migrate_document(document_id, **options)
+      new.migrate_document(document_id, **options)
+    end
+    # Instantiates the collaborators held by this service.
+    def initialize
+      # Used by #extract_unified_text_from_document to regenerate text from the source file.
+      @converter = Ragdoll::DocumentConverter.new
+      # Not referenced by any method shown in this file.
+      @unified_management = Ragdoll::UnifiedDocumentManagement.new
+    end
+    # Migrate all existing documents to unified text-based system
+    def migrate_all_documents(**options)
+      return { error: "UnifiedDocument model not available" } unless defined?(Ragdoll::UnifiedDocument)
+      migration_stats = {
+        started_at: Time.current,
+        total_documents: 0,
+        migrated: 0,
+        skipped: 0,
+        errors: []
+      }
+      puts "🚀 Starting migration from multi-modal to unified text-based system..."
+      # Get all existing documents
+      Ragdoll::Document.find_each(batch_size: options[:batch_size] || 50) do |document|
+        migration_stats[:total_documents] += 1
+        begin
+          result = migrate_single_document(document, **options)
+          if result[:status] == :migrated
+            migration_stats[:migrated] += 1
+          else
+            migration_stats[:skipped] += 1
+          end
+        rescue StandardError => e
+          migration_stats[:errors] << {
+            document_id: document.id,
+            title: document.title,
+            error: e.message
+          }
+          puts "❌ Error migrating document #{document.id}: #{e.message}"
+        end
+        # Progress reporting
+        if migration_stats[:total_documents] % 10 == 0
+          puts "📊 Progress: #{migration_stats[:migrated]} migrated, #{migration_stats[:skipped]} skipped, #{migration_stats[:errors].length} errors"
+        end
+      end
+      migration_stats[:completed_at] = Time.current
+      migration_stats[:duration] = migration_stats[:completed_at] - migration_stats[:started_at]
+      puts "✅ Migration completed!"
+      puts "📊 Final stats: #{migration_stats[:migrated]} migrated, #{migration_stats[:skipped]} skipped, #{migration_stats[:errors].length} errors"
+      puts "⏱️  Duration: #{migration_stats[:duration].round(2)} seconds"
+      migration_stats
+    end
+    # Migrate a specific document
+    def migrate_document(document_id, **options)
+      document = Ragdoll::Document.find(document_id)
+      migrate_single_document(document, **options)
+    end
+    # Create comparison report between old and new systems
+    def create_comparison_report
+      return { error: "UnifiedDocument model not available" } unless defined?(Ragdoll::UnifiedDocument)
+      old_stats = Ragdoll::Document.stats
+      new_stats = Ragdoll::UnifiedDocument.stats
+      content_stats = Ragdoll::UnifiedContent.stats
+      {
+        migration_summary: {
+          old_system: {
+            total_documents: old_stats[:total_documents],
+            text_contents: old_stats[:total_text_contents],
+            image_contents: old_stats[:total_image_contents],
+            audio_contents: old_stats[:total_audio_contents],
+            total_embeddings: old_stats[:total_embeddings]
+          },
+          new_system: {
+            total_documents: new_stats[:total_documents],
+            unified_contents: content_stats[:total_contents],
+            total_embeddings: new_stats[:total_embeddings],
+            by_media_type: content_stats[:by_media_type]
+          }
+        },
+        benefits: {
+          simplified_architecture: "Single content model instead of STI",
+          unified_search: "All content searchable through text",
+          cross_modal_retrieval: "Images and audio searchable via descriptions/transcripts",
+          reduced_complexity: "One embedding pipeline instead of multiple"
+        },
+        recommendations: generate_migration_recommendations
+      }
+    end
+    # Runs three integrity checks on the migrated data and prints each result:
+    # matching document counts, no unified document without content, and at
+    # least 50% of contents rated high quality by #content_quality_report.
+    #
+    # @return [Hash] +:total_checks+, +:passed+, +:failed+, +:issues+ and
+    #   +:quality_report+, or an +:error+ hash when Ragdoll::UnifiedDocument
+    #   is not defined
+    def validate_migration
+      return { error: "UnifiedDocument model not available" } unless defined?(Ragdoll::UnifiedDocument)
+      validation_results = {
+        total_checks: 0,
+        passed: 0,
+        failed: 0,
+        issues: []
+      }
+      puts "🔍 Validating migration integrity..."
+      # Check 1: All documents have corresponding unified documents
+      validation_results[:total_checks] += 1
+      old_count = Ragdoll::Document.count
+      new_count = Ragdoll::UnifiedDocument.count
+      if old_count == new_count
+        validation_results[:passed] += 1
+        puts "✅ Document count matches: #{old_count} = #{new_count}"
+      else
+        validation_results[:failed] += 1
+        validation_results[:issues] << "Document count mismatch: #{old_count} old vs #{new_count} new"
+        puts "❌ Document count mismatch: #{old_count} old vs #{new_count} new"
+      end
+      # Check 2: All unified documents have content
+      validation_results[:total_checks] += 1
+      documents_without_content = Ragdoll::UnifiedDocument.without_content.count
+      if documents_without_content == 0
+        validation_results[:passed] += 1
+        puts "✅ All unified documents have content"
+      else
+        validation_results[:failed] += 1
+        validation_results[:issues] << "#{documents_without_content} documents without content"
+        puts "❌ #{documents_without_content} documents without content"
+      end
+      # Check 3: Content quality assessment
+      validation_results[:total_checks] += 1
+      quality_stats = content_quality_report
+      high_quality_percentage = quality_stats[:high_quality_percentage]
+      if high_quality_percentage.nil?
+        # The report has no percentages when there is no content to analyse or
+        # the content model is missing; comparing nil with 50 used to raise
+        # NoMethodError here.
+        reason = quality_stats[:error] || "no quality data available"
+        validation_results[:failed] += 1
+        validation_results[:issues] << "Content quality could not be assessed: #{reason}"
+        puts "⚠️  Content quality could not be assessed: #{reason}"
+      elsif high_quality_percentage >= 50
+        validation_results[:passed] += 1
+        puts "✅ Content quality acceptable: #{high_quality_percentage}% high quality"
+      else
+        validation_results[:failed] += 1
+        validation_results[:issues] << "Low content quality: only #{high_quality_percentage}% high quality"
+        puts "⚠️  Content quality concern: only #{high_quality_percentage}% high quality"
+      end
+      validation_results[:quality_report] = quality_stats
+      validation_results
+    end
+    private
+    def migrate_single_document(document, **options)
+      # Skip if already migrated (check by location)
+      if defined?(Ragdoll::UnifiedDocument) &&
+         Ragdoll::UnifiedDocument.exists?(location: document.location)
+        return { status: :skipped, reason: "already_migrated" }
+      end
+      # Extract unified text content from multi-modal document
+      unified_text = extract_unified_text_from_document(document)
+      if unified_text.blank?
+        return { status: :skipped, reason: "no_content" }
+      end
+      # Create unified document
+      unified_doc = Ragdoll::UnifiedDocument.create!(
+        location: document.location,
+        title: document.title,
+        document_type: document.document_type,
+        status: "pending",
+        file_modified_at: document.file_modified_at,
+        metadata: merge_document_metadata(document)
+      )
+      # Create unified content
+      unified_doc.unified_contents.create!(
+        content: unified_text,
+        original_media_type: determine_primary_media_type(document),
+        embedding_model: "text-embedding-3-large",
+        metadata: {
+          "migrated_at" => Time.current,
+          "migration_source" => "multi_modal_document",
+          "original_document_id" => document.id,
+          "conversion_method" => "migration_consolidation"
+        }
+      )
+      # Process the unified document if requested
+      if options[:process_embeddings]
+        unified_doc.process_document!
+      else
+        unified_doc.update!(status: "processed")
+      end
+      puts "✅ Migrated: #{document.title}"
+      { status: :migrated, unified_document: unified_doc }
+    rescue StandardError => e
+      puts "❌ Failed to migrate #{document.title}: #{e.message}"
+      raise MigrationError, "Migration failed for document #{document.id}: #{e.message}"
+    end
+    def extract_unified_text_from_document(document)
+      text_parts = []
+      # Collect text from all content types
+      if document.respond_to?(:text_contents)
+        document.text_contents.each do |tc|
+          text_parts << tc.content if tc.content.present?
+        end
+      end
+      if document.respond_to?(:image_contents)
+        document.image_contents.each do |ic|
+          text_parts << ic.description if ic.description.present?
+        end
+      end
+      if document.respond_to?(:audio_contents)
+        document.audio_contents.each do |ac|
+          text_parts << ac.transcript if ac.transcript.present?
+        end
+      end
+      # Fallback to document content field
+      if text_parts.empty? && document.content.present?
+        text_parts << document.content
+      end
+      # Join all text parts
+      unified_text = text_parts.compact.reject(&:empty?).join("\n\n")
+      # If still no content, try to regenerate from file
+      if unified_text.blank? && File.exist?(document.location)
+        begin
+          unified_text = @converter.convert_to_text(document.location, document.document_type)
+        rescue StandardError => e
+          puts "Warning: Could not regenerate content for #{document.location}: #{e.message}"
+        end
+      end
+      unified_text
+    end
+    def determine_primary_media_type(document)
+      # Determine the primary media type based on document structure
+      if document.respond_to?(:content_types)
+        content_types = document.content_types
+        return content_types.first if content_types.any?
+      end
+      # Fallback to document type
+      case document.document_type
+      when "text", "markdown", "html", "pdf", "docx"
+        "text"
+      when "image"
+        "image"
+      when "audio"
+        "audio"
+      else
+        "text"
+      end
+    end
+    def merge_document_metadata(document)
+      base_metadata = document.metadata || {}
+      # Add migration tracking
+      base_metadata.merge(
+        "migrated_from_multi_modal" => true,
+        "migration_timestamp" => Time.current,
+        "original_system" => "multi_modal_sti"
+      )
+    end
+    def content_quality_report
+      return {} unless defined?(Ragdoll::UnifiedContent)
+      total_contents = Ragdoll::UnifiedContent.count
+      return { error: "No content to analyze" } if total_contents == 0
+      high_quality = Ragdoll::UnifiedContent.where("LENGTH(content) > 100").count
+      medium_quality = Ragdoll::UnifiedContent.where("LENGTH(content) BETWEEN 50 AND 100").count
+      low_quality = Ragdoll::UnifiedContent.where("LENGTH(content) < 50").count
+      {
+        total_contents: total_contents,
+        high_quality: high_quality,
+        medium_quality: medium_quality,
+        low_quality: low_quality,
+        high_quality_percentage: (high_quality.to_f / total_contents * 100).round(1),
+        medium_quality_percentage: (medium_quality.to_f / total_contents * 100).round(1),
+        low_quality_percentage: (low_quality.to_f / total_contents * 100).round(1)
+      }
+    end
+    def generate_migration_recommendations
+      recommendations = []
+      # Check if UnifiedDocument is available
+      if defined?(Ragdoll::UnifiedDocument)
+        quality_report = content_quality_report
+        if quality_report[:low_quality_percentage] && quality_report[:low_quality_percentage] > 20
+          recommendations << "Consider reprocessing low-quality content with enhanced conversion settings"
+        end
+        if quality_report[:total_contents] && quality_report[:total_contents] > 0
+          recommendations << "Review content quality scores and adjust conversion parameters as needed"
+        end
+      else
+        recommendations << "Enable UnifiedDocument and UnifiedContent models to start migration"
+      end
+      recommendations << "Test search functionality with unified text-based approach"
+      recommendations << "Monitor embedding generation performance with single model"
+      recommendations << "Consider archiving old multi-modal content tables after validation"
+      recommendations
+    end
+  end
+end