fractor 0.1.0 → 0.1.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,150 @@
1
+ # frozen_string_literal: true
2
+
3
+ require_relative "../../lib/fractor"
4
+ require "digest/sha2" # Using SHA2 which is more Ractor-compatible
5
+
6
+ module HierarchicalHasher
7
# Work item describing one slice of the input file: the raw bytes,
# the byte offset where the slice begins, and its length.
class ChunkWork < Fractor::Work
  # data:   raw chunk bytes
  # start:  byte offset of this chunk within the file (default 0)
  # length: chunk size in bytes; defaults to the data's own bytesize
  def initialize(data, start = 0, length = nil)
    payload = {
      data: data,
      start: start,
      length: length || data.bytesize
    }
    super(payload)
  end

  # Raw chunk bytes.
  def data
    input[:data]
  end

  # Byte offset of the chunk within the source file.
  def start
    input[:start]
  end

  # Chunk size in bytes.
  def length
    input[:length]
  end

  def to_s
    "ChunkWork: start=#{start}, length=#{length}, data_size=#{data.bytesize}"
  end
end
33
+
34
# Worker that computes a SHA-256 digest for a single file chunk.
class HashWorker < Fractor::Worker
  # Hashes the chunk carried by +work+ and returns a Fractor::WorkResult:
  # a success result holding {start:, length:, hash:}, or an error result
  # with a descriptive message when hashing fails.
  def process(work)
    # Simulate some processing time
    sleep(rand(0.01..0.05))

    # SHA2 is used because it is Ractor-compatible.
    begin
      digest = Digest::SHA256.hexdigest(work.data)

      Fractor::WorkResult.new(
        result: { start: work.start, length: work.length, hash: digest },
        work: work
      )
    rescue StandardError => e
      # Surface the failure as an error result rather than raising.
      Fractor::WorkResult.new(
        error: "Failed to hash chunk: #{e.message}",
        work: work
      )
    end
  end
end
62
+
63
# Coordinates hierarchical hashing of a file: splits it into chunks,
# hashes the chunks in parallel via a Fractor worker pool, then hashes
# the ordered chunk digests into one final SHA-256 value.
class FileHasher
  attr_reader :file_path, :chunk_size, :final_hash

  # file_path:    file to hash
  # chunk_size:   bytes per chunk (default 1024)
  # worker_count: parallel HashWorker instances (default 4)
  def initialize(file_path, chunk_size = 1024, worker_count = 4)
    @file_path = file_path
    @chunk_size = chunk_size
    @worker_count = worker_count
    @final_hash = nil
  end

  # Runs the full pipeline and returns the final hex digest
  # (also memoized in #final_hash). Returns nil for an empty file.
  def hash_file
    supervisor = Fractor::Supervisor.new(
      worker_pools: [
        { worker_class: HashWorker, num_workers: @worker_count }
      ]
    )

    load_file_chunks(supervisor)
    supervisor.run

    @final_hash = finalize_hash(supervisor.results)
  end

  private

  # Reads the file in binary mode and queues one ChunkWork per chunk.
  def load_file_chunks(supervisor)
    chunks = []
    offset = 0

    File.open(@file_path, "rb") do |io|
      while (piece = io.read(@chunk_size))
        chunks << ChunkWork.new(piece, offset, piece.length)
        offset += piece.length
      end
    end

    supervisor.add_work_items(chunks)
  end

  # Orders chunk results by byte offset, joins their hex digests with
  # newlines, and hashes the combined string with SHA-256.
  # Returns nil when no chunk results exist.
  def finalize_hash(results_aggregator)
    return nil if results_aggregator.results.empty?

    ordered = results_aggregator.results.sort_by { |r| r.result[:start] }
    combined = ordered.map { |r| r.result[:hash] }.join("\n")

    Digest::SHA256.hexdigest(combined)
  end
end
123
+ end
124
+
125
# CLI entry point: hash the file named on the command line.
if __FILE__ == $PROGRAM_NAME
  if ARGV.empty?
    puts "Usage: ruby hierarchical_hasher.rb <file_path> [worker_count]"
    exit 1
  end

  path = ARGV[0]
  workers = (ARGV[1] || 4).to_i

  unless File.exist?(path)
    puts "Error: File '#{path}' not found"
    exit 1
  end

  puts "Starting hierarchical hasher with #{workers} workers..."
  puts "Processing file: #{path}"

  started_at = Time.now
  digest = HierarchicalHasher::FileHasher.new(path, 1024, workers).hash_file
  finished_at = Time.now

  puts "Final SHA-256 hash: #{digest}"
  puts "Processing completed in #{finished_at - started_at} seconds"
end
@@ -0,0 +1,45 @@
1
+ = Multi-Work Type Example
2
+
3
+ == Overview
4
+
5
+ This example demonstrates how to handle multiple types of work items within a single Fractor supervisor. It shows how a single worker can process different work types intelligently, applying different strategies based on the work's type.
6
+
7
+ == Key Concepts
8
+
9
+ * *Multiple Work Types*: Supporting different work classes within the same system
10
+ * *Polymorphic Processing*: Workers that adapt their processing based on work type
11
+ * *Type Detection*: Identifying and handling different work types appropriately
12
+ * *Unified Workflow*: Managing diverse work through a common supervisor
13
+
14
+ == Example Explanation
15
+
16
+ This example implements a system that processes two distinct work types:
17
+
18
+ 1. *TextWork*: Handles text in various formats (plain text, Markdown, HTML, JSON)
19
+ 2. *ImageWork*: Processes image data with different dimensions and formats
20
+
21
+ A single worker type (`MultiFormatWorker`) is capable of handling both work types, adapting its processing strategies based on the work's class.
22
+
23
+ == Features Demonstrated
24
+
25
+ * Creating and using multiple work type classes
26
+ * Designing workers that can handle diverse work types
27
+ * Type-based processing logic
28
+ * Proper error handling across different work types
29
+ * Classification and reporting of heterogeneous results
30
+
31
+ == Running the Example
32
+
33
+ [source,sh]
34
+ ----
35
+ ruby examples/multi_work_type/multi_work_type.rb
36
+ ----
37
+
38
+ == Expected Output
39
+
40
+ The example will show:
41
+ * Processing of multiple work types
42
+ * Different processing strategies applied to each type
43
+ * Type-specific result formats
44
+ * Performance statistics for each work type
45
+ * Aggregated results organized by type
@@ -0,0 +1,319 @@
1
+ # frozen_string_literal: true
2
+
3
+ require_relative "../../lib/fractor"
4
+
5
+ module MultiWorkType
6
# Work type carrying a text payload together with its format
# (:plain, :markdown, :html, :json) and format-specific options.
class TextWork < Fractor::Work
  def initialize(data, format = :plain, options = {})
    super(data: data, format: format, options: options)
  end

  # The raw text payload.
  def data
    input.fetch(:data)
  end

  # Declared text format symbol.
  def format
    input.fetch(:format)
  end

  # Format-specific options hash (may be empty).
  def options
    input.fetch(:options)
  end

  def to_s
    "TextWork: format=#{format}, options=#{options}, data=#{data.to_s[0..30]}..."
  end
end
28
+
29
# Work type carrying (simulated) image data plus its pixel
# dimensions and format (:png, :jpeg, ...).
class ImageWork < Fractor::Work
  def initialize(data, dimensions = [0, 0], format = :png)
    super(data: data, dimensions: dimensions, format: format)
  end

  # The raw image payload.
  def data
    input.fetch(:data)
  end

  # [width, height] pair.
  def dimensions
    input.fetch(:dimensions)
  end

  # Image format symbol.
  def format
    input.fetch(:format)
  end

  def to_s
    "ImageWork: dimensions=#{dimensions.join("x")}, format=#{format}"
  end
end
51
+
52
# A single worker that can process both work types
class MultiFormatWorker < Fractor::Worker
  # Dispatches on the work item's class: TextWork and ImageWork are
  # handled; any other class yields an error WorkResult.
  def process(work)
    # Differentiate processing based on work class
    if work.is_a?(TextWork)
      process_text(work)
    elsif work.is_a?(ImageWork)
      process_image(work)
    else
      # Return error for unsupported work types
      # NOTE(review): here the error is a TypeError object, while the
      # text/image paths and other examples use String messages —
      # downstream only interpolates it, but confirm intent.
      error = TypeError.new("Unsupported work type: #{work.class}")
      Fractor::WorkResult.new(
        error: error,
        work: work
      )
    end
  end

  private

  # Transforms the text according to its declared format and wraps the
  # result (plus word/character counts) in a successful WorkResult.
  def process_text(work)
    # Process text based on format
    sleep(rand(0.01..0.05)) # Simulate processing time

    processed_text = case work.format
                     when :markdown then process_markdown(work.data, work.options)
                     when :html then process_html(work.data, work.options)
                     when :json then process_json(work.data, work.options)
                     else work.data.upcase # Simple transformation for plain text
                     end

    Fractor::WorkResult.new(
      result: {
        work_type: :text,
        original_format: work.format,
        transformed_data: processed_text,
        metadata: {
          word_count: processed_text.split(/\s+/).size,
          char_count: processed_text.length
        }
      },
      work: work
    )
  end

  # Simulates an image-processing pass (no real image library is used)
  # and reports pretend filters plus an 80%-of-original "compressed" size.
  def process_image(work)
    # Simulate image processing operations
    sleep(rand(0.03..0.1)) # Simulate processing time

    # Creating a safe copy of the data to avoid memory issues
    # Avoid calling methods directly on the input that might cause memory issues
    input_size = work.data.is_a?(String) ? work.data.size : 0

    # In a real implementation, this would use image processing libraries
    simulated_result = {
      work_type: :image,
      dimensions: work.dimensions,
      format: work.format,
      applied_filters: %i[sharpen contrast],
      processing_metadata: {
        original_size: input_size,
        processed_size: (input_size * 0.8).to_i # Simulate compression
      }
    }

    Fractor::WorkResult.new(
      result: simulated_result,
      work: work
    )
  end

  # Format-specific processing methods

  # Counts Markdown headers and links, then decorates headers in place.
  def process_markdown(text, _options)
    # Simulate Markdown processing
    headers = text.scan(/^#+\s+(.+)$/).flatten
    links = text.scan(/\[(.+?)\]\((.+?)\)/)

    "Processed Markdown: #{text.length} chars, #{headers.size} headers, #{links.size} links\n" \
      "Headers: #{headers.join(", ")}\n" \
      "#{text.gsub(/^#+\s+(.+)$/, '💫 \1 💫')}"
  end

  # Lists the element tags found and rewrites simple paired tags.
  def process_html(text, _options)
    # Simulate HTML processing
    tags = text.scan(/<(\w+)[^>]*>/).flatten

    "Processed HTML: #{text.length} chars, #{tags.size} tags\n" \
      "Tags: #{tags.uniq.join(", ")}\n" \
      "#{text.gsub(%r{<(\w+)[^>]*>(.+?)</\1>}, '✨\2✨')}"
  end

  # Evaluates the (Ruby-hash-literal, not actually JSON) payload and
  # reports its top-level keys; any failure returns an "Invalid JSON" line.
  #
  # SECURITY: `eval` executes arbitrary Ruby code from the work payload.
  # This is tolerable only because this example feeds itself hard-coded
  # strings; real/untrusted input must go through JSON.parse instead.
  def process_json(text, _options)
    # Simulate JSON processing

    data = text.nil? ? {} : eval(text) # WARNING: Using eval for demonstration only
    keys = data.keys

    "Processed JSON: #{keys.size} top-level keys\n" \
      "Keys: #{keys.join(", ")}\n" \
      "Pretty-printed: #{data}"
  rescue StandardError => e
    "Invalid JSON: #{e.message}"
  end
end
156
+
157
# Drives a MultiFormatWorker pool over a mixed batch of text and image
# work items and buckets the outcomes by type in #results.
class ContentProcessor
  attr_reader :results

  # Builds the supervisor with +worker_count+ MultiFormatWorkers and
  # empty result buckets (:text, :image, :errors).
  def initialize(worker_count = 4)
    @supervisor = Fractor::Supervisor.new(
      worker_pools: [
        { worker_class: MultiFormatWorker, num_workers: worker_count }
      ]
    )

    @results = { text: [], image: [], errors: [] }
  end

  # Queues both kinds of work (text first, then images), runs the pool,
  # classifies the outcomes, and returns a summary statistics hash.
  def process_mixed_content(text_items, image_items)
    enqueue_text(text_items)
    enqueue_images(image_items)

    # Process all work
    @supervisor.run

    # Separate results by work type
    classify_results(@supervisor.results)

    # Return the statistics
    {
      total_items: text_items.size + image_items.size,
      processed: {
        text: @results[:text].size,
        image: @results[:image].size
      },
      errors: @results[:errors].size,
      results: @results
    }
  end

  private

  # Wraps each item hash in a TextWork and queues it.
  def enqueue_text(items)
    works = items.map do |item|
      TextWork.new(item[:data], item[:format], item[:options] || {})
    end
    @supervisor.add_work_items(works)
  end

  # Wraps each item hash in an ImageWork (defaulting to :png) and queues it.
  def enqueue_images(items)
    works = items.map do |item|
      ImageWork.new(item[:data], item[:dimensions], item[:format] || :png)
    end
    @supervisor.add_work_items(works)
  end

  # Buckets successful results by work class, records errors, and prints
  # a short summary to stdout.
  def classify_results(results_aggregator)
    results_aggregator.results.each do |result|
      case result.work
      when TextWork then @results[:text] << result.result
      when ImageWork then @results[:image] << result.result
      end
    end

    results_aggregator.errors.each do |error_result|
      @results[:errors] << {
        error: error_result.error,
        work_type: error_result.work.class.name
      }
    end

    puts "Processed #{@results[:text].size} text items and #{@results[:image].size} image items"
    puts "Encountered #{@results[:errors].size} errors"
  end
end
231
+ end
232
+
233
# Example usage: run mixed text/image work through one worker pool.
#
# Fix: the compression percentage was computed as
# (1 - ratio).round(2) * 100, which rounds the *ratio* to two decimal
# places before scaling — quantizing the printed value to whole-percent
# steps (e.g. 19.96% printed as 20.0%). Scale to percent first, then
# round; also guard a zero original_size, which previously produced NaN.
if __FILE__ == $PROGRAM_NAME
  puts "Starting Multi-Work Type Processing Example"
  puts "=========================================="
  puts "This example demonstrates processing different types of work items:"
  puts "1. Text documents in various formats (plain, markdown, HTML, JSON)"
  puts "2. Image data with different formats and dimensions"
  puts "Both are processed by the same worker but with different strategies"
  puts

  # Sample text items
  text_items = [
    {
      data: "This is a plain text document. It has no special formatting.",
      format: :plain
    },
    {
      data: "# Markdown Document\n\nThis is a **bold** statement. Here's a [link](https://example.com).",
      format: :markdown
    },
    {
      data: "<html><body><h1>HTML Document</h1><p>This is a paragraph.</p></body></html>",
      format: :html
    },
    {
      data: "{name: 'Product', price: 29.99, tags: ['electronics', 'gadget']}",
      format: :json,
      options: { pretty: true }
    }
  ]

  # Sample image items (simulated)
  image_items = [
    {
      data: "simulated_jpeg_data_1",
      dimensions: [800, 600],
      format: :jpeg
    },
    {
      data: "simulated_png_data_1",
      dimensions: [1024, 768],
      format: :png
    },
    {
      data: "simulated_gif_data_1",
      dimensions: [320, 240],
      format: :gif
    }
  ]

  worker_count = 4
  puts "Processing with #{worker_count} workers..."
  puts

  start_time = Time.now
  processor = MultiWorkType::ContentProcessor.new(worker_count)
  result = processor.process_mixed_content(text_items, image_items)
  end_time = Time.now

  puts "Processing Results:"
  puts "-----------------"
  puts "Total items: #{result[:total_items]}"
  puts "Processed text items: #{result[:processed][:text]}"
  puts "Processed image items: #{result[:processed][:image]}"
  puts "Errors: #{result[:errors]}"
  puts

  puts "Text Processing Results:"
  result[:results][:text].each_with_index do |text_result, index|
    puts "Text Item #{index + 1} (#{text_result[:original_format]}):"
    puts "  #{text_result[:transformed_data].to_s.split("\n").first}"
    puts "  Word count: #{text_result[:metadata][:word_count]}"
    puts "  Character count: #{text_result[:metadata][:char_count]}"
    puts
  end

  puts "Image Processing Results:"
  result[:results][:image].each_with_index do |image_result, index|
    puts "Image Item #{index + 1} (#{image_result[:format]}):"
    puts "  Dimensions: #{image_result[:dimensions].join("x")}"
    puts "  Applied filters: #{image_result[:applied_filters].join(", ")}"

    original_size = image_result[:processing_metadata][:original_size]
    processed_size = image_result[:processing_metadata][:processed_size]
    # Scale to percent before rounding so fractional percentages survive;
    # report 0.0 for an empty original instead of dividing by zero.
    compression_pct =
      if original_size.zero?
        0.0
      else
        ((1 - processed_size.to_f / original_size) * 100).round(2)
      end
    puts "  Compression: #{compression_pct}%"
    puts
  end

  puts "Processing completed in #{end_time - start_time} seconds"
end
@@ -0,0 +1,44 @@
1
+ = Pipeline Processing Example
2
+
3
+ == Overview
4
+
5
+ This example demonstrates the Pipeline Processing pattern implemented with Fractor. In this pattern, data flows through a series of sequential processing stages, where the output of one stage becomes the input to the next.
6
+
7
+ == Key Concepts
8
+
9
+ * *Pipeline*: A series of connected processing stages
10
+ * *Data Flow*: Information passes through each stage in sequence
11
+ * *Transformation*: Each stage performs a specific operation on the data
12
+ * *Concurrency*: Multiple items can be at different stages of the pipeline simultaneously
13
+
14
+ == Example Explanation
15
+
16
+ This example processes data through a multi-stage pipeline:
17
+
18
+ 1. *Input Stage*: Raw data is prepared for processing
19
+ 2. *Processing Stages*: Data moves through a series of transformations
20
+ 3. *Output Stage*: Final results are collected and reported
21
+
22
+ Each stage of the pipeline can run concurrently on different workers, allowing for efficient parallel processing while maintaining the required order of operations.
23
+
24
+ == Features Demonstrated
25
+
26
+ * Sequential processing with dependencies between stages
27
+ * Concurrent execution of pipeline stages
28
+ * Processing optimizations through specialized workers
29
+ * Handling data flow between processing stages
30
+
31
+ == Running the Example
32
+
33
+ [source,sh]
34
+ ----
35
+ ruby examples/pipeline_processing/pipeline_processing.rb
36
+ ----
37
+
38
+ == Expected Output
39
+
40
+ The example will show:
41
+ * Data moving through each stage of the pipeline
42
+ * Workers processing different stages concurrently
43
+ * The transformation of data at each stage
44
+ * Final results after passing through the complete pipeline