RubyGems - fractor - Versions diffs - 0.1.4 → 0.1.6 - Mend

fractor 0.1.4 → 0.1.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (33)

checksums.yaml +4 -4
data/.rubocop-https---raw-githubusercontent-com-riboseinc-oss-guides-main-ci-rubocop-yml +552 -0
data/.rubocop.yml +14 -8
data/.rubocop_todo.yml +162 -46
data/README.adoc +1364 -376
data/examples/auto_detection/auto_detection.rb +9 -9
data/examples/continuous_chat_common/message_protocol.rb +53 -0
data/examples/continuous_chat_fractor/README.adoc +217 -0
data/examples/continuous_chat_fractor/chat_client.rb +303 -0
data/examples/continuous_chat_fractor/chat_common.rb +83 -0
data/examples/continuous_chat_fractor/chat_server.rb +167 -0
data/examples/continuous_chat_fractor/simulate.rb +345 -0
data/examples/continuous_chat_server/README.adoc +135 -0
data/examples/continuous_chat_server/chat_client.rb +303 -0
data/examples/continuous_chat_server/chat_server.rb +359 -0
data/examples/continuous_chat_server/simulate.rb +343 -0
data/examples/hierarchical_hasher/hierarchical_hasher.rb +12 -8
data/examples/multi_work_type/multi_work_type.rb +30 -29
data/examples/pipeline_processing/pipeline_processing.rb +15 -15
data/examples/producer_subscriber/producer_subscriber.rb +20 -16
data/examples/scatter_gather/scatter_gather.rb +29 -28
data/examples/simple/sample.rb +5 -5
data/examples/specialized_workers/specialized_workers.rb +44 -37
data/lib/fractor/continuous_server.rb +188 -0
data/lib/fractor/result_aggregator.rb +1 -1
data/lib/fractor/supervisor.rb +277 -104
data/lib/fractor/version.rb +1 -1
data/lib/fractor/work_queue.rb +68 -0
data/lib/fractor/work_result.rb +1 -1
data/lib/fractor/worker.rb +2 -1
data/lib/fractor/wrapped_ractor.rb +12 -2
data/lib/fractor.rb +2 -0
metadata +15 -2

data/examples/hierarchical_hasher/hierarchical_hasher.rb CHANGED Viewed

@@ -10,7 +10,7 @@ module HierarchicalHasher
       super({
         data: data,
         start: start,
-        length: length || data.bytesize
+        length: length || data.bytesize,
       })
     end
@@ -46,15 +46,15 @@ module HierarchicalHasher
           result: {
             start: work.start,
             length: work.length,
-            hash: hash
+            hash: hash,
           },
-          work: work
+          work: work,
         )
       rescue StandardError => e
         # Return error result if something goes wrong
         Fractor::WorkResult.new(
           error: "Failed to hash chunk: #{e.message}",
-          work: work
+          work: work,
         )
       end
     end
@@ -74,8 +74,8 @@ module HierarchicalHasher
       # Create the supervisor with our worker class in a worker pool
       supervisor = Fractor::Supervisor.new(
         worker_pools: [
-          { worker_class: HashWorker, num_workers: @worker_count }
-        ]
+          { worker_class: HashWorker, num_workers: @worker_count },
+        ],
       )
       # Load the file and create work chunks
@@ -111,10 +111,14 @@ module HierarchicalHasher
       return nil if results_aggregator.results.empty?
       # Sort results by start position
-      sorted_results = results_aggregator.results.sort_by { |result| result.result[:start] }
+      sorted_results = results_aggregator.results.sort_by do |result|
+        result.result[:start]
+      end
       # Concatenate all hashes with newlines
-      combined_hash_string = sorted_results.map { |result| result.result[:hash] }.join("\n")
+      combined_hash_string = sorted_results.map do |result|
+        result.result[:hash]
+      end.join("\n")
       # Calculate final SHA-256 hash (instead of SHA3)
       Digest::SHA256.hexdigest(combined_hash_string)

data/examples/multi_work_type/multi_work_type.rb CHANGED Viewed

@@ -45,7 +45,7 @@ module MultiWorkType
     end
     def to_s
-      "ImageWork: dimensions=#{dimensions.join("x")}, format=#{format}"
+      "ImageWork: dimensions=#{dimensions.join('x')}, format=#{format}"
     end
   end
@@ -62,7 +62,7 @@ module MultiWorkType
         error = TypeError.new("Unsupported work type: #{work.class}")
         Fractor::WorkResult.new(
           error: error,
-          work: work
+          work: work,
         )
       end
     end
@@ -74,7 +74,8 @@ module MultiWorkType
       sleep(rand(0.01..0.05)) # Simulate processing time
       processed_text = case work.format
-                       when :markdown then process_markdown(work.data, work.options)
+                       when :markdown then process_markdown(work.data,
+                                                            work.options)
                        when :html then process_html(work.data, work.options)
                        when :json then process_json(work.data, work.options)
                        else work.data.upcase # Simple transformation for plain text
@@ -87,10 +88,10 @@ module MultiWorkType
           transformed_data: processed_text,
           metadata: {
             word_count: processed_text.split(/\s+/).size,
-            char_count: processed_text.length
-          }
+            char_count: processed_text.length,
+          },
         },
-        work: work
+        work: work,
       )
     end
@@ -110,13 +111,13 @@ module MultiWorkType
         applied_filters: %i[sharpen contrast],
         processing_metadata: {
           original_size: input_size,
-          processed_size: (input_size * 0.8).to_i # Simulate compression
-        }
+          processed_size: (input_size * 0.8).to_i, # Simulate compression
+        },
       }
       Fractor::WorkResult.new(
         result: simulated_result,
-        work: work
+        work: work,
       )
     end
@@ -127,7 +128,7 @@ module MultiWorkType
       links = text.scan(/\[(.+?)\]\((.+?)\)/)
       "Processed Markdown: #{text.length} chars, #{headers.size} headers, #{links.size} links\n" \
-        "Headers: #{headers.join(", ")}\n" \
+        "Headers: #{headers.join(', ')}\n" \
         "#{text.gsub(/^#+\s+(.+)$/, '💫 \1 💫')}"
     end
@@ -136,7 +137,7 @@ module MultiWorkType
       tags = text.scan(/<(\w+)[^>]*>/).flatten
       "Processed HTML: #{text.length} chars, #{tags.size} tags\n" \
-        "Tags: #{tags.uniq.join(", ")}\n" \
+        "Tags: #{tags.uniq.join(', ')}\n" \
         "#{text.gsub(%r{<(\w+)[^>]*>(.+?)</\1>}, '✨\2✨')}"
     end
@@ -147,7 +148,7 @@ module MultiWorkType
       keys = data.keys
       "Processed JSON: #{keys.size} top-level keys\n" \
-        "Keys: #{keys.join(", ")}\n" \
+        "Keys: #{keys.join(', ')}\n" \
         "Pretty-printed: #{data}"
     rescue StandardError => e
       "Invalid JSON: #{e.message}"
@@ -162,14 +163,14 @@ module MultiWorkType
       # Create supervisor with a MultiFormatWorker pool
       @supervisor = Fractor::Supervisor.new(
         worker_pools: [
-          { worker_class: MultiFormatWorker, num_workers: worker_count }
-        ]
+          { worker_class: MultiFormatWorker, num_workers: worker_count },
+        ],
       )
       @results = {
         text: [],
         image: [],
-        errors: []
+        errors: [],
       }
     end
@@ -197,10 +198,10 @@ module MultiWorkType
         total_items: text_items.size + image_items.size,
         processed: {
           text: @results[:text].size,
-          image: @results[:image].size
+          image: @results[:image].size,
         },
         errors: @results[:errors].size,
-        results: @results
+        results: @results,
       }
     end
@@ -220,7 +221,7 @@ module MultiWorkType
       results_aggregator.errors.each do |error_result|
         @results[:errors] << {
           error: error_result.error,
-          work_type: error_result.work.class.name
+          work_type: error_result.work.class.name,
         }
       end
@@ -244,21 +245,21 @@ if __FILE__ == $PROGRAM_NAME
   text_items = [
     {
       data: "This is a plain text document. It has no special formatting.",
-      format: :plain
+      format: :plain,
     },
     {
       data: "# Markdown Document\n\nThis is a **bold** statement. Here's a [link](https://example.com).",
-      format: :markdown
+      format: :markdown,
     },
     {
       data: "<html><body><h1>HTML Document</h1><p>This is a paragraph.</p></body></html>",
-      format: :html
+      format: :html,
     },
     {
       data: "{name: 'Product', price: 29.99, tags: ['electronics', 'gadget']}",
       format: :json,
-      options: { pretty: true }
-    }
+      options: { pretty: true },
+    },
   ]
   # Sample image items (simulated)
@@ -266,18 +267,18 @@ if __FILE__ == $PROGRAM_NAME
     {
       data: "simulated_jpeg_data_1",
       dimensions: [800, 600],
-      format: :jpeg
+      format: :jpeg,
     },
     {
       data: "simulated_png_data_1",
       dimensions: [1024, 768],
-      format: :png
+      format: :png,
     },
     {
       data: "simulated_gif_data_1",
       dimensions: [320, 240],
-      format: :gif
-    }
+      format: :gif,
+    },
   ]
   worker_count = 4
@@ -309,8 +310,8 @@ if __FILE__ == $PROGRAM_NAME
   puts "Image Processing Results:"
   result[:results][:image].each_with_index do |image_result, index|
     puts "Image Item #{index + 1} (#{image_result[:format]}):"
-    puts "  Dimensions: #{image_result[:dimensions].join("x")}"
-    puts "  Applied filters: #{image_result[:applied_filters].join(", ")}"
+    puts "  Dimensions: #{image_result[:dimensions].join('x')}"
+    puts "  Applied filters: #{image_result[:applied_filters].join(', ')}"
     puts "  Compression: #{(1 - image_result[:processing_metadata][:processed_size].to_f / image_result[:processing_metadata][:original_size]).round(2) * 100}%"
     puts
   end

data/examples/pipeline_processing/pipeline_processing.rb CHANGED Viewed

@@ -9,7 +9,7 @@ module PipelineProcessing
       super({
         data: data,
         stage: stage,
-        metadata: metadata
+        metadata: metadata,
       })
     end
@@ -29,7 +29,7 @@ module PipelineProcessing
       "MediaWork: stage=#{stage}, metadata=#{metadata}, data_size=#{begin
         data.bytesize
       rescue StandardError
-        "unknown"
+        'unknown'
       end}"
     end
   end
@@ -46,7 +46,7 @@ module PipelineProcessing
                else
                  return Fractor::WorkResult.new(
                    error: "Unknown stage: #{work.stage}",
-                   work: work
+                   work: work,
                  )
                end
@@ -58,7 +58,7 @@ module PipelineProcessing
       # Update metadata with processing information
       updated_metadata = work.metadata.merge(
         "#{work.stage}_completed" => true,
-        "#{work.stage}_time" => Time.now.to_s
+        "#{work.stage}_time" => Time.now.to_s,
       )
       # Return the result with next stage information
@@ -67,9 +67,9 @@ module PipelineProcessing
           processed_data: result,
           current_stage: work.stage,
           next_stage: next_stage,
-          metadata: updated_metadata
+          metadata: updated_metadata,
         },
-        work: work
+        work: work,
       )
     end
@@ -95,7 +95,7 @@ module PipelineProcessing
       sleep(rand(0.01..0.05)) # Simulate processing time
       tags = %w[landscape portrait nature urban abstract]
       selected_tags = tags.sample(rand(1..3))
-      "Tagged image: #{work.data} (tags: #{selected_tags.join(", ")})"
+      "Tagged image: #{work.data} (tags: #{selected_tags.join(', ')})"
     end
   end
@@ -106,8 +106,8 @@ module PipelineProcessing
     def initialize(worker_count = 4)
       @supervisor = Fractor::Supervisor.new(
         worker_pools: [
-          { worker_class: PipelineWorker, num_workers: worker_count }
-        ]
+          { worker_class: PipelineWorker, num_workers: worker_count },
+        ],
       )
       # Register callback to handle pipeline stage transitions
@@ -119,7 +119,7 @@ module PipelineProcessing
           new_work = MediaWork.new(
             result.result[:processed_data],
             next_stage,
-            result.result[:metadata]
+            result.result[:metadata],
           )
           @supervisor.add_work_item(new_work)
         end
@@ -127,7 +127,7 @@ module PipelineProcessing
       @results = {
         completed: [],
-        in_progress: []
+        in_progress: [],
       }
     end
@@ -137,7 +137,7 @@ module PipelineProcessing
         MediaWork.new(
           image,
           :resize,
-          { original_filename: image, started_at: Time.now.to_s }
+          { original_filename: image, started_at: Time.now.to_s },
         )
       end
@@ -159,7 +159,7 @@ module PipelineProcessing
         total_images: images.size,
         completed: @results[:completed].size,
         in_progress: @results[:in_progress].size,
-        results: @results[:completed]
+        results: @results[:completed],
       }
     end
   end
@@ -182,7 +182,7 @@ if __FILE__ == $PROGRAM_NAME
     "mountains.png",
     "beach.jpg",
     "city_skyline.jpg",
-    "forest.png"
+    "forest.png",
   ]
   worker_count = 4
@@ -205,7 +205,7 @@ if __FILE__ == $PROGRAM_NAME
     puts "Image #{index + 1}: #{image_result[:processed_data]}"
     puts "  Processing path:"
     image_result[:metadata].each do |key, value|
-      next unless key.to_s.end_with?("_completed") || key.to_s.end_with?("_time")
+      next unless key.to_s.end_with?("_completed", "_time")
       puts "    #{key}: #{value}"
     end

data/examples/producer_subscriber/producer_subscriber.rb CHANGED Viewed

@@ -8,7 +8,7 @@ module ProducerSubscriber
     def initialize(data, depth = 0)
       super({
         data: data,
-        depth: depth
+        depth: depth,
       })
     end
@@ -31,7 +31,7 @@ module ProducerSubscriber
       super({
         data: data,
         parent_id: parent_id,
-        depth: depth
+        depth: depth,
       })
     end
@@ -63,7 +63,7 @@ module ProducerSubscriber
       else
         Fractor::WorkResult.new(
           error: "Unknown work type: #{work.class}",
-          work: work
+          work: work,
         )
       end
     end
@@ -80,13 +80,13 @@ module ProducerSubscriber
       # Return the result with metadata about sub-works
       result = {
         processed_data: processed_data,
-        sub_works: [] # Will be populated by the supervisor
+        sub_works: [], # Will be populated by the supervisor
       }
       # Return a successful result
       Fractor::WorkResult.new(
         result: result,
-        work: work
+        work: work,
       )
     end
@@ -101,9 +101,9 @@ module ProducerSubscriber
       Fractor::WorkResult.new(
         result: {
           processed_data: processed_data,
-          parent_id: work.parent_id
+          parent_id: work.parent_id,
         },
-        work: work
+        work: work,
       )
     end
   end
@@ -122,8 +122,8 @@ module ProducerSubscriber
       # Create the supervisor
       supervisor = Fractor::Supervisor.new(
         worker_pools: [
-          { worker_class: MultiWorker, num_workers: @worker_count }
-        ]
+          { worker_class: MultiWorker, num_workers: @worker_count },
+        ],
       )
       # Create and add initial work items
@@ -144,12 +144,14 @@ module ProducerSubscriber
         # Create a new supervisor for sub-works
         sub_supervisor = Fractor::Supervisor.new(
           worker_pools: [
-            { worker_class: MultiWorker, num_workers: @worker_count }
-          ]
+            { worker_class: MultiWorker, num_workers: @worker_count },
+          ],
         )
         # Create and add the sub-work items
-        sub_work_items = sub_works.map { |sw| SubWork.new(sw[:data], sw[:parent_id], sw[:depth]) }
+        sub_work_items = sub_works.map do |sw|
+          SubWork.new(sw[:data], sw[:parent_id], sw[:depth])
+        end
         sub_supervisor.add_work_items(sub_work_items)
         sub_supervisor.run
@@ -179,12 +181,14 @@ module ProducerSubscriber
           sub_works << {
             data: sub_data,
             parent_id: work.object_id,
-            depth: work.depth + 1
+            depth: work.depth + 1,
           }
         end
         # Store the sub-work IDs in the result for reference
-        result.result[:sub_works] = sub_works.last(3).map { |sw| sw[:parent_id] }
+        result.result[:sub_works] = sub_works.last(3).map do |sw|
+          sw[:parent_id]
+        end
       end
       sub_works
@@ -195,7 +199,7 @@ module ProducerSubscriber
       initial_results.results.each do |result|
         @result_tree[result.work.object_id] = {
           data: result.result[:processed_data],
-          children: []
+          children: [],
         }
       end
@@ -236,7 +240,7 @@ if __FILE__ == $PROGRAM_NAME
   documents = [
     "Annual Report 2025",
     "Technical Documentation",
-    "Research Paper"
+    "Research Paper",
   ]
   worker_count = 4

data/examples/scatter_gather/scatter_gather.rb CHANGED Viewed

@@ -42,7 +42,7 @@ module ScatterGather
                  error = ArgumentError.new("Unknown source: #{work.source}")
                  return Fractor::WorkResult.new(
                    error: error,
-                   work: work
+                   work: work,
                  )
                end
@@ -53,9 +53,9 @@ module ScatterGather
           query: work.query,
           hits: result[:hits],
           metadata: result[:metadata],
-          timing: result[:timing]
+          timing: result[:timing],
         },
-        work: work
+        work: work,
       )
     end
@@ -72,12 +72,12 @@ module ScatterGather
       # Generate simulated records
       record_count = rand(3..10)
-      hits = record_count.times.map do |i|
+      hits = Array.new(record_count) do |i|
         {
           id: "db-#{i + 1}",
           title: "Database Result #{i + 1} for '#{work.query}'",
           content: "This is database content for #{work.query}",
-          relevance: rand(0.1..1.0).round(2)
+          relevance: rand(0.1..1.0).round(2),
         }
       end
@@ -86,9 +86,9 @@ module ScatterGather
         metadata: {
           source_type: "PostgreSQL Database",
           total_available: record_count + rand(10..50),
-          query_type: "Full-text search"
+          query_type: "Full-text search",
         },
-        timing: rand(0.01..0.3).round(3)
+        timing: rand(0.01..0.3).round(3),
       }
     end
@@ -98,12 +98,12 @@ module ScatterGather
       # Generate simulated API results
       record_count = rand(2..8)
-      hits = record_count.times.map do |i|
+      hits = Array.new(record_count) do |i|
         {
           id: "api-#{i + 1}",
           title: "API Result #{i + 1} for '#{work.query}'",
           content: "This is API content for #{work.query}",
-          relevance: rand(0.1..1.0).round(2)
+          relevance: rand(0.1..1.0).round(2),
         }
       end
@@ -112,9 +112,9 @@ module ScatterGather
         metadata: {
           source_type: "External REST API",
           provider: %w[Google Bing DuckDuckGo].sample,
-          response_code: 200
+          response_code: 200,
         },
-        timing: rand(0.1..0.5).round(3)
+        timing: rand(0.1..0.5).round(3),
       }
     end
@@ -128,12 +128,12 @@ module ScatterGather
       if cache_hit
         # Cache hit - return cached results
         record_count = rand(1..5)
-        hits = record_count.times.map do |i|
+        hits = Array.new(record_count) do |i|
           {
             id: "cache-#{i + 1}",
             title: "Cached Result #{i + 1} for '#{work.query}'",
             content: "This is cached content for #{work.query}",
-            relevance: rand(0.1..1.0).round(2)
+            relevance: rand(0.1..1.0).round(2),
           }
         end
@@ -142,9 +142,9 @@ module ScatterGather
           metadata: {
             source_type: "In-memory Cache",
             cache_hit: true,
-            age: rand(1..3600)
+            age: rand(1..3600),
           },
-          timing: rand(0.001..0.05).round(3)
+          timing: rand(0.001..0.05).round(3),
         }
       else
         # Cache miss
@@ -152,9 +152,9 @@ module ScatterGather
           hits: [],
           metadata: {
             source_type: "In-memory Cache",
-            cache_hit: false
+            cache_hit: false,
           },
-          timing: rand(0.001..0.01).round(3)
+          timing: rand(0.001..0.01).round(3),
         }
       end
     end
@@ -165,13 +165,13 @@ module ScatterGather
       # Generate simulated file results
       record_count = rand(1..12)
-      hits = record_count.times.map do |i|
+      hits = Array.new(record_count) do |i|
         {
           id: "file-#{i + 1}",
           title: "File Result #{i + 1} for '#{work.query}'",
           path: "/path/to/file_#{i + 1}.txt",
           content: "This is file content matching #{work.query}",
-          relevance: rand(0.1..1.0).round(2)
+          relevance: rand(0.1..1.0).round(2),
         }
       end
@@ -180,9 +180,9 @@ module ScatterGather
         metadata: {
           source_type: "File System",
           directories_searched: rand(5..20),
-          files_scanned: rand(50..500)
+          files_scanned: rand(50..500),
         },
-        timing: rand(0.01..0.2).round(3)
+        timing: rand(0.01..0.2).round(3),
       }
     end
   end
@@ -194,8 +194,8 @@ module ScatterGather
     def initialize(worker_count = 4)
       @supervisor = Fractor::Supervisor.new(
         worker_pools: [
-          { worker_class: SearchWorker, num_workers: worker_count }
-        ]
+          { worker_class: SearchWorker, num_workers: worker_count },
+        ],
       )
       @merged_results = nil
@@ -204,10 +204,11 @@ module ScatterGather
     def search(query, sources = nil)
       # Define search sources with their parameters
       sources ||= [
-        { source: :database, params: { max_results: 50, include_archived: false } },
+        { source: :database,
+          params: { max_results: 50, include_archived: false } },
         { source: :api, params: { format: "json", timeout: 5 } },
         { source: :cache, params: { max_age: 3600 } },
-        { source: :filesystem, params: { extensions: %w[txt md pdf] } }
+        { source: :filesystem, params: { extensions: %w[txt md pdf] } },
       ]
       start_time = Time.now
@@ -262,7 +263,7 @@ module ScatterGather
             content: hit[:content],
             source: source,
             original_relevance: hit[:relevance],
-            weighted_relevance: hit[:relevance] * source_weight
+            weighted_relevance: hit[:relevance] * source_weight,
           }
         end
       end
@@ -277,7 +278,7 @@ module ScatterGather
         execution_time: total_time,
         sources: results_by_source.keys,
         ranked_results: ranked_hits,
-        source_details: results_by_source
+        source_details: results_by_source,
       }
     end
   end
@@ -309,7 +310,7 @@ if __FILE__ == $PROGRAM_NAME
   puts "Query: #{results[:query]}"
   puts "Total hits: #{results[:total_hits]}"
   puts "Total execution time: #{results[:execution_time].round(3)} seconds"
-  puts "Sources searched: #{results[:sources].join(", ")}"
+  puts "Sources searched: #{results[:sources].join(', ')}"
   puts
   puts "Top 5 Results (by relevance):"