RubyGems - kumi - Versions diffs - 0.0.24 → 0.0.26 - Mend

kumi 0.0.24 → 0.0.26

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (234) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +14 -0
data/README.md +70 -71
data/data/functions/agg/boolean.yaml +6 -2
data/data/functions/agg/numeric.yaml +32 -16
data/data/functions/agg/string.yaml +4 -3
data/data/functions/core/arithmetic.yaml +62 -14
data/data/functions/core/boolean.yaml +12 -6
data/data/functions/core/comparison.yaml +25 -13
data/data/functions/core/constructor.yaml +16 -8
data/data/functions/core/select.yaml +3 -1
data/data/functions/core/stencil.yaml +14 -5
data/data/functions/core/string.yaml +9 -4
data/data/kernels/ruby/agg/numeric.yaml +1 -1
data/docs/UNSAT_DETECTION.md +83 -0
data/golden/array_element/expected/nast.txt +1 -1
data/golden/array_element/expected/schema_ruby.rb +1 -1
data/golden/array_index/expected/nast.txt +7 -7
data/golden/array_index/expected/schema_ruby.rb +1 -1
data/golden/array_operations/expected/nast.txt +2 -2
data/golden/array_operations/expected/schema_ruby.rb +1 -1
data/golden/array_operations/expected/snast.txt +3 -3
data/golden/cascade_logic/expected/lir_02_inlined.txt +8 -8
data/golden/cascade_logic/expected/schema_ruby.rb +1 -1
data/golden/cascade_logic/expected/snast.txt +2 -2
data/golden/chained_fusion/expected/lir_02_inlined.txt +36 -36
data/golden/chained_fusion/expected/lir_03_cse.txt +23 -23
data/golden/chained_fusion/expected/lir_04_1_loop_fusion.txt +25 -25
data/golden/chained_fusion/expected/lir_04_loop_invcm.txt +23 -23
data/golden/chained_fusion/expected/lir_06_const_prop.txt +23 -23
data/golden/chained_fusion/expected/nast.txt +2 -2
data/golden/chained_fusion/expected/schema_javascript.mjs +23 -23
data/golden/chained_fusion/expected/schema_ruby.rb +28 -28
data/golden/element_arrays/expected/nast.txt +2 -2
data/golden/element_arrays/expected/schema_ruby.rb +1 -1
data/golden/element_arrays/expected/snast.txt +1 -1
data/golden/empty_and_null_inputs/expected/lir_02_inlined.txt +18 -18
data/golden/empty_and_null_inputs/expected/lir_03_cse.txt +17 -17
data/golden/empty_and_null_inputs/expected/lir_04_1_loop_fusion.txt +17 -17
data/golden/empty_and_null_inputs/expected/lir_04_loop_invcm.txt +17 -17
data/golden/empty_and_null_inputs/expected/lir_06_const_prop.txt +17 -17
data/golden/empty_and_null_inputs/expected/nast.txt +3 -3
data/golden/empty_and_null_inputs/expected/schema_javascript.mjs +13 -13
data/golden/empty_and_null_inputs/expected/schema_ruby.rb +18 -18
data/golden/function_overload/expected/ast.txt +29 -0
data/golden/function_overload/expected/input_plan.txt +4 -0
data/golden/function_overload/expected/lir_00_unoptimized.txt +18 -0
data/golden/function_overload/expected/lir_01_hoist_scalar_references.txt +18 -0
data/golden/function_overload/expected/lir_02_inlined.txt +20 -0
data/golden/function_overload/expected/lir_03_cse.txt +20 -0
data/golden/function_overload/expected/lir_04_1_loop_fusion.txt +20 -0
data/golden/function_overload/expected/lir_04_loop_invcm.txt +20 -0
data/golden/function_overload/expected/lir_06_const_prop.txt +20 -0
data/golden/function_overload/expected/nast.txt +22 -0
data/golden/function_overload/expected/schema_javascript.mjs +12 -0
data/golden/function_overload/expected/schema_ruby.rb +39 -0
data/golden/function_overload/expected/snast.txt +22 -0
data/golden/function_overload/input.json +8 -0
data/golden/function_overload/schema.kumi +19 -0
data/golden/game_of_life/expected/lir_00_unoptimized.txt +4 -4
data/golden/game_of_life/expected/lir_01_hoist_scalar_references.txt +4 -4
data/golden/game_of_life/expected/lir_02_inlined.txt +1294 -1294
data/golden/game_of_life/expected/lir_03_cse.txt +403 -399
data/golden/game_of_life/expected/lir_04_1_loop_fusion.txt +403 -399
data/golden/game_of_life/expected/lir_04_loop_invcm.txt +403 -399
data/golden/game_of_life/expected/lir_06_const_prop.txt +403 -399
data/golden/game_of_life/expected/nast.txt +4 -4
data/golden/game_of_life/expected/schema_javascript.mjs +87 -85
data/golden/game_of_life/expected/schema_ruby.rb +88 -86
data/golden/game_of_life/expected/snast.txt +10 -10
data/golden/hash_keys/expected/schema_ruby.rb +1 -1
data/golden/hash_value/expected/nast.txt +1 -1
data/golden/hash_value/expected/schema_ruby.rb +1 -1
data/golden/hash_value/expected/snast.txt +1 -1
data/golden/hierarchical_complex/expected/lir_02_inlined.txt +15 -15
data/golden/hierarchical_complex/expected/lir_03_cse.txt +1 -1
data/golden/hierarchical_complex/expected/lir_04_1_loop_fusion.txt +1 -1
data/golden/hierarchical_complex/expected/lir_04_loop_invcm.txt +1 -1
data/golden/hierarchical_complex/expected/lir_06_const_prop.txt +1 -1
data/golden/hierarchical_complex/expected/nast.txt +3 -3
data/golden/hierarchical_complex/expected/schema_javascript.mjs +1 -1
data/golden/hierarchical_complex/expected/schema_ruby.rb +2 -2
data/golden/hierarchical_complex/expected/snast.txt +3 -3
data/golden/inline_rename_scope_leak/expected/nast.txt +3 -3
data/golden/inline_rename_scope_leak/expected/schema_ruby.rb +1 -1
data/golden/input_reference/expected/nast.txt +2 -2
data/golden/input_reference/expected/schema_ruby.rb +1 -1
data/golden/interleaved_fusion/expected/lir_02_inlined.txt +35 -35
data/golden/interleaved_fusion/expected/lir_03_cse.txt +26 -26
data/golden/interleaved_fusion/expected/lir_04_1_loop_fusion.txt +27 -26
data/golden/interleaved_fusion/expected/lir_04_loop_invcm.txt +26 -26
data/golden/interleaved_fusion/expected/lir_06_const_prop.txt +26 -26
data/golden/interleaved_fusion/expected/nast.txt +2 -2
data/golden/interleaved_fusion/expected/schema_javascript.mjs +23 -23
data/golden/interleaved_fusion/expected/schema_ruby.rb +29 -29
data/golden/let_inline/expected/nast.txt +4 -4
data/golden/let_inline/expected/schema_ruby.rb +1 -1
data/golden/loop_fusion/expected/lir_02_inlined.txt +17 -17
data/golden/loop_fusion/expected/lir_03_cse.txt +14 -14
data/golden/loop_fusion/expected/lir_04_1_loop_fusion.txt +14 -14
data/golden/loop_fusion/expected/lir_04_loop_invcm.txt +14 -14
data/golden/loop_fusion/expected/lir_06_const_prop.txt +14 -14
data/golden/loop_fusion/expected/nast.txt +1 -1
data/golden/loop_fusion/expected/schema_javascript.mjs +12 -12
data/golden/loop_fusion/expected/schema_ruby.rb +16 -16
data/golden/min_reduce_scope/expected/nast.txt +3 -3
data/golden/min_reduce_scope/expected/schema_ruby.rb +1 -1
data/golden/min_reduce_scope/expected/snast.txt +1 -1
data/golden/mixed_dimensions/expected/lir_02_inlined.txt +5 -5
data/golden/mixed_dimensions/expected/lir_03_cse.txt +5 -5
data/golden/mixed_dimensions/expected/lir_04_1_loop_fusion.txt +5 -5
data/golden/mixed_dimensions/expected/lir_04_loop_invcm.txt +5 -5
data/golden/mixed_dimensions/expected/lir_06_const_prop.txt +5 -5
data/golden/mixed_dimensions/expected/nast.txt +2 -2
data/golden/mixed_dimensions/expected/schema_javascript.mjs +3 -3
data/golden/mixed_dimensions/expected/schema_ruby.rb +6 -6
data/golden/multirank_hoisting/expected/lir_02_inlined.txt +48 -48
data/golden/multirank_hoisting/expected/lir_03_cse.txt +35 -35
data/golden/multirank_hoisting/expected/lir_04_1_loop_fusion.txt +35 -35
data/golden/multirank_hoisting/expected/lir_04_loop_invcm.txt +35 -35
data/golden/multirank_hoisting/expected/lir_06_const_prop.txt +35 -35
data/golden/multirank_hoisting/expected/nast.txt +7 -7
data/golden/multirank_hoisting/expected/schema_javascript.mjs +34 -34
data/golden/multirank_hoisting/expected/schema_ruby.rb +36 -36
data/golden/nested_hash/expected/nast.txt +1 -1
data/golden/nested_hash/expected/schema_ruby.rb +1 -1
data/golden/reduction_broadcast/expected/lir_02_inlined.txt +30 -30
data/golden/reduction_broadcast/expected/lir_03_cse.txt +22 -22
data/golden/reduction_broadcast/expected/lir_04_1_loop_fusion.txt +22 -22
data/golden/reduction_broadcast/expected/lir_04_loop_invcm.txt +22 -22
data/golden/reduction_broadcast/expected/lir_06_const_prop.txt +22 -22
data/golden/reduction_broadcast/expected/nast.txt +3 -3
data/golden/reduction_broadcast/expected/schema_javascript.mjs +18 -18
data/golden/reduction_broadcast/expected/schema_ruby.rb +23 -23
data/golden/reduction_broadcast/expected/snast.txt +1 -1
data/golden/roll/expected/schema_ruby.rb +1 -1
data/golden/shift/expected/schema_ruby.rb +1 -1
data/golden/shift_2d/expected/schema_ruby.rb +1 -1
data/golden/simple_math/expected/lir_00_unoptimized.txt +1 -1
data/golden/simple_math/expected/lir_01_hoist_scalar_references.txt +1 -1
data/golden/simple_math/expected/lir_02_inlined.txt +1 -1
data/golden/simple_math/expected/lir_03_cse.txt +1 -1
data/golden/simple_math/expected/lir_04_1_loop_fusion.txt +1 -1
data/golden/simple_math/expected/lir_04_loop_invcm.txt +1 -1
data/golden/simple_math/expected/lir_06_const_prop.txt +1 -1
data/golden/simple_math/expected/nast.txt +5 -5
data/golden/simple_math/expected/schema_ruby.rb +1 -1
data/golden/simple_math/expected/snast.txt +2 -2
data/golden/streaming_basics/expected/lir_02_inlined.txt +25 -25
data/golden/streaming_basics/expected/lir_03_cse.txt +13 -13
data/golden/streaming_basics/expected/lir_04_1_loop_fusion.txt +13 -13
data/golden/streaming_basics/expected/lir_04_loop_invcm.txt +13 -13
data/golden/streaming_basics/expected/lir_06_const_prop.txt +13 -13
data/golden/streaming_basics/expected/nast.txt +8 -8
data/golden/streaming_basics/expected/schema_javascript.mjs +13 -13
data/golden/streaming_basics/expected/schema_ruby.rb +14 -14
data/golden/streaming_basics/expected/snast.txt +1 -1
data/golden/tuples/expected/lir_00_unoptimized.txt +5 -5
data/golden/tuples/expected/lir_01_hoist_scalar_references.txt +5 -5
data/golden/tuples/expected/lir_02_inlined.txt +5 -5
data/golden/tuples/expected/lir_03_cse.txt +5 -5
data/golden/tuples/expected/lir_04_1_loop_fusion.txt +5 -5
data/golden/tuples/expected/lir_04_loop_invcm.txt +5 -5
data/golden/tuples/expected/lir_06_const_prop.txt +5 -5
data/golden/tuples/expected/nast.txt +4 -4
data/golden/tuples/expected/schema_ruby.rb +1 -1
data/golden/tuples/expected/snast.txt +6 -6
data/golden/tuples_and_arrays/expected/lir_00_unoptimized.txt +1 -1
data/golden/tuples_and_arrays/expected/lir_01_hoist_scalar_references.txt +1 -1
data/golden/tuples_and_arrays/expected/lir_02_inlined.txt +17 -17
data/golden/tuples_and_arrays/expected/lir_03_cse.txt +13 -13
data/golden/tuples_and_arrays/expected/lir_04_1_loop_fusion.txt +13 -13
data/golden/tuples_and_arrays/expected/lir_04_loop_invcm.txt +13 -13
data/golden/tuples_and_arrays/expected/lir_06_const_prop.txt +13 -13
data/golden/tuples_and_arrays/expected/nast.txt +3 -3
data/golden/tuples_and_arrays/expected/schema_javascript.mjs +13 -13
data/golden/tuples_and_arrays/expected/schema_ruby.rb +14 -14
data/golden/tuples_and_arrays/expected/snast.txt +2 -2
data/golden/us_tax_2024/expected/ast.txt +63 -670
data/golden/us_tax_2024/expected/input_plan.txt +8 -45
data/golden/us_tax_2024/expected/lir_00_unoptimized.txt +253 -863
data/golden/us_tax_2024/expected/lir_01_hoist_scalar_references.txt +253 -863
data/golden/us_tax_2024/expected/lir_02_inlined.txt +1215 -5139
data/golden/us_tax_2024/expected/lir_03_cse.txt +587 -2460
data/golden/us_tax_2024/expected/lir_04_1_loop_fusion.txt +632 -2480
data/golden/us_tax_2024/expected/lir_04_loop_invcm.txt +587 -2400
data/golden/us_tax_2024/expected/lir_06_const_prop.txt +587 -2400
data/golden/us_tax_2024/expected/nast.txt +123 -826
data/golden/us_tax_2024/expected/schema_javascript.mjs +127 -581
data/golden/us_tax_2024/expected/schema_ruby.rb +135 -610
data/golden/us_tax_2024/expected/snast.txt +155 -858
data/golden/us_tax_2024/expected.json +120 -1
data/golden/us_tax_2024/input.json +18 -9
data/golden/us_tax_2024/schema.kumi +48 -178
data/golden/with_constants/expected/lir_00_unoptimized.txt +1 -1
data/golden/with_constants/expected/lir_01_hoist_scalar_references.txt +1 -1
data/golden/with_constants/expected/lir_02_inlined.txt +1 -1
data/golden/with_constants/expected/lir_03_cse.txt +1 -1
data/golden/with_constants/expected/lir_04_1_loop_fusion.txt +1 -1
data/golden/with_constants/expected/lir_04_loop_invcm.txt +1 -1
data/golden/with_constants/expected/lir_06_const_prop.txt +1 -1
data/golden/with_constants/expected/nast.txt +2 -2
data/golden/with_constants/expected/schema_ruby.rb +1 -1
data/golden/with_constants/expected/snast.txt +2 -2
data/lib/kumi/analyzer.rb +12 -12
data/lib/kumi/core/analyzer/passes/formal_constraint_propagator.rb +236 -0
data/lib/kumi/core/analyzer/passes/input_collector.rb +22 -4
data/lib/kumi/core/analyzer/passes/lir/inline_declarations_pass.rb +118 -74
data/lib/kumi/core/analyzer/passes/nast_dimensional_analyzer_pass.rb +64 -18
data/lib/kumi/core/analyzer/passes/normalize_to_nast_pass.rb +9 -4
data/lib/kumi/core/analyzer/passes/snast_pass.rb +3 -1
data/lib/kumi/core/analyzer/passes/unsat_detector.rb +172 -198
data/lib/kumi/core/error_reporter.rb +36 -1
data/lib/kumi/core/errors.rb +33 -1
data/lib/kumi/core/functions/function_spec.rb +5 -4
data/lib/kumi/core/functions/loader.rb +17 -1
data/lib/kumi/core/functions/overload_resolver.rb +164 -0
data/lib/kumi/core/functions/type_error_reporter.rb +118 -0
data/lib/kumi/core/functions/type_rules.rb +155 -35
data/lib/kumi/core/types/inference.rb +29 -22
data/lib/kumi/core/types/normalizer.rb +29 -45
data/lib/kumi/core/types/validator.rb +16 -27
data/lib/kumi/core/types/value_objects.rb +116 -0
data/lib/kumi/core/types.rb +45 -37
data/lib/kumi/registry_v2/loader.rb +90 -0
data/lib/kumi/registry_v2.rb +18 -1
data/lib/kumi/version.rb +1 -1
metadata +21 -7
data/lib/kumi/core/analyzer/unsat_constant_evaluator.rb +0 -59
data/lib/kumi/core/atom_unsat_solver.rb +0 -396
data/lib/kumi/core/constraint_relationship_solver.rb +0 -641
data/lib/kumi/core/types/builder.rb +0 -23
data/lib/kumi/core/types/compatibility.rb +0 -96
data/lib/kumi/core/types/formatter.rb +0 -26

data/lib/kumi/core/functions/overload_resolver.rb ADDED Viewed

@@ -0,0 +1,164 @@
+# frozen_string_literal: true
+module Kumi
+  module Core
+    module Functions
+      # OverloadResolver performs type-aware function overload resolution.
+      # Given a function alias (or full function ID) and the argument types,
+      # it picks the function ID whose parameter constraints fit best.
+      #
+      # Responsibilities:
+      # - Track all function overloads per alias
+      # - Match argument types against parameter dtype constraints
+      # - Provide clear error messages when resolution fails
+      class OverloadResolver
+        # Raised when an alias or ID cannot be resolved to a function.
+        class ResolutionError < StandardError; end
+        # Scalar dtype constraints: satisfied by a ScalarType of the same kind.
+        SCALAR_DTYPES = %w[string integer float hash].freeze
+        # Every dtype constraint string this resolver knows how to check.
+        # Any other value (including nil) is treated as "unconstrained".
+        KNOWN_DTYPES = (SCALAR_DTYPES + %w[array]).freeze
+        # @param functions_by_id [Hash{String => Object}] function ID => function
+        #   object; each function must respond to #id, #aliases and #params
+        def initialize(functions_by_id)
+          @functions = functions_by_id # "core.mul" => Function
+          @alias_overloads = build_alias_overloads(functions_by_id)
+        end
+        # Resolve a function alias or ID to a specific function ID based on argument types
+        #
+        # A full function ID or an alias with a single overload is only checked
+        # for arity. An alias with several overloads is resolved by scoring each
+        # candidate (see #match_score); ties go to the first registered candidate.
+        #
+        # @param alias_or_id [String, Symbol] Function alias or full function ID
+        # @param arg_types [Array<Kumi::Core::Types::Type>] Inferred types of arguments
+        # @return [String] The resolved function_id
+        # @raise [ResolutionError] If function cannot be resolved
+        def resolve(alias_or_id, arg_types)
+          name = alias_or_id.to_s
+          # If it's already a full function ID, validate and return it
+          if @functions.key?(name)
+            validate_arity!(name, arg_types)
+            return name
+          end
+          # Get all candidate overloads for this alias
+          candidates = @alias_overloads[name]
+          raise ResolutionError, "unknown function #{alias_or_id}" if candidates.nil?
+          # Single overload - use it directly
+          if candidates.size == 1
+            validate_arity!(candidates.first, arg_types)
+            return candidates.first
+          end
+          # Multiple overloads - find best match by type constraints (prefer exact matches)
+          scored = candidates.map { |fn_id| [fn_id, match_score(@functions[fn_id].params, arg_types)] }
+          best_id, best_score = scored.max_by { |_, score| score }
+          return best_id if best_score.positive?
+          # No match found - provide helpful error
+          available = candidates.map { |id| @functions[id].id }.join(", ")
+          raise ResolutionError,
+                "no overload of '#{alias_or_id}' matches argument types #{arg_types.inspect}. " \
+                "Available overloads: #{available}"
+        end
+        # Get function object by ID (already resolved)
+        #
+        # @param id [String, Symbol] Full function ID
+        # @return [Object] The registered function object
+        # @raise [ResolutionError] If no function is registered under that ID
+        def function(id)
+          # Normalise like #exists? and #resolve so Symbol IDs behave consistently.
+          @functions.fetch(id.to_s) do
+            raise ResolutionError, "unknown function #{id}"
+          end
+        end
+        # Check if a function exists
+        #
+        # @param id [String, Symbol] Full function ID
+        # @return [Boolean]
+        def exists?(id)
+          @functions.key?(id.to_s)
+        end
+        private
+        # Maps each alias (as a String, matching the lookup in #resolve) to the
+        # list of function IDs that declare it, in registration order.
+        def build_alias_overloads(functions)
+          functions.values.each_with_object({}) do |func, acc|
+            Array(func.aliases).each do |al|
+              ids = (acc[al.to_s] ||= [])
+              # A function listing the same alias twice is still one overload.
+              ids << func.id unless ids.include?(func.id)
+            end
+          end
+        end
+        # True when arity matches and every constrained parameter accepts its argument.
+        def params_match?(params, arg_types)
+          # Check arity first
+          return false if params.size != arg_types.size
+          # Check each parameter constraint
+          params.zip(arg_types).all? do |param, arg_type|
+            param_dtype = param["dtype"]
+            param_dtype.nil? || type_compatible?(param_dtype, arg_type)
+          end
+        end
+        # Returns match quality: higher is better.
+        # 0 = no match; 1 = compatible but no parameter constraint matched exactly
+        # (e.g. unconstrained or zero parameters); 1 + k = compatible with k
+        # exactly matched constraints.
+        def match_score(params, arg_types)
+          return 0 unless params_match?(params, arg_types)
+          exact_matches = params.zip(arg_types).count do |param, arg_type|
+            score_type_object_match(param["dtype"], arg_type)
+          end
+          # The +1 keeps a compatible overload distinguishable from "no match".
+          1 + exact_matches
+        end
+        # True only when param_dtype is a known constraint AND type_obj satisfies it.
+        def score_type_object_match(param_dtype, type_obj)
+          dtype = param_dtype&.to_s
+          if dtype == "array"
+            type_obj.is_a?(Kumi::Core::Types::ArrayType)
+          elsif SCALAR_DTYPES.include?(dtype)
+            type_obj.is_a?(Kumi::Core::Types::ScalarType) && type_obj.kind == dtype.to_sym
+          else
+            false
+          end
+        end
+        # True when arg_type is acceptable for the given constraint.
+        #
+        # @raise [ArgumentError] If arg_type is not a Type object
+        def type_compatible?(param_dtype_str, arg_type)
+          raise ArgumentError, "arg_type must be a Type object, got #{arg_type.inspect}" unless arg_type.is_a?(Kumi::Core::Types::Type)
+          # No (recognised) constraint, any type matches
+          return true unless KNOWN_DTYPES.include?(param_dtype_str.to_s)
+          score_type_object_match(param_dtype_str, arg_type)
+        end
+        # Raises ResolutionError unless the argument count equals the parameter count.
+        def validate_arity!(fn_id, arg_types)
+          fn = @functions[fn_id]
+          return if fn.params.size == arg_types.size
+          raise ResolutionError,
+                "function #{fn_id} expects #{fn.params.size} arguments, got #{arg_types.size}"
+        end
+      end
+    end
+  end
+end

data/lib/kumi/core/functions/type_error_reporter.rb ADDED Viewed

@@ -0,0 +1,118 @@
+# frozen_string_literal: true
+module Kumi
+  module Core
+    module Functions
+      # TypeErrorReporter provides typed error reporting for function resolution and type checking
+      # Ensures all type errors have proper location information for better diagnostics
+      module TypeErrorReporter
+        # Report function overload resolution failure with proper location
+        #
+        # @param errors [Array] Error accumulator
+        # @param alias_or_id [String, Symbol] Function alias or ID that couldn't be resolved
+        # @param arg_types [Array<Symbol>] Argument types that didn't match any overload
+        # @param available_overloads [Array<String>] Available function overload IDs
+        # @param location [Syntax::Location, nil] Where the error occurred
+        def self.report_overload_resolution_error(errors, alias_or_id, arg_types, available_overloads, location)
+          message = format_overload_error(alias_or_id, arg_types, available_overloads)
+          error = Core::ErrorReporter.create_error(
+            message,
+            location: location,
+            type: :type,
+            context: {
+              alias: alias_or_id.to_s,
+              arg_types: arg_types,
+              candidates: available_overloads
+            }
+          )
+          errors << error
+          error
+        end
+        # Report arity mismatch (wrong number of arguments)
+        #
+        # @param errors [Array] Error accumulator
+        # @param fn_id [String] Full function ID
+        # @param expected [Integer] Expected number of arguments
+        # @param actual [Integer] Actual number of arguments provided
+        # @param location [Syntax::Location, nil] Where the error occurred
+        def self.report_arity_mismatch(errors, fn_id, expected, actual, location)
+          message = "function '#{fn_id}' expects #{expected} argument(s), got #{actual}"
+          error = Core::ErrorReporter.create_error(
+            message,
+            location: location,
+            type: :type,
+            context: {
+              function: fn_id.to_s,
+              expected: expected,
+              actual: actual
+            }
+          )
+          errors << error
+          error
+        end
+        # Report type constraint violation (parameter type doesn't match argument type)
+        #
+        # @param errors [Array] Error accumulator
+        # @param fn_id [String] Full function ID
+        # @param param_name [String] Parameter name
+        # @param expected_type [String] Expected type constraint
+        # @param actual_type [Symbol] Actual argument type
+        # @param location [Syntax::Location, nil] Where the error occurred
+        def self.report_type_constraint_violation(errors, fn_id, param_name, expected_type, actual_type, location)
+          message = "function '#{fn_id}' parameter '#{param_name}' expects type #{expected_type.inspect}, " \
+                    "got #{actual_type.inspect}"
+          error = Core::ErrorReporter.create_error(
+            message,
+            location: location,
+            type: :type,
+            context: {
+              function: fn_id.to_s,
+              parameter: param_name.to_s,
+              expected_type: expected_type.to_s,
+              actual_type: actual_type.to_s
+            }
+          )
+          errors << error
+          error
+        end
+        # Report unknown function
+        #
+        # @param errors [Array] Error accumulator
+        # @param alias_or_id [String, Symbol] Function name/alias that doesn't exist
+        # @param location [Syntax::Location, nil] Where the error occurred
+        def self.report_unknown_function(errors, alias_or_id, location)
+          message = "unknown function '#{alias_or_id}'"
+          error = Core::ErrorReporter.create_error(
+            message,
+            location: location,
+            type: :semantic,
+            context: { function: alias_or_id.to_s }
+          )
+          errors << error
+          error
+        end
+        private
+        def self.format_overload_error(alias_or_id, arg_types, available_overloads)
+          arg_types_str = arg_types.map(&:inspect).join(", ")
+          available_str = available_overloads.map { |id| "'#{id}'" }.join(", ")
+          "no overload of '#{alias_or_id}' matches argument types (#{arg_types_str}). " \
+          "Available overloads: #{available_str}"
+        end
+      end
+    end
+  end
+end

data/lib/kumi/core/functions/type_rules.rb CHANGED Viewed

@@ -6,17 +6,62 @@ module Kumi
       module TypeRules
         module_function
+        # Convert Type objects or symbols to Type objects
+        def to_type_object(type_input)
+          return type_input if type_input.is_a?(Kumi::Core::Types::Type)
+          # Convert symbol/string to Type object
+          case type_input
+          when :string
+            Kumi::Core::Types.scalar(:string)
+          when :integer
+            Kumi::Core::Types.scalar(:integer)
+          when :float
+            Kumi::Core::Types.scalar(:float)
+          when :boolean
+            Kumi::Core::Types.scalar(:boolean)
+          when :hash
+            Kumi::Core::Types.scalar(:hash)
+          when String
+            # Handle string type representations like "array<integer>" or "tuple<float, integer>"
+            parse_string_type(type_input)
+          else
+            # For any other type representation, normalize first
+            normalized = Kumi::Core::Types.normalize(type_input)
+            to_type_object(normalized)
+          end
+        end
+        def parse_string_type(str_type)
+          # Handle array types: "array<integer>"
+          if (m = /\Aarray<(.+)>\z/.match(str_type))
+            element_str = m[1]
+            element_type = to_type_object(element_str.to_sym)
+            return Kumi::Core::Types.array(element_type)
+          end
+          # Handle tuple types: "tuple<integer, float>"
+          if (m = /\Atuple<(.+)>\z/.match(str_type))
+            element_strs = m[1].split(",").map(&:strip)
+            element_types = element_strs.map { |s| to_type_object(s.to_sym) }
+            return Kumi::Core::Types.tuple(element_types)
+          end
+          # Try as symbol
+          to_type_object(str_type.to_sym)
+        end
         def normalize_type_symbol(type_symbol)
           Kumi::Core::Types.normalize(type_symbol)
         end
-        # Minimal type promotion for NAST analysis
+        # Type promotion for NAST analysis - returns Type objects
         def promote_types(*input_types)
-          normalized = input_types.flatten.compact.uniq
-          return :float if normalized.include?(:float)
-          return :integer if normalized.include?(:integer)
+          types = input_types.flatten.compact.uniq
+          return Kumi::Core::Types.scalar(:float) if types.any? { |t| float_type?(t) }
+          return Kumi::Core::Types.scalar(:integer) if types.any? { |t| integer_type?(t) }
-          normalized.first
+          to_type_object(types.first)
         end
         def common_type(element_types)
@@ -26,81 +71,156 @@ module Kumi
         def unify_types(type1, type2)
           return type1 if type1 == type2
-          promote_types(type1, type2) # Fall back to promotion for now
+          promote_types(type1, type2)
         end
-        def same_type_as(reference_type_symbol)
-          normalize_type_symbol(reference_type_symbol)
+        def same_type_as(reference_type)
+          to_type_object(reference_type)
         rescue StandardError
-          # binding.pry
-          # raise
-          # TODO CHECK HOW HANDLE THIS
+          to_type_object(reference_type)
         end
         def array_type(element_type)
-          :"array<#{element_type}>"
+          element_obj = to_type_object(element_type)
+          Kumi::Core::Types.array(element_obj)
         end
         def tuple_type(*element_types)
-          :"tuple<#{element_types.join(', ')}>"
+          element_objs = element_types.map { |t| to_type_object(t) }
+          Kumi::Core::Types.tuple(element_objs)
         end
-        # Parses a collection type symbol to find its element type.
+        # Extract element type from collection Type objects
         def element_type_of(collection_type)
-          str_type = collection_type.to_s
-          if (m = /\Aarray<(.+)>\z/.match(str_type))
-            return m[1].to_sym
+          type_obj = to_type_object(collection_type)
+          case type_obj
+          when Kumi::Core::Types::ArrayType
+            type_obj.element_type
+          when Kumi::Core::Types::TupleType
+            # Promote all element types to common type
+            promote_types(*type_obj.element_types)
+          else
+            type_obj
           end
+        end
-          if (m = /\Atuple<(.+)>\z/.match(str_type))
-            # The "element type" of a tuple is the common promoted type of its members.
-            # e.g., tuple<integer, float> -> float
-            member_types = m[1].split(",").map { |s| s.strip.to_sym }
-            return promote_types(member_types)
+        # --- Typed Rule Builders (Direct Type Construction) ---
+        # Build rule: return the type of a specific parameter
+        def build_same_as(param_name)
+          ->(named) { same_type_as(named.fetch(param_name)) }
+        end
+        # Build rule: promote types of multiple parameters
+        def build_promote(*param_names)
+          ->(named) { promote_types(*param_names.map { |k| named.fetch(k) }) }
+        end
+        # Build rule: extract element type from a collection parameter
+        def build_element_of(param_name)
+          ->(named) { element_type_of(named.fetch(param_name)) }
+        end
+        # Build rule: unify types of two parameters
+        def build_unify(param_name1, param_name2)
+          ->(named) { unify_types(named.fetch(param_name1), named.fetch(param_name2)) }
+        end
+        # Build rule: common type among array elements
+        def build_common_type(param_name)
+          ->(named) { common_type(named.fetch(param_name)) }
+        end
+        # Build rule: array of a specific element type
+        def build_array(element_type_or_param_name)
+          # Check if it's a known scalar kind or Type object
+          if element_type_or_param_name.is_a?(Kumi::Core::Types::Type)
+            # Type object - use directly
+            type_obj = element_type_or_param_name
+            ->(_) { Kumi::Core::Types.array(type_obj) }
+          elsif element_type_or_param_name.is_a?(Symbol) && Kumi::Core::Types::Validator.valid_kind?(element_type_or_param_name)
+            # Known scalar kind - create Type and wrap
+            type_obj = to_type_object(element_type_or_param_name)
+            ->(_) { Kumi::Core::Types.array(type_obj) }
+          else
+            # Treat as parameter name reference
+            ->(named) { array_type(named.fetch(element_type_or_param_name)) }
           end
+        end
+        # Build rule: tuple of specific element types
+        def build_tuple(*element_types_or_param_names)
+          # If single symbol and NOT a known scalar kind, treat as parameter reference
+          if element_types_or_param_names.size == 1 && element_types_or_param_names[0].is_a?(Symbol)
+            sym = element_types_or_param_names[0]
+            unless Kumi::Core::Types::Validator.valid_kind?(sym)
+              # Not a known kind - treat as parameter name (holds array of types)
+              return ->(named) { tuple_type(*named.fetch(sym)) }
+            end
+          end
+          # Interpret as explicit types
+          type_objs = element_types_or_param_names.map { |t| to_type_object(t) }
+          ->(_) { Kumi::Core::Types.tuple(type_objs) }
+        end
-          normalize_type_symbol(str_type)
+        # Build rule: constant scalar type
+        def build_scalar(kind)
+          ->(_) { to_type_object(kind) }
         end
-        # Compile dtype rule string into callable
+        # --- Compile dtype rule string into callable (backward compatible) ---
         def compile_dtype_rule(rule_string, _parameter_names)
           rule = rule_string.to_s.strip
-          # --- NEW: Handle the "element_of" rule ---
           if (m = /\Aelement_of\((.+)\)\z/.match(rule))
             key = m[1].strip.to_sym
-            return ->(named) { element_type_of(named.fetch(key)) }
+            return build_element_of(key)
           end
-          # Handle existing function-based rules
           if (m = /\Apromote\((.+)\)\z/.match(rule))
             keys = m[1].split(",").map { |s| s.strip.to_sym }
-            return ->(named) { promote_types(*keys.map { |k| named.fetch(k) }) }
+            return build_promote(*keys)
           end
           if (m = /\Asame_as\((.+)\)\z/.match(rule))
             key = m[1].strip.to_sym
-            return ->(named) { same_type_as(named.fetch(key)) }
+            return build_same_as(key)
           end
-          if (m = /\Aunify\(([^,]+),\s*([^)]+)\)\z/.match(rule)) # TODO: - check if needed or is just the promote
+          if (m = /\Aunify\(([^,]+),\s*([^)]+)\)\z/.match(rule))
             k1 = m[1].strip.to_sym
             k2 = m[2].strip.to_sym
-            return ->(named) { unify_types(named.fetch(k1), named.fetch(k2)) }
+            return build_unify(k1, k2)
           end
           if (m = /\Acommon_type\((.+)\)\z/.match(rule))
             param_name = m[1].strip.to_sym
-            return ->(named) { common_type(named.fetch(param_name)) }
+            return build_common_type(param_name)
           end
           if (m = /\Aarray\((.+)\)\z/.match(rule))
             inner_rule = m[1].strip
-            inner_compiled = compile_dtype_rule(inner_rule, []) # param_names not needed here
+            inner_compiled = compile_dtype_rule(inner_rule, [])
             return ->(named) { array_type(inner_compiled.call(named)) }
           end
           if (m = /\Atuple\(types\((.+)\)\)\z/.match(rule))
             param_name = m[1].strip.to_sym
-            return ->(named) { tuple_type(*named.fetch(param_name)) }
+            return build_tuple(param_name)
           end
-          ->(_) { normalize_type_symbol(rule.to_sym) }
+          # Constant scalar type
+          build_scalar(rule.to_sym)
+        end
+        def float_type?(t)
+          t.is_a?(Kumi::Core::Types::ScalarType) ? t.kind == :float : t == :float
+        end
+        def integer_type?(t)
+          t.is_a?(Kumi::Core::Types::ScalarType) ? t.kind == :integer : t == :integer
         end
       end
     end

data/lib/kumi/core/types/inference.rb CHANGED Viewed

@@ -9,31 +9,38 @@ module Kumi
       class Inference
         def self.infer_from_value(value)
           case value
-          when String then :string
-          when Integer then :integer
-          when Float then :float
-          when TrueClass, FalseClass then :boolean
-          when Symbol then :symbol
-          when Regexp then :regexp
-          when Time then :time
-          when DateTime then :datetime
-          when Date then :date
+          when String
+            Kumi::Core::Types.scalar(:string)
+          when Integer
+            Kumi::Core::Types.scalar(:integer)
+          when Float
+            Kumi::Core::Types.scalar(:float)
+          when TrueClass, FalseClass
+            Kumi::Core::Types.scalar(:boolean)
+          when Symbol
+            Kumi::Core::Types.scalar(:symbol)
+          when Regexp
+            Kumi::Core::Types.scalar(:regexp)
+          when Time
+            Kumi::Core::Types.scalar(:time)
+          when DateTime
+            Kumi::Core::Types.scalar(:datetime)
+          when Date
+            Kumi::Core::Types.scalar(:date)
           when Array
-            return Kumi::Core::Types.array(:any) if value.empty?
-            # Infer element type from first element (simple heuristic)
-            first_elem_type = infer_from_value(value.first)
-            Kumi::Core::Types.array(first_elem_type)
+            if value.empty?
+              Kumi::Core::Types.array(Kumi::Core::Types.scalar(:any))
+            else
+              # Infer element type from first element (simple heuristic)
+              elem_type = infer_from_value(value.first)
+              Kumi::Core::Types.array(elem_type)
+            end
           when Hash
-            return Kumi::Core::Types.hash(:any, :any) if value.empty?
-            # Infer key/value types from first pair (simple heuristic)
-            first_key, first_value = value.first
-            key_type = infer_from_value(first_key)
-            value_type = infer_from_value(first_value)
-            Kumi::Core::Types.hash(key_type, value_type)
+            # Kumi treats hash as scalar, not key/value pair type
+            # So we just return scalar(:hash) regardless of contents
+            Kumi::Core::Types.scalar(:hash)
           else
-            :any
+            Kumi::Core::Types.scalar(:any)
           end
         end
       end