kumi 0.0.17 → 0.0.19
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.rubocop.yml +4 -1
- data/.ruby-version +1 -0
- data/CHANGELOG.md +28 -0
- data/CLAUDE.md +26 -139
- data/README.md +143 -372
- data/data/functions/agg/boolean.yaml +14 -0
- data/data/functions/agg/numeric.yaml +80 -0
- data/data/functions/agg/string.yaml +8 -0
- data/data/functions/core/arithmetic.yaml +50 -0
- data/data/functions/core/boolean.yaml +18 -0
- data/data/functions/core/comparison.yaml +42 -0
- data/data/functions/core/constructor.yaml +32 -0
- data/data/functions/core/select.yaml +7 -0
- data/data/functions/core/stencil.yaml +21 -0
- data/data/functions/core/string.yaml +19 -0
- data/data/kernels/javascript/agg/boolean.yaml +12 -0
- data/data/kernels/javascript/agg/numeric.yaml +27 -0
- data/data/kernels/javascript/agg/string.yaml +5 -0
- data/data/kernels/javascript/core/arithmetic.yaml +32 -0
- data/data/kernels/javascript/core/boolean.yaml +12 -0
- data/data/kernels/javascript/core/comparison.yaml +24 -0
- data/data/kernels/javascript/core/constructor.yaml +15 -0
- data/data/kernels/javascript/core/select.yaml +7 -0
- data/data/kernels/javascript/core/string.yaml +12 -0
- data/data/kernels/ruby/agg/boolean.yaml +18 -0
- data/data/kernels/ruby/agg/numeric.yaml +29 -0
- data/data/kernels/ruby/agg/string.yaml +5 -0
- data/data/kernels/ruby/core/arithmetic.yaml +38 -0
- data/data/kernels/ruby/core/boolean.yaml +15 -0
- data/data/kernels/ruby/core/comparison.yaml +30 -0
- data/data/kernels/ruby/core/constructor.yaml +17 -0
- data/data/kernels/ruby/core/select.yaml +4 -0
- data/data/kernels/ruby/core/string.yaml +15 -0
- data/debug_ordering.rb +52 -0
- data/docs/FORM_SCHEMA.md +85 -0
- data/docs/OUTPUT_SCHEMA.md +69 -0
- data/docs/SYNTAX.md +626 -373
- data/golden/array_element/expected/ast.txt +21 -0
- data/golden/array_element/expected/input_plan.txt +5 -0
- data/golden/array_element/expected/lir_00_unoptimized.txt +13 -0
- data/golden/array_element/expected/lir_01_hoist_scalar_references.txt +13 -0
- data/golden/array_element/expected/lir_02_inlined.txt +13 -0
- data/golden/array_element/expected/lir_03_cse.txt +13 -0
- data/golden/array_element/expected/lir_04_1_loop_fusion.txt +13 -0
- data/golden/array_element/expected/lir_04_loop_invcm.txt +13 -0
- data/golden/array_element/expected/lir_06_const_prop.txt +13 -0
- data/golden/array_element/expected/nast.txt +7 -0
- data/golden/array_element/expected/schema_javascript.mjs +13 -0
- data/golden/array_element/expected/schema_ruby.rb +41 -0
- data/golden/array_element/expected/snast.txt +7 -0
- data/golden/array_element/expected.json +5 -0
- data/golden/array_element/input.json +9 -0
- data/golden/array_element/schema.kumi +11 -0
- data/golden/array_index/expected/ast.txt +59 -0
- data/golden/array_index/expected/input_plan.txt +5 -0
- data/golden/array_index/expected/lir_00_unoptimized.txt +41 -0
- data/golden/array_index/expected/lir_01_hoist_scalar_references.txt +41 -0
- data/golden/array_index/expected/lir_02_inlined.txt +42 -0
- data/golden/array_index/expected/lir_03_cse.txt +40 -0
- data/golden/array_index/expected/lir_04_1_loop_fusion.txt +40 -0
- data/golden/array_index/expected/lir_04_loop_invcm.txt +40 -0
- data/golden/array_index/expected/lir_06_const_prop.txt +40 -0
- data/golden/array_index/expected/nast.txt +33 -0
- data/golden/array_index/expected/schema_javascript.mjs +46 -0
- data/golden/array_index/expected/schema_ruby.rb +75 -0
- data/golden/array_index/expected/snast.txt +33 -0
- data/golden/array_index/expected.json +5 -0
- data/golden/array_index/input.json +1 -0
- data/golden/array_index/schema.kumi +19 -0
- data/golden/array_operations/expected/ast.txt +50 -0
- data/golden/array_operations/expected/input_plan.txt +10 -0
- data/golden/array_operations/expected/lir_00_unoptimized.txt +47 -0
- data/golden/array_operations/expected/lir_01_hoist_scalar_references.txt +47 -0
- data/golden/array_operations/expected/lir_02_inlined.txt +47 -0
- data/golden/array_operations/expected/lir_03_cse.txt +47 -0
- data/golden/array_operations/expected/lir_04_1_loop_fusion.txt +47 -0
- data/golden/array_operations/expected/lir_04_loop_invcm.txt +47 -0
- data/golden/array_operations/expected/lir_06_const_prop.txt +47 -0
- data/golden/array_operations/expected/nast.txt +32 -0
- data/golden/array_operations/expected/schema_javascript.mjs +60 -0
- data/golden/array_operations/expected/schema_ruby.rb +91 -0
- data/golden/array_operations/expected/snast.txt +32 -0
- data/golden/array_operations/expected.json +27 -0
- data/golden/array_operations/input.json +8 -0
- data/golden/array_operations/schema.kumi +12 -10
- data/golden/cascade_logic/expected/ast.txt +37 -0
- data/golden/cascade_logic/expected/input_plan.txt +2 -0
- data/golden/cascade_logic/expected/lir_00_unoptimized.txt +29 -0
- data/golden/cascade_logic/expected/lir_01_hoist_scalar_references.txt +29 -0
- data/golden/cascade_logic/expected/lir_02_inlined.txt +37 -0
- data/golden/cascade_logic/expected/lir_03_cse.txt +30 -0
- data/golden/cascade_logic/expected/lir_04_1_loop_fusion.txt +30 -0
- data/golden/cascade_logic/expected/lir_04_loop_invcm.txt +30 -0
- data/golden/cascade_logic/expected/lir_06_const_prop.txt +30 -0
- data/golden/cascade_logic/expected/nast.txt +32 -0
- data/golden/cascade_logic/expected/schema_javascript.mjs +31 -0
- data/golden/cascade_logic/expected/schema_ruby.rb +57 -0
- data/golden/cascade_logic/expected/snast.txt +32 -0
- data/golden/cascade_logic/expected.json +5 -0
- data/golden/cascade_logic/input.json +4 -0
- data/golden/cascade_logic/schema.kumi +1 -3
- data/golden/chained_fusion/expected/ast.txt +57 -0
- data/golden/chained_fusion/expected/input_plan.txt +13 -0
- data/golden/chained_fusion/expected/lir_00_unoptimized.txt +76 -0
- data/golden/chained_fusion/expected/lir_01_hoist_scalar_references.txt +76 -0
- data/golden/chained_fusion/expected/lir_02_inlined.txt +114 -0
- data/golden/chained_fusion/expected/lir_03_cse.txt +97 -0
- data/golden/chained_fusion/expected/lir_04_1_loop_fusion.txt +99 -0
- data/golden/chained_fusion/expected/lir_04_loop_invcm.txt +97 -0
- data/golden/chained_fusion/expected/lir_06_const_prop.txt +97 -0
- data/golden/chained_fusion/expected/nast.txt +55 -0
- data/golden/chained_fusion/expected/schema_javascript.mjs +116 -0
- data/golden/chained_fusion/expected/schema_ruby.rb +149 -0
- data/golden/chained_fusion/expected/snast.txt +55 -0
- data/golden/chained_fusion/expected.json +45 -0
- data/golden/chained_fusion/input.json +51 -0
- data/golden/chained_fusion/schema.kumi +52 -0
- data/golden/element_arrays/expected/ast.txt +55 -0
- data/golden/element_arrays/expected/input_plan.txt +7 -0
- data/golden/element_arrays/expected/lir_00_unoptimized.txt +81 -0
- data/golden/element_arrays/expected/lir_01_hoist_scalar_references.txt +81 -0
- data/golden/element_arrays/expected/lir_02_inlined.txt +85 -0
- data/golden/element_arrays/expected/lir_03_cse.txt +83 -0
- data/golden/element_arrays/expected/lir_04_1_loop_fusion.txt +83 -0
- data/golden/element_arrays/expected/lir_04_loop_invcm.txt +83 -0
- data/golden/element_arrays/expected/lir_06_const_prop.txt +83 -0
- data/golden/element_arrays/expected/nast.txt +42 -0
- data/golden/element_arrays/expected/schema_javascript.mjs +106 -0
- data/golden/element_arrays/expected/schema_ruby.rb +141 -0
- data/golden/element_arrays/expected/snast.txt +42 -0
- data/golden/element_arrays/expected.json +55 -0
- data/golden/element_arrays/input.json +12 -0
- data/golden/element_arrays/schema.kumi +21 -0
- data/golden/empty_and_null_inputs/expected/ast.txt +42 -0
- data/golden/empty_and_null_inputs/expected/input_plan.txt +12 -0
- data/golden/empty_and_null_inputs/expected/lir_00_unoptimized.txt +31 -0
- data/golden/empty_and_null_inputs/expected/lir_01_hoist_scalar_references.txt +31 -0
- data/golden/empty_and_null_inputs/expected/lir_02_inlined.txt +51 -0
- data/golden/empty_and_null_inputs/expected/lir_03_cse.txt +49 -0
- data/golden/empty_and_null_inputs/expected/lir_04_1_loop_fusion.txt +49 -0
- data/golden/empty_and_null_inputs/expected/lir_04_loop_invcm.txt +49 -0
- data/golden/empty_and_null_inputs/expected/lir_06_const_prop.txt +49 -0
- data/golden/empty_and_null_inputs/expected/nast.txt +18 -0
- data/golden/empty_and_null_inputs/expected/schema_javascript.mjs +47 -0
- data/golden/empty_and_null_inputs/expected/schema_ruby.rb +79 -0
- data/golden/empty_and_null_inputs/expected/snast.txt +18 -0
- data/golden/empty_and_null_inputs/expected.json +8 -0
- data/golden/empty_and_null_inputs/input.json +16 -0
- data/golden/empty_and_null_inputs/schema.kumi +30 -0
- data/golden/game_of_life/expected/ast.txt +118 -0
- data/golden/game_of_life/expected/input_plan.txt +5 -0
- data/golden/game_of_life/expected/lir_00_unoptimized.txt +343 -0
- data/golden/game_of_life/expected/lir_01_hoist_scalar_references.txt +343 -0
- data/golden/game_of_life/expected/lir_02_inlined.txt +1918 -0
- data/golden/game_of_life/expected/lir_03_cse.txt +766 -0
- data/golden/game_of_life/expected/lir_04_1_loop_fusion.txt +766 -0
- data/golden/game_of_life/expected/lir_04_loop_invcm.txt +766 -0
- data/golden/game_of_life/expected/lir_06_const_prop.txt +766 -0
- data/golden/game_of_life/expected/nast.txt +104 -0
- data/golden/game_of_life/expected/schema_javascript.mjs +98 -0
- data/golden/game_of_life/expected/schema_ruby.rb +125 -0
- data/golden/game_of_life/expected/snast.txt +104 -0
- data/golden/game_of_life/expected.json +3 -0
- data/golden/game_of_life/input.json +8 -0
- data/golden/game_of_life/schema.kumi +33 -0
- data/golden/hash_keys/expected/ast.txt +29 -0
- data/golden/hash_keys/expected/input_plan.txt +2 -0
- data/golden/hash_keys/expected/lir_00_unoptimized.txt +18 -0
- data/golden/hash_keys/expected/lir_01_hoist_scalar_references.txt +18 -0
- data/golden/hash_keys/expected/lir_02_inlined.txt +18 -0
- data/golden/hash_keys/expected/lir_03_cse.txt +18 -0
- data/golden/hash_keys/expected/lir_04_1_loop_fusion.txt +18 -0
- data/golden/hash_keys/expected/lir_04_loop_invcm.txt +18 -0
- data/golden/hash_keys/expected/lir_06_const_prop.txt +18 -0
- data/golden/hash_keys/expected/nast.txt +46 -0
- data/golden/hash_keys/expected/schema_javascript.mjs +34 -0
- data/golden/hash_keys/expected/schema_ruby.rb +61 -0
- data/golden/hash_keys/expected/snast.txt +46 -0
- data/golden/hash_keys/expected.json +20 -0
- data/golden/hash_keys/input.json +4 -0
- data/golden/hash_keys/schema.kumi +14 -0
- data/golden/hash_value/expected/ast.txt +37 -0
- data/golden/hash_value/expected/input_plan.txt +7 -0
- data/golden/hash_value/expected/lir_00_unoptimized.txt +30 -0
- data/golden/hash_value/expected/lir_01_hoist_scalar_references.txt +30 -0
- data/golden/hash_value/expected/lir_02_inlined.txt +36 -0
- data/golden/hash_value/expected/lir_03_cse.txt +33 -0
- data/golden/hash_value/expected/lir_04_1_loop_fusion.txt +33 -0
- data/golden/hash_value/expected/lir_04_loop_invcm.txt +33 -0
- data/golden/hash_value/expected/lir_06_const_prop.txt +33 -0
- data/golden/hash_value/expected/nast.txt +25 -0
- data/golden/hash_value/expected/schema_javascript.mjs +46 -0
- data/golden/hash_value/expected/schema_ruby.rb +75 -0
- data/golden/hash_value/expected/snast.txt +25 -0
- data/golden/hash_value/expected.json +19 -0
- data/golden/hash_value/input.json +12 -0
- data/golden/hash_value/schema.kumi +19 -0
- data/golden/hierarchical_complex/expected/ast.txt +85 -0
- data/golden/hierarchical_complex/expected/input_plan.txt +23 -0
- data/golden/hierarchical_complex/expected/lir_00_unoptimized.txt +87 -0
- data/golden/hierarchical_complex/expected/lir_01_hoist_scalar_references.txt +87 -0
- data/golden/hierarchical_complex/expected/lir_02_inlined.txt +115 -0
- data/golden/hierarchical_complex/expected/lir_03_cse.txt +89 -0
- data/golden/hierarchical_complex/expected/lir_04_1_loop_fusion.txt +89 -0
- data/golden/hierarchical_complex/expected/lir_04_loop_invcm.txt +89 -0
- data/golden/hierarchical_complex/expected/lir_06_const_prop.txt +89 -0
- data/golden/hierarchical_complex/expected/nast.txt +49 -0
- data/golden/hierarchical_complex/expected/schema_javascript.mjs +121 -0
- data/golden/hierarchical_complex/expected/schema_ruby.rb +151 -0
- data/golden/hierarchical_complex/expected/snast.txt +49 -0
- data/golden/hierarchical_complex/expected.json +34 -0
- data/golden/hierarchical_complex/input.json +26 -0
- data/golden/hierarchical_complex/schema.kumi +38 -0
- data/golden/input_reference/expected/ast.txt +46 -0
- data/golden/input_reference/expected/input_plan.txt +15 -0
- data/golden/input_reference/expected/lir_00_unoptimized.txt +39 -0
- data/golden/input_reference/expected/lir_01_hoist_scalar_references.txt +39 -0
- data/golden/input_reference/expected/lir_02_inlined.txt +39 -0
- data/golden/input_reference/expected/lir_03_cse.txt +39 -0
- data/golden/input_reference/expected/lir_04_1_loop_fusion.txt +39 -0
- data/golden/input_reference/expected/lir_04_loop_invcm.txt +39 -0
- data/golden/input_reference/expected/lir_06_const_prop.txt +39 -0
- data/golden/input_reference/expected/nast.txt +21 -0
- data/golden/input_reference/expected/schema_javascript.mjs +45 -0
- data/golden/input_reference/expected/schema_ruby.rb +74 -0
- data/golden/input_reference/expected/snast.txt +21 -0
- data/golden/input_reference/expected.json +7 -0
- data/golden/input_reference/input.json +11 -0
- data/golden/input_reference/schema.kumi +22 -0
- data/golden/interleaved_fusion/expected/ast.txt +51 -0
- data/golden/interleaved_fusion/expected/input_plan.txt +13 -0
- data/golden/interleaved_fusion/expected/lir_00_unoptimized.txt +53 -0
- data/golden/interleaved_fusion/expected/lir_01_hoist_scalar_references.txt +53 -0
- data/golden/interleaved_fusion/expected/lir_02_inlined.txt +89 -0
- data/golden/interleaved_fusion/expected/lir_03_cse.txt +77 -0
- data/golden/interleaved_fusion/expected/lir_04_1_loop_fusion.txt +77 -0
- data/golden/interleaved_fusion/expected/lir_04_loop_invcm.txt +77 -0
- data/golden/interleaved_fusion/expected/lir_06_const_prop.txt +77 -0
- data/golden/interleaved_fusion/expected/nast.txt +41 -0
- data/golden/interleaved_fusion/expected/schema_javascript.mjs +86 -0
- data/golden/interleaved_fusion/expected/schema_ruby.rb +122 -0
- data/golden/interleaved_fusion/expected/snast.txt +41 -0
- data/golden/interleaved_fusion/expected.json +37 -0
- data/golden/interleaved_fusion/input.json +26 -0
- data/golden/interleaved_fusion/schema.kumi +57 -0
- data/golden/let_inline/expected/ast.txt +33 -0
- data/golden/let_inline/expected/input_plan.txt +2 -0
- data/golden/let_inline/expected/lir_00_unoptimized.txt +26 -0
- data/golden/let_inline/expected/lir_01_hoist_scalar_references.txt +26 -0
- data/golden/let_inline/expected/lir_02_inlined.txt +36 -0
- data/golden/let_inline/expected/lir_03_cse.txt +30 -0
- data/golden/let_inline/expected/lir_04_1_loop_fusion.txt +30 -0
- data/golden/let_inline/expected/lir_04_loop_invcm.txt +30 -0
- data/golden/let_inline/expected/lir_06_const_prop.txt +30 -0
- data/golden/let_inline/expected/nast.txt +26 -0
- data/golden/let_inline/expected/schema_javascript.mjs +11 -0
- data/golden/let_inline/expected/schema_ruby.rb +37 -0
- data/golden/let_inline/expected/snast.txt +26 -0
- data/golden/let_inline/expected.json +1 -0
- data/golden/let_inline/input.json +1 -0
- data/golden/let_inline/schema.kumi +11 -0
- data/golden/loop_fusion/expected/ast.txt +44 -0
- data/golden/loop_fusion/expected/input_plan.txt +13 -0
- data/golden/loop_fusion/expected/lir_00_unoptimized.txt +43 -0
- data/golden/loop_fusion/expected/lir_01_hoist_scalar_references.txt +43 -0
- data/golden/loop_fusion/expected/lir_02_inlined.txt +62 -0
- data/golden/loop_fusion/expected/lir_03_cse.txt +57 -0
- data/golden/loop_fusion/expected/lir_04_1_loop_fusion.txt +57 -0
- data/golden/loop_fusion/expected/lir_04_loop_invcm.txt +57 -0
- data/golden/loop_fusion/expected/lir_06_const_prop.txt +57 -0
- data/golden/loop_fusion/expected/nast.txt +32 -0
- data/golden/loop_fusion/expected/schema_javascript.mjs +64 -0
- data/golden/loop_fusion/expected/schema_ruby.rb +97 -0
- data/golden/loop_fusion/expected/snast.txt +32 -0
- data/golden/loop_fusion/expected.json +30 -0
- data/golden/loop_fusion/input.json +28 -0
- data/golden/loop_fusion/schema.kumi +32 -0
- data/golden/min_reduce_scope/expected/ast.txt +49 -0
- data/golden/min_reduce_scope/expected/input_plan.txt +9 -0
- data/golden/min_reduce_scope/expected/lir_00_unoptimized.txt +59 -0
- data/golden/min_reduce_scope/expected/lir_01_hoist_scalar_references.txt +59 -0
- data/golden/min_reduce_scope/expected/lir_02_inlined.txt +63 -0
- data/golden/min_reduce_scope/expected/lir_03_cse.txt +60 -0
- data/golden/min_reduce_scope/expected/lir_04_1_loop_fusion.txt +60 -0
- data/golden/min_reduce_scope/expected/lir_04_loop_invcm.txt +60 -0
- data/golden/min_reduce_scope/expected/lir_06_const_prop.txt +60 -0
- data/golden/min_reduce_scope/expected/nast.txt +29 -0
- data/golden/min_reduce_scope/expected/schema_javascript.mjs +66 -0
- data/golden/min_reduce_scope/expected/schema_ruby.rb +99 -0
- data/golden/min_reduce_scope/expected/snast.txt +29 -0
- data/golden/min_reduce_scope/expected.json +9 -0
- data/golden/min_reduce_scope/input.json +18 -0
- data/golden/min_reduce_scope/schema.kumi +25 -0
- data/golden/mixed_dimensions/expected/ast.txt +54 -0
- data/golden/mixed_dimensions/expected/input_plan.txt +15 -0
- data/golden/mixed_dimensions/expected/lir_00_unoptimized.txt +42 -0
- data/golden/mixed_dimensions/expected/lir_01_hoist_scalar_references.txt +42 -0
- data/golden/mixed_dimensions/expected/lir_02_inlined.txt +48 -0
- data/golden/mixed_dimensions/expected/lir_03_cse.txt +48 -0
- data/golden/mixed_dimensions/expected/lir_04_1_loop_fusion.txt +48 -0
- data/golden/mixed_dimensions/expected/lir_04_loop_invcm.txt +48 -0
- data/golden/mixed_dimensions/expected/lir_06_const_prop.txt +48 -0
- data/golden/mixed_dimensions/expected/nast.txt +22 -0
- data/golden/mixed_dimensions/expected/schema_javascript.mjs +53 -0
- data/golden/mixed_dimensions/expected/schema_ruby.rb +84 -0
- data/golden/mixed_dimensions/expected/snast.txt +22 -0
- data/golden/mixed_dimensions/expected.json +6 -0
- data/golden/mixed_dimensions/input.json +22 -0
- data/golden/mixed_dimensions/schema.kumi +35 -0
- data/golden/multirank_hoisting/expected/ast.txt +72 -0
- data/golden/multirank_hoisting/expected/input_plan.txt +18 -0
- data/golden/multirank_hoisting/expected/lir_00_unoptimized.txt +75 -0
- data/golden/multirank_hoisting/expected/lir_01_hoist_scalar_references.txt +75 -0
- data/golden/multirank_hoisting/expected/lir_02_inlined.txt +126 -0
- data/golden/multirank_hoisting/expected/lir_03_cse.txt +109 -0
- data/golden/multirank_hoisting/expected/lir_04_1_loop_fusion.txt +109 -0
- data/golden/multirank_hoisting/expected/lir_04_loop_invcm.txt +109 -0
- data/golden/multirank_hoisting/expected/lir_06_const_prop.txt +109 -0
- data/golden/multirank_hoisting/expected/nast.txt +39 -0
- data/golden/multirank_hoisting/expected/schema_javascript.mjs +128 -0
- data/golden/multirank_hoisting/expected/schema_ruby.rb +162 -0
- data/golden/multirank_hoisting/expected/snast.txt +39 -0
- data/golden/multirank_hoisting/expected.json +15 -0
- data/golden/multirank_hoisting/input.json +19 -0
- data/golden/multirank_hoisting/schema.kumi +38 -0
- data/golden/nested_hash/expected/ast.txt +22 -0
- data/golden/nested_hash/expected/input_plan.txt +5 -0
- data/golden/nested_hash/expected/lir_00_unoptimized.txt +10 -0
- data/golden/nested_hash/expected/lir_01_hoist_scalar_references.txt +10 -0
- data/golden/nested_hash/expected/lir_02_inlined.txt +10 -0
- data/golden/nested_hash/expected/lir_03_cse.txt +10 -0
- data/golden/nested_hash/expected/lir_04_1_loop_fusion.txt +10 -0
- data/golden/nested_hash/expected/lir_04_loop_invcm.txt +10 -0
- data/golden/nested_hash/expected/lir_06_const_prop.txt +10 -0
- data/golden/nested_hash/expected/nast.txt +8 -0
- data/golden/nested_hash/expected/schema_javascript.mjs +9 -0
- data/golden/nested_hash/expected/schema_ruby.rb +35 -0
- data/golden/nested_hash/expected/snast.txt +8 -0
- data/golden/nested_hash/expected.json +3 -0
- data/golden/nested_hash/input.json +7 -0
- data/golden/nested_hash/schema.kumi +11 -0
- data/golden/reduction_broadcast/expected/ast.txt +49 -0
- data/golden/reduction_broadcast/expected/input_plan.txt +13 -0
- data/golden/reduction_broadcast/expected/lir_00_unoptimized.txt +49 -0
- data/golden/reduction_broadcast/expected/lir_01_hoist_scalar_references.txt +49 -0
- data/golden/reduction_broadcast/expected/lir_02_inlined.txt +80 -0
- data/golden/reduction_broadcast/expected/lir_03_cse.txt +68 -0
- data/golden/reduction_broadcast/expected/lir_04_1_loop_fusion.txt +68 -0
- data/golden/reduction_broadcast/expected/lir_04_loop_invcm.txt +68 -0
- data/golden/reduction_broadcast/expected/lir_06_const_prop.txt +68 -0
- data/golden/reduction_broadcast/expected/nast.txt +24 -0
- data/golden/reduction_broadcast/expected/schema_javascript.mjs +74 -0
- data/golden/reduction_broadcast/expected/schema_ruby.rb +110 -0
- data/golden/reduction_broadcast/expected/snast.txt +24 -0
- data/golden/reduction_broadcast/expected.json +25 -0
- data/golden/reduction_broadcast/input.json +19 -0
- data/golden/reduction_broadcast/schema.kumi +34 -0
- data/golden/roll/expected/ast.txt +36 -0
- data/golden/roll/expected/input_plan.txt +3 -0
- data/golden/roll/expected/lir_00_unoptimized.txt +56 -0
- data/golden/roll/expected/lir_01_hoist_scalar_references.txt +56 -0
- data/golden/roll/expected/lir_02_inlined.txt +56 -0
- data/golden/roll/expected/lir_03_cse.txt +55 -0
- data/golden/roll/expected/lir_04_1_loop_fusion.txt +55 -0
- data/golden/roll/expected/lir_04_loop_invcm.txt +55 -0
- data/golden/roll/expected/lir_06_const_prop.txt +55 -0
- data/golden/roll/expected/nast.txt +26 -0
- data/golden/roll/expected/schema_javascript.mjs +65 -0
- data/golden/roll/expected/schema_ruby.rb +95 -0
- data/golden/roll/expected/snast.txt +26 -0
- data/golden/roll/expected.json +6 -0
- data/golden/roll/input.json +1 -0
- data/golden/roll/schema.kumi +13 -0
- data/golden/shift/expected/ast.txt +48 -0
- data/golden/shift/expected/input_plan.txt +3 -0
- data/golden/shift/expected/lir_00_unoptimized.txt +96 -0
- data/golden/shift/expected/lir_01_hoist_scalar_references.txt +96 -0
- data/golden/shift/expected/lir_02_inlined.txt +96 -0
- data/golden/shift/expected/lir_03_cse.txt +90 -0
- data/golden/shift/expected/lir_04_1_loop_fusion.txt +90 -0
- data/golden/shift/expected/lir_04_loop_invcm.txt +90 -0
- data/golden/shift/expected/lir_06_const_prop.txt +90 -0
- data/golden/shift/expected/nast.txt +38 -0
- data/golden/shift/expected/schema_javascript.mjs +106 -0
- data/golden/shift/expected/schema_ruby.rb +138 -0
- data/golden/shift/expected/snast.txt +38 -0
- data/golden/shift/expected.json +8 -0
- data/golden/shift/input.json +1 -0
- data/golden/shift/schema.kumi +15 -0
- data/golden/shift_2d/expected/ast.txt +88 -0
- data/golden/shift_2d/expected/input_plan.txt +5 -0
- data/golden/shift_2d/expected/lir_00_unoptimized.txt +274 -0
- data/golden/shift_2d/expected/lir_01_hoist_scalar_references.txt +274 -0
- data/golden/shift_2d/expected/lir_02_inlined.txt +274 -0
- data/golden/shift_2d/expected/lir_03_cse.txt +262 -0
- data/golden/shift_2d/expected/lir_04_1_loop_fusion.txt +262 -0
- data/golden/shift_2d/expected/lir_04_loop_invcm.txt +262 -0
- data/golden/shift_2d/expected/lir_06_const_prop.txt +262 -0
- data/golden/shift_2d/expected/nast.txt +74 -0
- data/golden/shift_2d/expected/schema_javascript.mjs +320 -0
- data/golden/shift_2d/expected/schema_ruby.rb +358 -0
- data/golden/shift_2d/expected/snast.txt +74 -0
- data/golden/shift_2d/expected.json +15 -0
- data/golden/shift_2d/input.json +14 -0
- data/golden/shift_2d/schema.kumi +25 -0
- data/golden/simple_math/expected/ast.txt +40 -0
- data/golden/simple_math/expected/input_plan.txt +2 -0
- data/golden/simple_math/expected/lir_00_unoptimized.txt +31 -0
- data/golden/simple_math/expected/lir_01_hoist_scalar_references.txt +31 -0
- data/golden/simple_math/expected/lir_02_inlined.txt +31 -0
- data/golden/simple_math/expected/lir_03_cse.txt +31 -0
- data/golden/simple_math/expected/lir_04_1_loop_fusion.txt +31 -0
- data/golden/simple_math/expected/lir_04_loop_invcm.txt +31 -0
- data/golden/simple_math/expected/lir_06_const_prop.txt +31 -0
- data/golden/simple_math/expected/nast.txt +33 -0
- data/golden/simple_math/expected/schema_javascript.mjs +33 -0
- data/golden/simple_math/expected/schema_ruby.rb +59 -0
- data/golden/simple_math/expected/snast.txt +33 -0
- data/golden/simple_math/expected.json +1 -0
- data/golden/simple_math/input.json +4 -0
- data/golden/simple_math/schema.kumi +2 -1
- data/golden/streaming_basics/expected/ast.txt +64 -0
- data/golden/streaming_basics/expected/input_plan.txt +8 -0
- data/golden/streaming_basics/expected/lir_00_unoptimized.txt +73 -0
- data/golden/streaming_basics/expected/lir_01_hoist_scalar_references.txt +73 -0
- data/golden/streaming_basics/expected/lir_02_inlined.txt +100 -0
- data/golden/streaming_basics/expected/lir_03_cse.txt +84 -0
- data/golden/streaming_basics/expected/lir_04_1_loop_fusion.txt +84 -0
- data/golden/streaming_basics/expected/lir_04_loop_invcm.txt +84 -0
- data/golden/streaming_basics/expected/lir_06_const_prop.txt +84 -0
- data/golden/streaming_basics/expected/nast.txt +48 -0
- data/golden/streaming_basics/expected/schema_javascript.mjs +94 -0
- data/golden/streaming_basics/expected/schema_ruby.rb +127 -0
- data/golden/streaming_basics/expected/snast.txt +48 -0
- data/golden/streaming_basics/expected.json +10 -0
- data/golden/streaming_basics/input.json +8 -0
- data/golden/streaming_basics/schema.kumi +24 -0
- data/golden/tuples/expected/ast.txt +48 -0
- data/golden/tuples/expected/input_plan.txt +1 -0
- data/golden/tuples/expected/lir_00_unoptimized.txt +40 -0
- data/golden/tuples/expected/lir_01_hoist_scalar_references.txt +40 -0
- data/golden/tuples/expected/lir_02_inlined.txt +48 -0
- data/golden/tuples/expected/lir_03_cse.txt +48 -0
- data/golden/tuples/expected/lir_04_1_loop_fusion.txt +48 -0
- data/golden/tuples/expected/lir_04_loop_invcm.txt +48 -0
- data/golden/tuples/expected/lir_06_const_prop.txt +48 -0
- data/golden/tuples/expected/nast.txt +42 -0
- data/golden/tuples/expected/schema_javascript.mjs +51 -0
- data/golden/tuples/expected/schema_ruby.rb +77 -0
- data/golden/tuples/expected/snast.txt +42 -0
- data/golden/tuples/expected.json +7 -0
- data/golden/tuples/input.json +3 -0
- data/golden/tuples/schema.kumi +11 -0
- data/golden/tuples_and_arrays/expected/ast.txt +44 -0
- data/golden/tuples_and_arrays/expected/input_plan.txt +7 -0
- data/golden/tuples_and_arrays/expected/lir_00_unoptimized.txt +41 -0
- data/golden/tuples_and_arrays/expected/lir_01_hoist_scalar_references.txt +41 -0
- data/golden/tuples_and_arrays/expected/lir_02_inlined.txt +62 -0
- data/golden/tuples_and_arrays/expected/lir_03_cse.txt +51 -0
- data/golden/tuples_and_arrays/expected/lir_04_1_loop_fusion.txt +51 -0
- data/golden/tuples_and_arrays/expected/lir_04_loop_invcm.txt +51 -0
- data/golden/tuples_and_arrays/expected/lir_06_const_prop.txt +51 -0
- data/golden/tuples_and_arrays/expected/nast.txt +28 -0
- data/golden/tuples_and_arrays/expected/schema_javascript.mjs +58 -0
- data/golden/tuples_and_arrays/expected/schema_ruby.rb +88 -0
- data/golden/tuples_and_arrays/expected/snast.txt +28 -0
- data/golden/tuples_and_arrays/expected.json +18 -0
- data/golden/tuples_and_arrays/input.json +7 -0
- data/golden/tuples_and_arrays/schema.kumi +38 -0
- data/golden/with_constants/expected/ast.txt +28 -0
- data/golden/with_constants/expected/input_plan.txt +2 -0
- data/golden/with_constants/expected/lir_00_unoptimized.txt +17 -0
- data/golden/with_constants/expected/lir_01_hoist_scalar_references.txt +17 -0
- data/golden/with_constants/expected/lir_02_inlined.txt +17 -0
- data/golden/with_constants/expected/lir_03_cse.txt +17 -0
- data/golden/with_constants/expected/lir_04_1_loop_fusion.txt +17 -0
- data/golden/with_constants/expected/lir_04_loop_invcm.txt +17 -0
- data/golden/with_constants/expected/lir_06_const_prop.txt +17 -0
- data/golden/with_constants/expected/nast.txt +21 -0
- data/golden/with_constants/expected/schema_javascript.mjs +18 -0
- data/golden/with_constants/expected/schema_ruby.rb +44 -0
- data/golden/with_constants/expected/snast.txt +15 -0
- data/golden/with_constants/schema.kumi +10 -0
- data/lib/kumi/analyzer.rb +76 -24
- data/lib/kumi/configuration.rb +60 -0
- data/lib/kumi/core/analyzer/binder.rb +121 -0
- data/lib/kumi/core/analyzer/checkpoint.rb +15 -9
- data/lib/kumi/core/analyzer/constant_evaluator.rb +32 -37
- data/lib/kumi/core/analyzer/constant_folding_helpers.rb +55 -0
- data/lib/kumi/core/analyzer/debug.rb +14 -16
- data/lib/kumi/core/analyzer/fn_aliases.rb +46 -0
- data/lib/kumi/core/analyzer/folder.rb +94 -0
- data/lib/kumi/core/analyzer/macro_expander.rb +69 -0
- data/lib/kumi/core/analyzer/passes/assemble_irv2_pass.rb +130 -0
- data/lib/kumi/core/analyzer/passes/attach_anchors_pass.rb +71 -0
- data/lib/kumi/core/analyzer/passes/attach_terminal_info_pass.rb +181 -0
- data/lib/kumi/core/analyzer/passes/codegen/js/declaration_emitter.rb +317 -0
- data/lib/kumi/core/analyzer/passes/codegen/js/emitter.rb +75 -0
- data/lib/kumi/core/analyzer/passes/codegen/js/output_buffer.rb +103 -0
- data/lib/kumi/core/analyzer/passes/codegen/js_pass.rb +27 -0
- data/lib/kumi/core/analyzer/passes/codegen/ruby/declaration_emitter.rb +321 -0
- data/lib/kumi/core/analyzer/passes/codegen/ruby/emitter.rb +85 -0
- data/lib/kumi/core/analyzer/passes/codegen/ruby/output_buffer.rb +111 -0
- data/lib/kumi/core/analyzer/passes/codegen/ruby_pass.rb +32 -0
- data/lib/kumi/core/analyzer/passes/constant_folding_pass.rb +33 -0
- data/lib/kumi/core/analyzer/passes/contract_checker_pass.rb +220 -0
- data/lib/kumi/core/analyzer/passes/dependency_resolver.rb +5 -6
- data/lib/kumi/core/analyzer/passes/input_access_planner_pass.rb +7 -3
- data/lib/kumi/core/analyzer/passes/input_collector.rb +74 -122
- data/lib/kumi/core/analyzer/passes/input_form_schema_pass.rb +43 -0
- data/lib/kumi/core/analyzer/passes/ir_dependency_pass.rb +1 -1
- data/lib/kumi/core/analyzer/passes/ir_execution_schedule_pass.rb +1 -1
- data/lib/kumi/core/analyzer/passes/join_reduce_planning_pass.rb +21 -23
- data/lib/kumi/core/analyzer/passes/lir/constant_propagation_pass.rb +84 -0
- data/lib/kumi/core/analyzer/passes/lir/dead_code_elimination_pass.rb +93 -0
- data/lib/kumi/core/analyzer/passes/lir/hoist_scalar_references_pass.rb +115 -0
- data/lib/kumi/core/analyzer/passes/lir/inline_declarations_pass.rb +274 -0
- data/lib/kumi/core/analyzer/passes/lir/instruction_scheduling_pass.rb +198 -0
- data/lib/kumi/core/analyzer/passes/lir/kernel_binding_pass.rb +30 -0
- data/lib/kumi/core/analyzer/passes/lir/local_cse_pass.rb +121 -0
- data/lib/kumi/core/analyzer/passes/lir/loop_fusion_pass.rb +156 -0
- data/lib/kumi/core/analyzer/passes/lir/loop_invariant_code_motion_pass.rb +148 -0
- data/lib/kumi/core/analyzer/passes/lir/lower_pass.rb +407 -0
- data/lib/kumi/core/analyzer/passes/lir/stencil_emitter.rb +243 -0
- data/lib/kumi/core/analyzer/passes/lir/validation_pass.rb +83 -0
- data/lib/kumi/core/analyzer/passes/load_input_cse.rb +17 -16
- data/lib/kumi/core/analyzer/passes/lower_to_ir_pass.rb +4 -2
- data/lib/kumi/core/analyzer/passes/lower_to_irv2_pass.rb +197 -0
- data/lib/kumi/core/analyzer/passes/name_indexer.rb +4 -1
- data/lib/kumi/core/analyzer/passes/nast_dimensional_analyzer_pass.rb +237 -0
- data/lib/kumi/core/analyzer/passes/normalize_to_nast_pass.rb +156 -0
- data/lib/kumi/core/analyzer/passes/output_schema_pass.rb +38 -0
- data/lib/kumi/core/analyzer/passes/pass_base.rb +30 -4
- data/lib/kumi/core/analyzer/passes/precompute_access_paths_pass.rb +93 -0
- data/lib/kumi/core/analyzer/passes/scope_resolution_pass.rb +33 -30
- data/lib/kumi/core/analyzer/passes/semantic_constraint_validator.rb +5 -26
- data/lib/kumi/core/analyzer/passes/snast_pass.rb +229 -0
- data/lib/kumi/core/analyzer/passes/toposorter.rb +1 -0
- data/lib/kumi/core/analyzer/passes/type_checker.rb +13 -0
- data/lib/kumi/core/analyzer/passes/type_inferencer_pass.rb +14 -16
- data/lib/kumi/core/analyzer/passes/unsat_detector.rb +2 -1
- data/lib/kumi/core/analyzer/plans.rb +12 -0
- data/lib/kumi/core/analyzer/state_serde.rb +4 -4
- data/lib/kumi/core/analyzer/structs/access_plan.rb +2 -2
- data/lib/kumi/core/analyzer/unsat_constant_evaluator.rb +59 -0
- data/lib/kumi/core/compiler/access_codegen.rb +1 -1
- data/lib/kumi/core/compiler/access_emit/base.rb +9 -5
- data/lib/kumi/core/compiler/access_emit/each_indexed.rb +10 -3
- data/lib/kumi/core/compiler/access_emit/materialize.rb +12 -5
- data/lib/kumi/core/compiler/access_emit/ravel.rb +10 -3
- data/lib/kumi/core/compiler/access_emit/read.rb +4 -1
- data/lib/kumi/core/compiler/access_planner.rb +42 -4
- data/lib/kumi/core/compiler/access_planner_v2.rb +164 -0
- data/lib/kumi/core/explain.rb +18 -11
- data/lib/kumi/core/functions/loader.rb +47 -0
- data/lib/kumi/core/functions/model.rb +10 -0
- data/lib/kumi/core/functions/type_rules.rb +108 -0
- data/lib/kumi/core/ir/execution_engine/interpreter.rb +1 -1
- data/lib/kumi/core/ir/execution_engine/profiler.rb +107 -97
- data/lib/kumi/core/ir.rb +6 -2
- data/lib/kumi/core/irv2/builder.rb +48 -0
- data/lib/kumi/core/irv2/declaration.rb +28 -0
- data/lib/kumi/core/irv2/module.rb +108 -0
- data/lib/kumi/core/irv2/value.rb +28 -0
- data/lib/kumi/core/lir/analyze.rb +64 -0
- data/lib/kumi/core/lir/build.rb +363 -0
- data/lib/kumi/core/lir/emit.rb +62 -0
- data/lib/kumi/core/lir/structs/instruction.rb +44 -0
- data/lib/kumi/core/lir/structs/literal.rb +14 -0
- data/lib/kumi/core/lir/structs/stamp.rb +13 -0
- data/lib/kumi/core/lir/support/error.rb +9 -0
- data/lib/kumi/core/lir/support/ids.rb +34 -0
- data/lib/kumi/core/lir/validate.rb +74 -0
- data/lib/kumi/core/lir.rb +34 -0
- data/lib/kumi/core/nast.rb +216 -0
- data/lib/kumi/core/ruby_parser/dsl.rb +2 -2
- data/lib/kumi/core/ruby_parser/dsl_cascade_builder.rb +1 -1
- data/lib/kumi/core/ruby_parser/expression_converter.rb +10 -0
- data/lib/kumi/core/ruby_parser/input_builder.rb +16 -17
- data/lib/kumi/core/ruby_parser/schema_builder.rb +36 -10
- data/lib/kumi/core/ruby_parser/sugar.rb +64 -0
- data/lib/kumi/core/types/builder.rb +2 -2
- data/lib/kumi/core/types/normalizer.rb +2 -0
- data/lib/kumi/core/types/validator.rb +10 -3
- data/lib/kumi/core/types.rb +7 -0
- data/lib/kumi/dev/codegen.rb +194 -0
- data/lib/kumi/dev/golden/generator.rb +105 -0
- data/lib/kumi/dev/golden/reporter.rb +160 -0
- data/lib/kumi/dev/golden/representation.rb +45 -0
- data/lib/kumi/dev/golden/result.rb +98 -0
- data/lib/kumi/dev/golden/runtime_test.rb +93 -0
- data/lib/kumi/dev/golden/suite.rb +131 -0
- data/lib/kumi/dev/golden/verifier.rb +76 -0
- data/lib/kumi/dev/golden.rb +75 -0
- data/lib/kumi/dev/ir.rb +4 -4
- data/lib/kumi/dev/parse.rb +1 -1
- data/lib/kumi/dev/pretty_printer.rb +229 -0
- data/lib/kumi/dev/printer/irv2_formatter.rb +163 -0
- data/lib/kumi/dev/printer/width_aware_json.rb +44 -0
- data/lib/kumi/dev/profile_aggregator.rb +36 -38
- data/lib/kumi/dev/profile_runner.rb +19 -23
- data/lib/kumi/dev/runner.rb +12 -22
- data/lib/kumi/dev/support/kumi_runner.mjs +39 -0
- data/lib/kumi/dev.rb +3 -3
- data/lib/kumi/frontends/ruby.rb +12 -12
- data/lib/kumi/frontends/text.rb +26 -21
- data/lib/kumi/frontends.rb +6 -8
- data/lib/kumi/kernel_registry.rb +59 -0
- data/lib/kumi/pack/builder.rb +229 -0
- data/lib/kumi/pack.rb +15 -0
- data/lib/kumi/registry_v2/loader.rb +81 -0
- data/lib/kumi/registry_v2.rb +118 -0
- data/lib/kumi/schema.rb +83 -43
- data/lib/kumi/support/diff.rb +3 -2
- data/lib/kumi/support/ir_render.rb +1 -1
- data/lib/kumi/support/lir_printer.rb +143 -0
- data/lib/kumi/support/nast_printer.rb +93 -0
- data/lib/kumi/support/s_expression_printer.rb +5 -4
- data/lib/kumi/support/snast_printer.rb +111 -0
- data/lib/kumi/syntax/call_expression.rb +1 -1
- data/lib/kumi/syntax/input_declaration.rb +2 -2
- data/lib/kumi/syntax/node.rb +4 -12
- data/lib/kumi/syntax/root.rb +10 -0
- data/lib/kumi/syntax/trait_declaration.rb +1 -0
- data/lib/kumi/syntax/value_declaration.rb +1 -0
- data/lib/kumi/version.rb +1 -1
- data/lib/kumi.rb +47 -5
- metadata +571 -54
- data/docs/AST.md +0 -133
- data/docs/DSL.md +0 -154
- data/docs/FUNCTIONS.md +0 -176
- data/docs/VECTOR_SEMANTICS.md +0 -286
- data/docs/compiler_design_principles.md +0 -86
- data/docs/dev/analyzer-debug.md +0 -52
- data/docs/dev/parse-command.md +0 -64
- data/docs/dev/vm-profiling.md +0 -95
- data/docs/development/README.md +0 -120
- data/docs/development/error-reporting.md +0 -361
- data/docs/features/README.md +0 -58
- data/docs/features/analysis-type-inference.md +0 -42
- data/docs/features/analysis-unsat-detection.md +0 -71
- data/docs/features/hierarchical-broadcasting.md +0 -415
- data/docs/features/input-declaration-system.md +0 -58
- data/docs/features/performance.md +0 -14
- data/docs/features/s-expression-printer.md +0 -77
- data/docs/schema_metadata/broadcasts.md +0 -53
- data/docs/schema_metadata/cascades.md +0 -45
- data/docs/schema_metadata/declarations.md +0 -54
- data/docs/schema_metadata/dependencies.md +0 -57
- data/docs/schema_metadata/evaluation_order.md +0 -29
- data/docs/schema_metadata/examples.md +0 -95
- data/docs/schema_metadata/inferred_types.md +0 -46
- data/docs/schema_metadata/inputs.md +0 -86
- data/docs/schema_metadata.md +0 -108
- data/golden/mixed_nesting/schema.kumi +0 -42
- data/lib/kumi/core/function_registry/collection_functions.rb +0 -298
- data/lib/kumi/core/function_registry/comparison_functions.rb +0 -33
- data/lib/kumi/core/function_registry/conditional_functions.rb +0 -48
- data/lib/kumi/core/function_registry/function_builder.rb +0 -184
- data/lib/kumi/core/function_registry/logical_functions.rb +0 -214
- data/lib/kumi/core/function_registry/math_functions.rb +0 -74
- data/lib/kumi/core/function_registry/stat_functions.rb +0 -156
- data/lib/kumi/core/function_registry/string_functions.rb +0 -57
- data/lib/kumi/core/function_registry/type_functions.rb +0 -53
- data/lib/kumi/core/function_registry.rb +0 -176
- data/lib/kumi/registry.rb +0 -32
- data/lib/kumi/runtime/executable.rb +0 -135
- data/lib/kumi/runtime/run.rb +0 -105
- data/performance_results.txt +0 -63
- data/scripts/analyze_broadcast_methods.rb +0 -68
- data/scripts/analyze_cascade_methods.rb +0 -74
- data/scripts/check_broadcasting_coverage.rb +0 -51
- data/scripts/find_dead_code.rb +0 -114
- data/scripts/generate_function_docs.rb +0 -71
- data/scripts/test_mixed_nesting_performance.rb +0 -206
@@ -0,0 +1,274 @@
|
|
1
|
+
# frozen_string_literal: true
|
2
|
+
|
3
|
+
module Kumi
|
4
|
+
module Core
|
5
|
+
module Analyzer
|
6
|
+
module Passes
|
7
|
+
module LIR
|
8
|
+
class InlineDeclarationsPass < PassBase
|
9
|
+
LIR = Kumi::Core::LIR
|
10
|
+
MAX_PASSES = 30
|
11
|
+
|
12
|
+
def run(_errors)
|
13
|
+
current_ops = get_state(:lir_module)
|
14
|
+
@ids = get_state(:id_generator)
|
15
|
+
|
16
|
+
MAX_PASSES.times do
|
17
|
+
new_ops, changed = run_one_pass(current_ops)
|
18
|
+
|
19
|
+
unless changed
|
20
|
+
new_ops.freeze
|
21
|
+
return state.with(:lir_module, new_ops).with(:lir_02_inlined_ops_by_decl, new_ops)
|
22
|
+
end
|
23
|
+
current_ops = new_ops
|
24
|
+
end
|
25
|
+
|
26
|
+
raise "LIR inlining did not converge after #{MAX_PASSES} passes."
|
27
|
+
end
|
28
|
+
|
29
|
+
private
|
30
|
+
|
31
|
+
# --- UNCHANGED: Top-level pass logic ---
|
32
|
+
def run_one_pass(ops_by_decl)
|
33
|
+
@ops_by_decl = ops_by_decl
|
34
|
+
@gamma = detect_all_gammas(@ops_by_decl)
|
35
|
+
changed = false
|
36
|
+
fused = {}
|
37
|
+
@ops_by_decl.each do |name, payload|
|
38
|
+
original_ops = Array(payload[:operations])
|
39
|
+
|
40
|
+
# Call the new top-level inliner
|
41
|
+
inlined_ops = inline_top_level_decl(original_ops)
|
42
|
+
|
43
|
+
fused[name] = { operations: inlined_ops }
|
44
|
+
changed ||= (inlined_ops != original_ops)
|
45
|
+
end
|
46
|
+
[fused, changed]
|
47
|
+
end
|
48
|
+
|
49
|
+
# --- NEW: Top-level entry point for the recursive processor ---
|
50
|
+
def inline_top_level_decl(ops)
|
51
|
+
env = Env.new
|
52
|
+
reg_map = {}
|
53
|
+
rename_map = {}
|
54
|
+
processed_ops, hoisted_ops = process_and_hoist_block(ops, env, reg_map, rename_map)
|
55
|
+
|
56
|
+
# Hoisting is not allowed at the top level of a declaration
|
57
|
+
raise "Orphaned code was hoisted to top level" unless hoisted_ops.empty?
|
58
|
+
|
59
|
+
processed_ops
|
60
|
+
end
|
61
|
+
|
62
|
+
# --- NEW: The core recursive block processor ---
|
63
|
+
# Returns two arrays: [ processed_instructions_for_this_block, instructions_to_hoist_up_one_level ]
|
64
|
+
def process_and_hoist_block(block_ops, env, reg_map, rename_map)
|
65
|
+
out_ops = []
|
66
|
+
hoisted_out_ops = [] # Operations to be returned to the parent scope
|
67
|
+
i = 0
|
68
|
+
|
69
|
+
while i < block_ops.length
|
70
|
+
ins = block_ops[i]
|
71
|
+
case ins.opcode
|
72
|
+
when :LoopStart
|
73
|
+
end_idx = find_matching_loop_end(block_ops, i)
|
74
|
+
loop_body = block_ops[(i + 1)...end_idx]
|
75
|
+
|
76
|
+
env.push(ins)
|
77
|
+
processed_body, hoisted_from_child = process_and_hoist_block(loop_body, env, reg_map, rename_map)
|
78
|
+
env.pop
|
79
|
+
|
80
|
+
# This is the crucial step: emit code hoisted from the child loop
|
81
|
+
# BEFORE emitting the child loop itself.
|
82
|
+
out_ops.concat(hoisted_from_child)
|
83
|
+
|
84
|
+
# Now, emit the reconstructed loop with its processed body
|
85
|
+
out_ops << rewrite(ins, reg_map, rename_map)
|
86
|
+
out_ops.concat(processed_body)
|
87
|
+
out_ops << rewrite(block_ops[end_idx], reg_map, rename_map)
|
88
|
+
|
89
|
+
i = end_idx # Jump iterator past the entire loop block
|
90
|
+
|
91
|
+
when :LoadDeclaration
|
92
|
+
# This helper now decides if ops go inline or get returned for hoisting
|
93
|
+
inline_ops, hoist_ops = handle_load_declaration(ins, env, reg_map, rename_map)
|
94
|
+
out_ops.concat(inline_ops)
|
95
|
+
hoisted_out_ops.concat(hoist_ops)
|
96
|
+
|
97
|
+
else
|
98
|
+
out_ops << rewrite(ins, reg_map, rename_map)
|
99
|
+
end
|
100
|
+
i += 1
|
101
|
+
end
|
102
|
+
|
103
|
+
[out_ops, hoisted_out_ops]
|
104
|
+
end
|
105
|
+
|
106
|
+
# --- NEW: Helper to manage LoadDeclaration logic ---
|
107
|
+
# Returns two arrays: [ instructions_to_add_inline, instructions_to_hoist ]
|
108
|
+
def handle_load_declaration(ins, env, reg_map, rename_map)
|
109
|
+
callee = ins.immediates.first.value.to_sym
|
110
|
+
decl_axes = ins.attributes.fetch(:axes)
|
111
|
+
site_axes = env.axes
|
112
|
+
|
113
|
+
body, yield_reg, callee_regs = inline_callee_core(callee)
|
114
|
+
remap = remap_axes(callee_regs, env)
|
115
|
+
_acc, fresh_ops = freshen(body, reg_map, pre_map: remap)
|
116
|
+
|
117
|
+
rename_yielded_register(ins, yield_reg, reg_map, remap, rename_map)
|
118
|
+
|
119
|
+
# Case 1: Hoisting
|
120
|
+
if prefix?(decl_axes, site_axes) && decl_axes.length < site_axes.length
|
121
|
+
[[], fresh_ops] # Return ops in the 'hoist' bucket
|
122
|
+
# Case 2: In-place
|
123
|
+
elsif decl_axes == site_axes
|
124
|
+
[fresh_ops, []] # Return ops in the 'inline' bucket
|
125
|
+
# Case 3: Cannot inline
|
126
|
+
else
|
127
|
+
[[rewrite(ins, reg_map, rename_map)], []]
|
128
|
+
end
|
129
|
+
end
|
130
|
+
|
131
|
+
# --- UNCHANGED AND ORIGINAL HELPERS ---
|
132
|
+
|
133
|
+
def find_matching_loop_end(ops, start_index)
|
134
|
+
depth = 1; (start_index + 1...ops.length).each do |i|
|
135
|
+
op = ops[i].opcode
|
136
|
+
depth += 1 if op == :LoopStart
|
137
|
+
depth -= 1 if op == :LoopEnd
|
138
|
+
return i if depth.zero?
|
139
|
+
end
|
140
|
+
raise "Unbalanced LoopStart at index #{start_index}"
|
141
|
+
end
|
142
|
+
|
143
|
+
def remap_axes(callee_axis_regs, env)
|
144
|
+
callee_axis_regs.each_with_object({}) do |r, h|
|
145
|
+
caller = env.reg_for_axis(r[:axis])
|
146
|
+
h[r[:el]] = caller[:el]
|
147
|
+
h[r[:idx]] = caller[:idx]
|
148
|
+
end
|
149
|
+
end
|
150
|
+
|
151
|
+
def rename_yielded_register(ins, yielded_reg, reg_map, axis_remap, rename)
|
152
|
+
return unless ins.result_register && yielded_reg
|
153
|
+
|
154
|
+
mapped = reg_map.fetch(yielded_reg, axis_remap.fetch(yielded_reg, yielded_reg))
|
155
|
+
rename[ins.result_register] = mapped
|
156
|
+
end
|
157
|
+
|
158
|
+
# (Your original `detect_all_gammas`, `detect_gamma`, `inline_callee_core`,
|
159
|
+
# `Env`, `freshen`, `rewrite`, and `prefix?` methods go here, unchanged)
|
160
|
+
class Env
|
161
|
+
def initialize = @frames = []
|
162
|
+
def axes = @frames.map { _1[:axis] }
|
163
|
+
|
164
|
+
def push(loop_ins)
|
165
|
+
@frames << { axis: loop_ins.attributes[:axis], el: loop_ins.attributes[:as_element], idx: loop_ins.attributes[:as_index] }
|
166
|
+
end
|
167
|
+
|
168
|
+
def pop = @frames.pop
|
169
|
+
def reg_for_axis(axis) = @frames.reverse.find { _1[:axis] == axis } || raise("no element for #{axis}")
|
170
|
+
end
|
171
|
+
|
172
|
+
def detect_all_gammas(ops_by_decl) = ops_by_decl.transform_values { |p| detect_gamma(Array(p[:operations])) }
|
173
|
+
GammaInfo = Struct.new(:start_idx, :axes, :axis_regs, keyword_init: true)
|
174
|
+
def detect_gamma(ops)
|
175
|
+
frames = []
|
176
|
+
ops.each do |ins|
|
177
|
+
case ins.opcode
|
178
|
+
when :LoopStart
|
179
|
+
frames << { axis: ins.attributes[:axis], el: ins.attributes[:as_element], idx: ins.attributes[:as_index] }
|
180
|
+
when :LoopEnd
|
181
|
+
frames.pop
|
182
|
+
when :Yield
|
183
|
+
axes = frames.map { _1[:axis] }
|
184
|
+
axis_regs = frames.map do |f|
|
185
|
+
{ axis: f[:axis], el: f[:el], idx: f[:idx] }
|
186
|
+
end
|
187
|
+
return GammaInfo.new(start_idx: nil, axes: axes, axis_regs: axis_regs)
|
188
|
+
end
|
189
|
+
end
|
190
|
+
GammaInfo.new(start_idx: nil, axes: [], axis_regs: [])
|
191
|
+
end
|
192
|
+
|
193
|
+
def inline_callee_core(callee_name)
|
194
|
+
ops = Array(@ops_by_decl.fetch(callee_name)[:operations])
|
195
|
+
info = @gamma.fetch(callee_name)
|
196
|
+
axes = info.axes
|
197
|
+
k = axes.length
|
198
|
+
yield_index = ops.rindex { |ins| ins.opcode == :Yield } or raise "callee #{callee_name} has no Yield"
|
199
|
+
yielded_reg = Array(ops[yield_index].inputs).first
|
200
|
+
first_loop_index = ops.index { |ins| ins.opcode == :LoopStart }
|
201
|
+
return [ops[0...yield_index], yielded_reg, info.axis_regs] unless first_loop_index
|
202
|
+
|
203
|
+
prologue = ops[0...first_loop_index]
|
204
|
+
main_part = ops[first_loop_index...yield_index]
|
205
|
+
inner_body = []
|
206
|
+
open_gamma = 0
|
207
|
+
kind_stack = []
|
208
|
+
main_part.each do |ins|
|
209
|
+
case ins.opcode
|
210
|
+
when :LoopStart
|
211
|
+
if open_gamma < k && ins.attributes[:axis] == axes[open_gamma]
|
212
|
+
kind_stack << :gamma
|
213
|
+
open_gamma += 1
|
214
|
+
else
|
215
|
+
kind_stack << :inner
|
216
|
+
inner_body << ins
|
217
|
+
end
|
218
|
+
when :LoopEnd
|
219
|
+
kind = kind_stack.pop or raise "unbalanced loops in #{callee_name}"
|
220
|
+
inner_body << ins if kind == :inner
|
221
|
+
else
|
222
|
+
inner_body << ins
|
223
|
+
end
|
224
|
+
end
|
225
|
+
[prologue + inner_body, yielded_reg, info.axis_regs]
|
226
|
+
end
|
227
|
+
|
228
|
+
def freshen(block_ops, reg_map, pre_map: {})
|
229
|
+
acc_map = {}
|
230
|
+
new_ops = block_ops.map do |ins|
|
231
|
+
res = ins.result_register
|
232
|
+
reg_map[res] ||= @ids.generate_temp if res
|
233
|
+
new_inputs = Array(ins.inputs).map do |r|
|
234
|
+
r1 = pre_map.fetch(r, r)
|
235
|
+
reg_map.fetch(r1, r1)
|
236
|
+
end
|
237
|
+
attrs = (ins.attributes || {}).dup
|
238
|
+
case ins.opcode
|
239
|
+
when :DeclareAccumulator
|
240
|
+
original_acc = ins.result_register
|
241
|
+
acc_map[original_acc] ||= @ids.generate_acc
|
242
|
+
res = acc_map[original_acc]
|
243
|
+
when :Accumulate
|
244
|
+
original_acc = ins.result_register
|
245
|
+
acc_map[original_acc] ||= @ids.generate_acc
|
246
|
+
res = acc_map[original_acc]
|
247
|
+
when :LoadAccumulator
|
248
|
+
original_acc = ins.inputs.first
|
249
|
+
acc_map[original_acc] ||= @ids.generate_acc
|
250
|
+
new_inputs[0] = acc_map[original_acc]
|
251
|
+
when :LoopStart
|
252
|
+
attrs[:id] = @ids.generate_loop_id
|
253
|
+
end
|
254
|
+
LIR::Instruction.new(opcode: ins.opcode, result_register: res ? reg_map.fetch(res, res) : nil, stamp: ins.stamp, inputs: new_inputs,
|
255
|
+
immediates: ins.immediates, attributes: attrs, location: ins.location)
|
256
|
+
end
|
257
|
+
[acc_map, new_ops]
|
258
|
+
end
|
259
|
+
|
260
|
+
def rewrite(ins, _reg_map, rename)
|
261
|
+
new_inputs = Array(ins.inputs).map do |r|
|
262
|
+
rename.fetch(r, r)
|
263
|
+
end
|
264
|
+
LIR::Instruction.new(opcode: ins.opcode, result_register: ins.result_register, stamp: ins.stamp, inputs: new_inputs,
|
265
|
+
immediates: ins.immediates, attributes: ins.attributes, location: ins.location)
|
266
|
+
end
|
267
|
+
|
268
|
+
def prefix?(pre, full) = pre.each_with_index.all? { |tok, i| full[i] == tok }
|
269
|
+
end
|
270
|
+
end
|
271
|
+
end
|
272
|
+
end
|
273
|
+
end
|
274
|
+
end
|
@@ -0,0 +1,198 @@
|
|
1
|
+
# frozen_string_literal: true
|
2
|
+
|
3
|
+
require "set"
|
4
|
+
|
5
|
+
module Kumi
|
6
|
+
module Core
|
7
|
+
module Analyzer
|
8
|
+
module Passes
|
9
|
+
module LIR
|
10
|
+
# InstructionSchedulingPass
|
11
|
+
# -------------------------
|
12
|
+
# This pass reorders instructions within a block to improve opportunities for
|
13
|
+
# other passes, particularly LoopFusionPass. It treats a block of LIR as a
|
14
|
+
# graph of atomic items (single instructions or entire loops), builds a
|
15
|
+
# dependency graph, and then re-emits the instructions in an optimal order
|
16
|
+
# determined by a topological sort.
|
17
|
+
class InstructionSchedulingPass < PassBase
|
18
|
+
def run(_errors)
|
19
|
+
scheduled_module = get_state(:lir_module).transform_values do |decl|
|
20
|
+
debug "\n--- Scheduling: Processing declaration: #{decl[:name]} ---"
|
21
|
+
{ operations: schedule_block(Array(decl[:operations])) }
|
22
|
+
end
|
23
|
+
|
24
|
+
state.with(:lir_module, scheduled_module)
|
25
|
+
end
|
26
|
+
|
27
|
+
private
|
28
|
+
|
29
|
+
def schedule_block(ops, depth = 0)
|
30
|
+
new_ops = []
|
31
|
+
i = 0
|
32
|
+
while i < ops.length
|
33
|
+
ins = ops[i]
|
34
|
+
if ins.opcode == :LoopStart
|
35
|
+
end_index = find_matching_loop_end(ops, i)
|
36
|
+
loop_body = ops[(i + 1)...end_index]
|
37
|
+
|
38
|
+
scheduler = Scheduler.new(self, loop_body, depth + 1)
|
39
|
+
scheduled_body = scheduler.schedule
|
40
|
+
|
41
|
+
new_ops << ins
|
42
|
+
new_ops.concat(scheduled_body)
|
43
|
+
new_ops << ops[end_index]
|
44
|
+
|
45
|
+
i = end_index + 1
|
46
|
+
else
|
47
|
+
new_ops << ins
|
48
|
+
i += 1
|
49
|
+
end
|
50
|
+
end
|
51
|
+
new_ops
|
52
|
+
end
|
53
|
+
|
54
|
+
def find_matching_loop_end(ops, start_index)
|
55
|
+
depth = 1
|
56
|
+
(start_index + 1...ops.length).each do |i|
|
57
|
+
return i if ops[i].opcode == :LoopEnd && (depth -= 1).zero?
|
58
|
+
|
59
|
+
depth += 1 if ops[i].opcode == :LoopStart
|
60
|
+
end
|
61
|
+
raise "Unbalanced LoopStart at index #{start_index}"
|
62
|
+
end
|
63
|
+
|
64
|
+
# --- Main Scheduler Logic ---
|
65
|
+
class Scheduler
|
66
|
+
Item = Struct.new(:id, :ops, :defs, :uses, keyword_init: true)
|
67
|
+
|
68
|
+
def initialize(pass, ops, depth)
|
69
|
+
@pass = pass
|
70
|
+
@ops = ops
|
71
|
+
@depth = depth
|
72
|
+
@prefix = " " * @depth
|
73
|
+
end
|
74
|
+
|
75
|
+
def schedule
|
76
|
+
debug "#{@prefix}> Starting instruction scheduling for block of #{@ops.size} instructions."
|
77
|
+
items = group_into_atomic_items(@ops)
|
78
|
+
return @ops if items.size <= 1
|
79
|
+
|
80
|
+
graph, in_degree = build_dependency_graph(items)
|
81
|
+
debug_graph(items, graph)
|
82
|
+
|
83
|
+
sorted_item_ids = topological_sort(graph, in_degree, items.map(&:id))
|
84
|
+
debug "#{@prefix} - Final schedule order: #{sorted_item_ids.join(' -> ')}"
|
85
|
+
|
86
|
+
items_by_id = items.to_h { |item| [item.id, item] }
|
87
|
+
sorted_item_ids.flat_map { |id| items_by_id[id].ops }
|
88
|
+
end
|
89
|
+
|
90
|
+
private
|
91
|
+
|
92
|
+
def group_into_atomic_items(ops)
|
93
|
+
items = []
|
94
|
+
i = 0
|
95
|
+
while i < ops.length
|
96
|
+
ins = ops[i]
|
97
|
+
if ins.opcode == :LoopStart
|
98
|
+
end_index = find_matching_loop_end(ops, i)
|
99
|
+
loop_ops = ops[i..end_index]
|
100
|
+
items << Item.new(id: "Loop(#{ins.attributes[:id]})", ops: loop_ops)
|
101
|
+
i = end_index
|
102
|
+
else
|
103
|
+
id_val = ins.result_register || "op_#{ins.object_id}"
|
104
|
+
items << Item.new(id: "Inst(#{id_val})", ops: [ins])
|
105
|
+
end
|
106
|
+
i += 1
|
107
|
+
end
|
108
|
+
items.each { |item| analyze_item_defs_and_uses(item) }
|
109
|
+
items
|
110
|
+
end
|
111
|
+
|
112
|
+
def find_matching_loop_end(ops, start_index)
|
113
|
+
depth = 1; (start_index + 1...ops.length).each do |i|
|
114
|
+
return i if ops[i].opcode == :LoopEnd && (depth -= 1).zero?
|
115
|
+
|
116
|
+
depth += 1 if ops[i].opcode == :LoopStart
|
117
|
+
end
|
118
|
+
raise "Unbalanced LoopStart at index #{start_index}"
|
119
|
+
end
|
120
|
+
|
121
|
+
def build_dependency_graph(items)
|
122
|
+
graph = Hash.new { |h, k| h[k] = [] }
|
123
|
+
in_degree = items.to_h { |item| [item.id, 0] }
|
124
|
+
|
125
|
+
items.each do |item_a|
|
126
|
+
items.each do |item_b|
|
127
|
+
next if item_a.id == item_b.id
|
128
|
+
|
129
|
+
if (item_a.defs & item_b.uses).any?
|
130
|
+
graph[item_a.id] << item_b.id
|
131
|
+
in_degree[item_b.id] += 1
|
132
|
+
end
|
133
|
+
end
|
134
|
+
end
|
135
|
+
[graph, in_degree]
|
136
|
+
end
|
137
|
+
|
138
|
+
def topological_sort(graph, in_degree, all_ids)
|
139
|
+
queue = all_ids.select { |id| in_degree[id].zero? }
|
140
|
+
sorted = []
|
141
|
+
while (id = queue.shift)
|
142
|
+
sorted << id
|
143
|
+
(graph[id] || []).each do |neighbor_id|
|
144
|
+
in_degree[neighbor_id] -= 1
|
145
|
+
queue << neighbor_id if in_degree[neighbor_id].zero?
|
146
|
+
end
|
147
|
+
end
|
148
|
+
raise "Cyclic dependency detected in LIR" if sorted.length != all_ids.length
|
149
|
+
|
150
|
+
sorted
|
151
|
+
end
|
152
|
+
|
153
|
+
# --- FIX: Rewritten analysis logic to correctly calculate dependencies ---
|
154
|
+
def analyze_item_defs_and_uses(item)
|
155
|
+
internal_defs = Set.new
|
156
|
+
all_uses = Set.new
|
157
|
+
|
158
|
+
item.ops.each do |op|
|
159
|
+
# Collect all registers defined within this item's scope.
|
160
|
+
internal_defs.add(op.result_register) if op.result_register
|
161
|
+
if op.opcode == :LoopStart
|
162
|
+
internal_defs.add(op.attributes[:as_element])
|
163
|
+
internal_defs.add(op.attributes[:as_index])
|
164
|
+
end
|
165
|
+
|
166
|
+
# Collect all registers used as inputs.
|
167
|
+
all_uses.merge(Array(op.inputs))
|
168
|
+
end
|
169
|
+
|
170
|
+
# The item's public definitions are all its internal definitions.
|
171
|
+
item.defs = internal_defs
|
172
|
+
|
173
|
+
# The item's external uses are all registers used that are NOT
|
174
|
+
# defined within the item itself. This is the key insight.
|
175
|
+
item.uses = all_uses - internal_defs
|
176
|
+
end
|
177
|
+
# --- END OF FIX ---
|
178
|
+
|
179
|
+
def debug(...)
|
180
|
+
@pass.debug(...)
|
181
|
+
end
|
182
|
+
|
183
|
+
def debug_graph(items, graph)
|
184
|
+
debug "#{@prefix} - Dependency Graph of #{items.size} items:"
|
185
|
+
items.each do |item|
|
186
|
+
uses = item.uses.to_a.sort.join(", ")
|
187
|
+
defs = item.defs.to_a.sort.join(", ")
|
188
|
+
deps = graph[item.id]&.join(", ") || ""
|
189
|
+
debug "#{@prefix} - #{item.id} (defs: {#{defs}}, uses: {#{uses}}) -> [#{deps}]"
|
190
|
+
end
|
191
|
+
end
|
192
|
+
end
|
193
|
+
end
|
194
|
+
end
|
195
|
+
end
|
196
|
+
end
|
197
|
+
end
|
198
|
+
end
|
@@ -0,0 +1,30 @@
|
|
1
|
+
# frozen_string_literal: true
|
2
|
+
|
3
|
+
module Kumi
|
4
|
+
module Core
|
5
|
+
module Analyzer
|
6
|
+
module Passes
|
7
|
+
module LIR
|
8
|
+
class KernelBindingPass < PassBase
|
9
|
+
# In: state[:lir_module], state[:registry]
|
10
|
+
# Out: state[:binding_manifest], state[:registry]
|
11
|
+
def run(_errors)
|
12
|
+
lir_decls = get_state(:lir_module)
|
13
|
+
registry = get_state(:registry)
|
14
|
+
|
15
|
+
# Generate binding manifest from the final LIR
|
16
|
+
manifest_ruby = Binder.bind(lir_decls, registry, target: :ruby)
|
17
|
+
manifest_js = Binder.bind(lir_decls, registry, target: :javascript)
|
18
|
+
manifest = {
|
19
|
+
ruby: manifest_ruby,
|
20
|
+
javascript: manifest_js
|
21
|
+
}
|
22
|
+
|
23
|
+
state.with(:binding_manifest, manifest)
|
24
|
+
end
|
25
|
+
end
|
26
|
+
end
|
27
|
+
end
|
28
|
+
end
|
29
|
+
end
|
30
|
+
end
|
@@ -0,0 +1,121 @@
|
|
1
|
+
# frozen_string_literal: true
|
2
|
+
|
3
|
+
module Kumi
|
4
|
+
module Core
|
5
|
+
module Analyzer
|
6
|
+
module Passes
|
7
|
+
module LIR
|
8
|
+
# LIRLocalCSEPass
|
9
|
+
# ---------------
|
10
|
+
# Tiny, safe, per-declaration CSE:
|
11
|
+
# - Deduplicates pure ops only (see PURE)
|
12
|
+
# - Renames later uses to the first result (within a declaration)
|
13
|
+
# - Ignores control/side-effect ops (loops, accums, yield)
|
14
|
+
#
|
15
|
+
# In : state[:lir_02_inlined_ops_by_decl]
|
16
|
+
# Out: state.with(:lir_03_cse, ...)
|
17
|
+
class LocalCSEPass < PassBase
|
18
|
+
LIR = Kumi::Core::LIR
|
19
|
+
|
20
|
+
def run(_errors)
|
21
|
+
ops_by_decl = get_state(:lir_module, required: true)
|
22
|
+
out = {}
|
23
|
+
|
24
|
+
ops_by_decl.each do |name, payload|
|
25
|
+
out[name] = { operations: optimize_decl(Array(payload[:operations])) }
|
26
|
+
end
|
27
|
+
|
28
|
+
out.freeze
|
29
|
+
state.with(:lir_module, out).with(:lir_03_cse, out)
|
30
|
+
end
|
31
|
+
|
32
|
+
private
|
33
|
+
|
34
|
+
def optimize_decl(ops)
|
35
|
+
rename = {} # reg_old -> reg_new
|
36
|
+
memo = {} # cse_key -> reg
|
37
|
+
out = []
|
38
|
+
|
39
|
+
ops.each do |ins|
|
40
|
+
ins = rewrite_inputs(ins, rename)
|
41
|
+
|
42
|
+
if ins.pure? && ins.result_register
|
43
|
+
key = cse_key(ins)
|
44
|
+
if (prev = memo[key])
|
45
|
+
rename[ins.result_register] = prev
|
46
|
+
next # drop duplicate op
|
47
|
+
else
|
48
|
+
memo[key] = ins.result_register
|
49
|
+
end
|
50
|
+
end
|
51
|
+
|
52
|
+
out << ins
|
53
|
+
end
|
54
|
+
|
55
|
+
out
|
56
|
+
end
|
57
|
+
|
58
|
+
def rewrite_inputs(ins, rename)
|
59
|
+
return ins if ins.inputs.nil? || ins.inputs.empty?
|
60
|
+
|
61
|
+
LIR::Instruction.new(
|
62
|
+
opcode: ins.opcode,
|
63
|
+
result_register: ins.result_register,
|
64
|
+
stamp: ins.stamp,
|
65
|
+
inputs: ins.inputs.map { |r| rename.fetch(r, r) },
|
66
|
+
immediates: ins.immediates,
|
67
|
+
attributes: ins.attributes,
|
68
|
+
location: ins.location
|
69
|
+
)
|
70
|
+
end
|
71
|
+
|
72
|
+
def cse_key(ins)
|
73
|
+
case ins.opcode
|
74
|
+
when :Constant
|
75
|
+
lit = ins.immediates&.first
|
76
|
+
[:Constant, lit&.value, lit&.dtype || ins.stamp&.dtype]
|
77
|
+
when :LoadInput
|
78
|
+
key = ins.immediates&.first&.value
|
79
|
+
[:LoadInput, key, ins.stamp&.dtype] # include dtype
|
80
|
+
when :LoadField
|
81
|
+
key = ins.immediates&.first&.value
|
82
|
+
[:LoadField, ins.inputs, key, ins.stamp&.dtype] # include dtype
|
83
|
+
when :LoadDeclaration
|
84
|
+
name = ins.immediates&.first&.value
|
85
|
+
[:LoadDeclaration, name, ins.attributes&.fetch(:axes, nil), ins.stamp&.dtype]
|
86
|
+
when :KernelCall
|
87
|
+
fn = ins.attributes&.fetch(:fn, nil)
|
88
|
+
[:KernelCall, fn, ins.inputs, ins.stamp&.dtype]
|
89
|
+
when :Select
|
90
|
+
[:Select, ins.inputs, ins.stamp&.dtype]
|
91
|
+
when :MakeTuple
|
92
|
+
[:MakeTuple, ins.inputs, ins.stamp&.dtype]
|
93
|
+
when :MakeObject
|
94
|
+
keys = (ins.immediates || []).map { |l| l.value }
|
95
|
+
[:MakeObject, keys, ins.inputs, ins.stamp&.dtype]
|
96
|
+
when :TupleGet
|
97
|
+
idx = ins.immediates&.first&.value
|
98
|
+
[:TupleGet, ins.inputs, idx, ins.stamp&.dtype]
|
99
|
+
when :Gather
|
100
|
+
[:Gather, ins.inputs]
|
101
|
+
when :Length
|
102
|
+
[:Length, ins.inputs]
|
103
|
+
else
|
104
|
+
# Fallback (shouldn't be hit due to PURE guard)
|
105
|
+
[ins.opcode, ins.inputs,
|
106
|
+
(ins.immediates || []).map { |l| [l.value, l.dtype] },
|
107
|
+
filtered_attrs(ins.attributes), ins.stamp&.dtype]
|
108
|
+
end
|
109
|
+
end
|
110
|
+
|
111
|
+
def filtered_attrs(attrs)
|
112
|
+
return nil unless attrs
|
113
|
+
|
114
|
+
attrs.reject { |k, _| k == :id } # drop volatile loop ids if ever present
|
115
|
+
end
|
116
|
+
end
|
117
|
+
end
|
118
|
+
end
|
119
|
+
end
|
120
|
+
end
|
121
|
+
end
|